{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,13]],"date-time":"2024-09-13T04:36:50Z","timestamp":1726202210103},"publisher-location":"Cham","reference-count":36,"publisher":"Springer Nature Switzerland","isbn-type":[{"type":"print","value":"9783031357077"},{"type":"electronic","value":"9783031357084"}],"license":[{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2023]]},"DOI":"10.1007\/978-3-031-35708-4_26","type":"book-chapter","created":{"date-parts":[[2023,7,8]],"date-time":"2023-07-08T19:04:57Z","timestamp":1688843097000},"page":"355-365","update-policy":"http:\/\/dx.doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":4,"title":["A Comparative Analysis of Real Time Open-Source Speech Recognition Tools for Social Robots"],"prefix":"10.1007","author":[{"ORCID":"http:\/\/orcid.org\/0000-0001-6426-7124","authenticated-orcid":false,"given":"Akshara","family":"Pande","sequence":"first","affiliation":[]},{"ORCID":"http:\/\/orcid.org\/0000-0001-9513-2046","authenticated-orcid":false,"given":"Bhanu","family":"Shrestha","sequence":"additional","affiliation":[]},{"ORCID":"http:\/\/orcid.org\/0000-0003-4500-290X","authenticated-orcid":false,"given":"Anshul","family":"Rani","sequence":"additional","affiliation":[]},{"ORCID":"http:\/\/orcid.org\/0000-0001-5144-3811","authenticated-orcid":false,"given":"Deepti","family":"Mishra","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2023,7,9]]},"reference":[{"key":"26_CR1","doi-asserted-by":"publisher","first-page":"564","DOI":"10.1016\/j.procs.2017.10.064","volume":"116","author":"W Budiharto","year":"2017","unstructured":"Budiharto, W., et al.: EduRobot: intelligent humanoid robot with natural interaction for education and entertainment. Procedia Comput. Sci. 116, 564\u2013570 (2017)","journal-title":"Procedia Comput. Sci."},{"key":"26_CR2","unstructured":"Childers, M., et al.: US army research laboratory (ARL) robotics collaborative technology alliance 2014 capstone experiment. US Army Research Laboratory Aberdeen Proving Ground United States (2016)"},{"issue":"1","key":"26_CR3","doi-asserted-by":"publisher","first-page":"234","DOI":"10.1109\/TCSS.2019.2922593","volume":"7","author":"BA Erol","year":"2019","unstructured":"Erol, B.A., et al.: Toward artificial emotional intelligence for cooperative social human\u2013machine interaction. IEEE Trans. Comput. Soc. Syst. 7(1), 234\u2013246 (2019)","journal-title":"IEEE Trans. Comput. Soc. Syst."},{"key":"26_CR4","doi-asserted-by":"crossref","unstructured":"Ahn, H.S., Lee, M.H., MacDonald, B.A.: Healthcare robot systems for a hospital environment: CareBot and ReceptionBot. In: 24th IEEE International Symposium on Robot and Human Interactive Communication (RO-MAN), Kobe, Japan, pp. 571\u2013576 (2015)","DOI":"10.1109\/ROMAN.2015.7333621"},{"key":"26_CR5","series-title":"Advances in Intelligent Systems and Computing","doi-asserted-by":"publisher","first-page":"595","DOI":"10.1007\/978-3-319-74690-6_58","volume-title":"The International Conference on Advanced Machine Learning Technologies and Applications (AMLTA2018)","author":"IA Hameed","year":"2018","unstructured":"Hameed, I.A., Strazdins, G., Hatlemark, H.A.M., Jakobsen, I.S., Damdam, J.O.: Robots that can mix serious with fun. In: Hassanien, A.E., Tolba, M.F., Elhoseny, M., Mostafa, M. (eds.) AMLTA 2018. AISC, vol. 723, pp. 595\u2013604. Springer, Cham (2018). https:\/\/doi.org\/10.1007\/978-3-319-74690-6_58"},{"key":"26_CR6","doi-asserted-by":"publisher","first-page":"19143","DOI":"10.1109\/ACCESS.2019.2896880","volume":"7","author":"AB Nassif","year":"2019","unstructured":"Nassif, A.B., et al.: Speech recognition using deep neural networks: a systematic review. IEEE Access 7, 19143\u201319165 (2019)","journal-title":"IEEE Access"},{"key":"26_CR7","doi-asserted-by":"crossref","unstructured":"Rahat, S.A., Imteaj, A., Rahman, T.: An IoT based interactive speech recognizable robot with distance control using Raspberry Pi. In: 2018 International Conference on Innovations in Science, Engineering and Technology (ICISET). IEEE (2018)","DOI":"10.1109\/ICISET.2018.8745656"},{"key":"26_CR8","doi-asserted-by":"crossref","unstructured":"Vacher, M., et al.: Complete sound and speech recognition system for health smart homes: application to the recognition of activities of daily living. In: Domenico, C. (ed.) New Developments in Biomedical Engineering, pp. 645\u2013673. In-Tech (2010)","DOI":"10.5772\/7596"},{"key":"26_CR9","doi-asserted-by":"publisher","first-page":"958624","DOI":"10.3389\/frobt.2022.958624","volume":"9","author":"R van den Berghe","year":"2022","unstructured":"van den Berghe, R.: Social robots in a translanguaging pedagogy: a review to identify opportunities for robot-assisted (language) learning. Front. Robot. AI 9, 958624 (2022)","journal-title":"Front. Robot. AI"},{"issue":"1","key":"26_CR10","first-page":"1","volume":"9","author":"N Randall","year":"2019","unstructured":"Randall, N.: A survey of robot-assisted language learning (RALL). ACM Trans. Hum.-Robot Interact. (THRI) 9(1), 1\u201336 (2019)","journal-title":"ACM Trans. Hum.-Robot Interact. (THRI)"},{"key":"26_CR11","doi-asserted-by":"crossref","unstructured":"Taniguchi, T., et al.: Language and robotics. Frontiers Media SA, p. 674832 (2021)","DOI":"10.3389\/frobt.2021.674832"},{"key":"26_CR12","unstructured":"Forsberg, M.: Why is speech recognition difficult. Chalmers University of Technology (2003)"},{"key":"26_CR13","doi-asserted-by":"crossref","unstructured":"Mubin, O., Henderson, J., Bartneck, C.: You just do not understand me! Speech recognition in human robot interaction. In: The 23rd IEEE International Symposium on Robot and Human Interactive Communication. IEEE (2014)","DOI":"10.1109\/ROMAN.2014.6926324"},{"issue":"9","key":"26_CR14","doi-asserted-by":"publisher","first-page":"63","DOI":"10.1145\/348941.348990","volume":"43","author":"B Shneiderman","year":"2000","unstructured":"Shneiderman, B.: The limits of speech recognition. Commun. ACM 43(9), 63\u201365 (2000)","journal-title":"Commun. ACM"},{"key":"26_CR15","unstructured":"McCowan, I.A., et al.: On the use of information retrieval measures for speech recognition evaluation. IDIAP (2004)"},{"key":"26_CR16","doi-asserted-by":"crossref","unstructured":"Kennedy, J., et al.: Child speech recognition in human-robot interaction: evaluations and recommendations. In: 2017 12th ACM\/IEEE International Conference on Human-Robot Interaction (HRI) (2017)","DOI":"10.1145\/2909824.3020229"},{"key":"26_CR17","doi-asserted-by":"crossref","unstructured":"Attawibulkul, S., Kaewkamnerdpong, B., Miyanaga, Y.: Noisy speech training in MFCC-based speech recognition with noise suppression toward robot assisted autism therapy. In: 2017 10th Biomedical Engineering International Conference (BMEiCON). IEEE (2017)","DOI":"10.1109\/BMEiCON.2017.8229135"},{"issue":"2","key":"26_CR18","doi-asserted-by":"publisher","first-page":"607","DOI":"10.1109\/TII.2016.2625818","volume":"13","author":"K Zinchenko","year":"2017","unstructured":"Zinchenko, K., Wu, C.Y., Song, K.T.: A study on speech recognition control for a surgical robot. IEEE Trans. Ind. Inf. 13(2), 607\u2013615 (2017)","journal-title":"IEEE Trans. Ind. Inf."},{"issue":"3","key":"26_CR19","doi-asserted-by":"publisher","first-page":"759","DOI":"10.1109\/TRO.2008.919305","volume":"24","author":"CT Ishi","year":"2008","unstructured":"Ishi, C.T., et al.: A robust speech recognition system for communication robots in noisy environments. IEEE Trans. Robot. 24(3), 759\u2013763 (2008)","journal-title":"IEEE Trans. Robot."},{"key":"26_CR20","doi-asserted-by":"publisher","first-page":"1185","DOI":"10.1007\/s10803-009-0737-0","volume":"39","author":"N Russo","year":"2009","unstructured":"Russo, N., et al.: Effects of background noise on cortical encoding of speech in autism spectrum disorders. J. Autism Dev. Disord. 39, 1185\u20131196 (2009)","journal-title":"J. Autism Dev. Disord."},{"issue":"6","key":"26_CR21","doi-asserted-by":"publisher","first-page":"14","DOI":"10.1109\/MITP.2010.147","volume":"12","author":"KW Miller","year":"2010","unstructured":"Miller, K.W., Voas, J., Costello, T.: Free and open source software. IT Prof. 12(6), 14\u201316 (2010)","journal-title":"IT Prof."},{"key":"26_CR22","doi-asserted-by":"crossref","unstructured":"Weber, S., Luo, J.: What makes an open source code popular on Git hub?. In: 2014 IEEE International Conference on Data Mining Workshop (2014)","DOI":"10.1109\/ICDMW.2014.55"},{"key":"26_CR23","unstructured":"Speech Recognition homepage. https:\/\/pypi.org\/project\/SpeechRecognition\/. Accessed 11 Jan 2023"},{"key":"26_CR24","unstructured":"DeepSpeech homepage. https:\/\/deepspeech.readthedocs.io\/en\/r0.9\/. Accessed 11 Jan 2023"},{"key":"26_CR25","unstructured":"Vosk homepage. https:\/\/pypi.org\/project\/vosk\/. Accessed 11 Jan 2023"},{"key":"26_CR26","doi-asserted-by":"crossref","unstructured":"Cavazza, M.: An empirical study of speech recognition errors in a task-oriented dialogue system. In: Proceedings of the Second SIGdial Workshop on Discourse and Dialogue (2001)","DOI":"10.3115\/1118078.1118084"},{"key":"26_CR27","doi-asserted-by":"crossref","unstructured":"Saon, G., Ramabhadran, B., Zweig, G.: On the effect of word error rate on automated quality monitoring. In: 2006 IEEE Spoken Language Technology Workshop. IEEE (2006)","DOI":"10.1109\/SLT.2006.326828"},{"key":"26_CR28","series-title":"IFIP Advances in Information and Communication Technology","doi-asserted-by":"publisher","first-page":"73","DOI":"10.1007\/978-3-030-49161-1_7","volume-title":"Artificial Intelligence Applications and Innovations","author":"F Filippidou","year":"2020","unstructured":"Filippidou, F., Moussiades, L.: \u0391 benchmarking of IBM, google and wit automatic speech recognition systems. In: Maglogiannis, I., Iliadis, L., Pimenidis, E. (eds.) AIAI 2020. IAICT, vol. 583, pp. 73\u201382. Springer, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-49161-1_7"},{"key":"26_CR29","unstructured":"Match Error Rate homepage. https:\/\/torchmetrics.readthedocs.io\/en\/stable\/text\/match_error_rate.html. Accessed 11 Jan 2023"},{"key":"26_CR30","unstructured":"WORD INFO. LOST homepage. https:\/\/torchmetrics.readthedocs.io\/en\/stable\/text\/word_info_lost.html. Accessed 11 Jan 2023"},{"key":"26_CR31","unstructured":"CHAR ERROR RATE homepage. https:\/\/torchmetrics.readthedocs.io\/en\/stable\/text\/char_error_rate.html#:~:text=character%20error%20rate%20is%20a. Accessed 11 Jan 2023"},{"key":"26_CR32","unstructured":"https:\/\/en.wikipedia.org\/wiki\/Speech_recognition"},{"issue":"03","key":"26_CR33","first-page":"20","volume":"7","author":"V K\u00ebpuska","year":"2017","unstructured":"K\u00ebpuska, V., Bohouta, G.: Comparing speech recognition systems (Microsoft API, Google API and CMU Sphinx). Int. J. Eng. Res. Appl. 7(03), 20\u201324 (2017)","journal-title":"Int. J. Eng. Res. Appl."},{"key":"26_CR34","doi-asserted-by":"crossref","unstructured":"Morris, A.C., Maier, V., Green, P.: From WER and RIL to MER and WIL: improved evaluation measures for connected speech recognition. In: Eighth International Conference on Spoken Language Processing (2004)","DOI":"10.21437\/Interspeech.2004-668"},{"key":"26_CR35","series-title":"Lecture Notes in Computer Science (Lecture Notes in Artificial Intelligence)","doi-asserted-by":"publisher","first-page":"315","DOI":"10.1007\/978-3-642-41491-6_29","volume-title":"Chinese Computational Linguistics and Natural Language Processing Based on Naturally Annotated Big Data","author":"P Wang","year":"2013","unstructured":"Wang, P., Sun, R., Zhao, H., Yu, K.: A new word language model evaluation metric for character based languages. In: Sun, M., Zhang, M., Lin, D., Wang, H. (eds.) CCL\/NLP-NABD -2013. LNCS (LNAI), vol. 8202, pp. 315\u2013324. Springer, Heidelberg (2013). https:\/\/doi.org\/10.1007\/978-3-642-41491-6_29"},{"key":"26_CR36","doi-asserted-by":"publisher","first-page":"3515","DOI":"10.1109\/TASLP.2021.3126949","volume":"29","author":"L Sar\u0131","year":"2021","unstructured":"Sar\u0131, L., Hasegawa-Johnson, M., Yoo, C.D.: Counterfactually fair automatic speech recognition. IEEE\/ACM Trans. Audio Speech Lang. Process. 29, 3515\u20133525 (2021)","journal-title":"IEEE\/ACM Trans. Audio Speech Lang. Process."}],"container-title":["Lecture Notes in Computer Science","Design, User Experience, and Usability"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-35708-4_26","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,7,8]],"date-time":"2023-07-08T19:16:26Z","timestamp":1688843786000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-35708-4_26"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023]]},"ISBN":["9783031357077","9783031357084"],"references-count":36,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-35708-4_26","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2023]]},"assertion":[{"value":"9 July 2023","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"HCII","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Human-Computer Interaction","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Copenhagen","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Denmark","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2023","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"23 July 2023","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"28 July 2023","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"25","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"hcii2023","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/2023.hci.international\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Single-blind","order":1,"name":"type","label":"Type","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"CMS","order":2,"name":"conference_management_system","label":"Conference Management System","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"7472","order":3,"name":"number_of_submissions_sent_for_review","label":"Number of Submissions Sent for Review","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"1578","order":4,"name":"number_of_full_papers_accepted","label":"Number of Full Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"396","order":5,"name":"number_of_short_papers_accepted","label":"Number of Short Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"21% - The value is computed by the equation \"Number of Full Papers Accepted \/ Number of Submissions Sent for Review * 100\" and then rounded to a whole number.","order":6,"name":"acceptance_rate_of_full_papers","label":"Acceptance Rate of Full Papers","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"2","order":7,"name":"average_number_of_reviews_per_paper","label":"Average Number of Reviews per Paper","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"2","order":8,"name":"average_number_of_papers_per_reviewer","label":"Average Number of Papers per Reviewer","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"No","order":9,"name":"external_reviewers_involved","label":"External Reviewers Involved","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}}]}}