{"id":"https://openalex.org/W2792511626","doi":"https://doi.org/10.1145/3171221.3171280","title":"DNN-HMM based Automatic Speech Recognition for HRI Scenarios","display_name":"DNN-HMM based Automatic Speech Recognition for HRI Scenarios","publication_year":2018,"publication_date":"2018-02-26","ids":{"openalex":"https://openalex.org/W2792511626","doi":"https://doi.org/10.1145/3171221.3171280","mag":"2792511626"},"language":"en","primary_location":{"id":"doi:10.1145/3171221.3171280","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3171221.3171280","pdf_url":"http://dl.acm.org/ft_gateway.cfm?id=3171280&type=pdf","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2018 ACM/IEEE International Conference on Human-Robot Interaction","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"http://dl.acm.org/ft_gateway.cfm?id=3171280&type=pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103827948","display_name":"Jos\u00e9 N\u00f3voa","orcid":null},"institutions":[{"id":"https://openalex.org/I69737025","display_name":"University of Chile","ror":"https://ror.org/047gc3g35","country_code":"CL","type":"education","lineage":["https://openalex.org/I69737025"]}],"countries":["CL"],"is_corresponding":false,"raw_author_name":"Jos\u00e9 Novoa","raw_affiliation_strings":["University of Chile, Santiago, Chile"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Chile, Santiago, Chile","institution_ids":["https://openalex.org/I69737025"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055118748","display_name":"Jorge Wuth","orcid":null},"institutions":[{"id":"https://openalex.org/I69737025","display_name":"University of Chile","ror":"https://ror.org/047gc3g35","country_code":"CL","type":"education","lineage":["https://openalex.org/I69737025"]}],"countries":["CL"],"is_corresponding":false,"raw_author_name":"Jorge Wuth","raw_affiliation_strings":["University of Chile, Santiago, Chile"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Chile, Santiago, Chile","institution_ids":["https://openalex.org/I69737025"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103769815","display_name":"Juan Pablo Escudero","orcid":"https://orcid.org/0000-0002-7613-027X"},"institutions":[{"id":"https://openalex.org/I69737025","display_name":"University of Chile","ror":"https://ror.org/047gc3g35","country_code":"CL","type":"education","lineage":["https://openalex.org/I69737025"]}],"countries":["CL"],"is_corresponding":false,"raw_author_name":"Juan Pablo Escudero","raw_affiliation_strings":["University of Chile, Santiago, Chile"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Chile, Santiago, Chile","institution_ids":["https://openalex.org/I69737025"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013929728","display_name":"Josu\u00e9 Fredes","orcid":"https://orcid.org/0000-0002-9614-4193"},"institutions":[{"id":"https://openalex.org/I69737025","display_name":"University of Chile","ror":"https://ror.org/047gc3g35","country_code":"CL","type":"education","lineage":["https://openalex.org/I69737025"]}],"countries":["CL"],"is_corresponding":false,"raw_author_name":"Josu\u00e9 Fredes","raw_affiliation_strings":["University of Chile, Santiago, Chile"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Chile, Santiago, Chile","institution_ids":["https://openalex.org/I69737025"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007921391","display_name":"Rodrigo Mah\u00fa","orcid":"https://orcid.org/0000-0002-6374-8003"},"institutions":[{"id":"https://openalex.org/I69737025","display_name":"University of Chile","ror":"https://ror.org/047gc3g35","country_code":"CL","type":"education","lineage":["https://openalex.org/I69737025"]}],"countries":["CL"],"is_corresponding":false,"raw_author_name":"Rodrigo Mahu","raw_affiliation_strings":["University of Chile, Santiago, Chile"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Chile, Santiago, Chile","institution_ids":["https://openalex.org/I69737025"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5029824436","display_name":"N\u00e9stor Becerra Yoma","orcid":"https://orcid.org/0000-0002-3052-4687"},"institutions":[{"id":"https://openalex.org/I69737025","display_name":"University of Chile","ror":"https://ror.org/047gc3g35","country_code":"CL","type":"education","lineage":["https://openalex.org/I69737025"]}],"countries":["CL"],"is_corresponding":false,"raw_author_name":"N\u00e9stor Becerra Yoma","raw_affiliation_strings":["University of Chile, Santiago, Chile"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Chile, Santiago, Chile","institution_ids":["https://openalex.org/I69737025"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":4.5618,"has_fulltext":true,"cited_by_count":50,"citation_normalized_percentile":{"value":0.95631476,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":95,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"150","last_page":"159"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.996999979019165,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7770402431488037},{"id":"https://openalex.org/keywords/hidden-markov-model","display_name":"Hidden Markov model","score":0.7737293243408203},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.7348899841308594},{"id":"https://openalex.org/keywords/loudspeaker","display_name":"Loudspeaker","score":0.5353757739067078},{"id":"https://openalex.org/keywords/word-error-rate","display_name":"Word error rate","score":0.49285030364990234},{"id":"https://openalex.org/keywords/acoustic-model","display_name":"Acoustic model","score":0.48538243770599365},{"id":"https://openalex.org/keywords/testbed","display_name":"Testbed","score":0.45342516899108887},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.43040966987609863},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.4238881468772888},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4144817292690277},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.41351762413978577},{"id":"https://openalex.org/keywords/speech-processing","display_name":"Speech processing","score":0.33363020420074463},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.13029909133911133}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7770402431488037},{"id":"https://openalex.org/C23224414","wikidata":"https://www.wikidata.org/wiki/Q176769","display_name":"Hidden Markov model","level":2,"score":0.7737293243408203},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.7348899841308594},{"id":"https://openalex.org/C157138929","wikidata":"https://www.wikidata.org/wiki/Q570","display_name":"Loudspeaker","level":2,"score":0.5353757739067078},{"id":"https://openalex.org/C40969351","wikidata":"https://www.wikidata.org/wiki/Q3516228","display_name":"Word error rate","level":2,"score":0.49285030364990234},{"id":"https://openalex.org/C155635449","wikidata":"https://www.wikidata.org/wiki/Q4674699","display_name":"Acoustic model","level":3,"score":0.48538243770599365},{"id":"https://openalex.org/C31395832","wikidata":"https://www.wikidata.org/wiki/Q1318674","display_name":"Testbed","level":2,"score":0.45342516899108887},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.43040966987609863},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.4238881468772888},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4144817292690277},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.41351762413978577},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.33363020420074463},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.13029909133911133},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3171221.3171280","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3171221.3171280","pdf_url":"http://dl.acm.org/ft_gateway.cfm?id=3171280&type=pdf","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2018 ACM/IEEE International Conference on Human-Robot Interaction","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3171221.3171280","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3171221.3171280","pdf_url":"http://dl.acm.org/ft_gateway.cfm?id=3171280&type=pdf","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2018 ACM/IEEE International Conference on Human-Robot Interaction","raw_type":"proceedings-article"},"sustainable_development_goals":[{"score":0.7400000095367432,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[{"id":"https://openalex.org/G3868974132","display_name":null,"funder_award_id":"Doctorado Nacional/2014","funder_id":"https://openalex.org/F4320334812","funder_display_name":"Comisi\u00f3n Nacional de Investigaci\u00f3n Cient\u00edfica y Tecnol\u00f3gica"},{"id":"https://openalex.org/G7912527284","display_name":null,"funder_award_id":"62909-17-1-2002","funder_id":"https://openalex.org/F4320338298","funder_display_name":"Office of Naval Research Global"},{"id":"https://openalex.org/G8687987819","display_name":null,"funder_award_id":"PCHA/Doctorado Nacional/2014","funder_id":"https://openalex.org/F4320334812","funder_display_name":"Comisi\u00f3n Nacional de Investigaci\u00f3n Cient\u00edfica y Tecnol\u00f3gica"}],"funders":[{"id":"https://openalex.org/F4320334812","display_name":"Comisi\u00f3n Nacional de Investigaci\u00f3n Cient\u00edfica y Tecnol\u00f3gica","ror":"https://ror.org/02ap3w078"},{"id":"https://openalex.org/F4320338298","display_name":"Office of Naval Research Global","ror":"https://ror.org/00rk2pe57"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2792511626.pdf","grobid_xml":"https://content.openalex.org/works/W2792511626.grobid-xml"},"referenced_works_count":81,"referenced_works":["https://openalex.org/W187434241","https://openalex.org/W378169066","https://openalex.org/W565449262","https://openalex.org/W1491238342","https://openalex.org/W1494910745","https://openalex.org/W1502984613","https://openalex.org/W1517606245","https://openalex.org/W1524333225","https://openalex.org/W1541457182","https://openalex.org/W1563168000","https://openalex.org/W1569827162","https://openalex.org/W1590327792","https://openalex.org/W1602122992","https://openalex.org/W1888831092","https://openalex.org/W1909727437","https://openalex.org/W1968531668","https://openalex.org/W1979590659","https://openalex.org/W1994396704","https://openalex.org/W1995562189","https://openalex.org/W2007223396","https://openalex.org/W2034587361","https://openalex.org/W2038118634","https://openalex.org/W2056489736","https://openalex.org/W2063703533","https://openalex.org/W2064675550","https://openalex.org/W2072933891","https://openalex.org/W2077541282","https://openalex.org/W2078958793","https://openalex.org/W2096769774","https://openalex.org/W2099739380","https://openalex.org/W2108703536","https://openalex.org/W2112632589","https://openalex.org/W2129578073","https://openalex.org/W2131342762","https://openalex.org/W2136922672","https://openalex.org/W2138780138","https://openalex.org/W2143612262","https://openalex.org/W2156376728","https://openalex.org/W2158791054","https://openalex.org/W2160145433","https://openalex.org/W2160815625","https://openalex.org/W2291522532","https://openalex.org/W2342425527","https://openalex.org/W2342963907","https://openalex.org/W2343019076","https://openalex.org/W2343820197","https://openalex.org/W2343991816","https://openalex.org/W2398058106","https://openalex.org/W2403891327","https://openalex.org/W2412588858","https://openalex.org/W2475988411","https://openalex.org/W2512877744","https://openalex.org/W2515753980","https://openalex.org/W2515863432","https://openalex.org/W2517914016","https://openalex.org/W2519224033","https://openalex.org/W2526529994","https://openalex.org/W2556673367","https://openalex.org/W2561606595","https://openalex.org/W2565501058","https://openalex.org/W2589530322","https://openalex.org/W2591355762","https://openalex.org/W2591917595","https://openalex.org/W2593216051","https://openalex.org/W2597001495","https://openalex.org/W2604292070","https://openalex.org/W2622203030","https://openalex.org/W2745951259","https://openalex.org/W2781822585","https://openalex.org/W2915722758","https://openalex.org/W2963490782","https://openalex.org/W3023745411","https://openalex.org/W3147069478","https://openalex.org/W3148186152","https://openalex.org/W3215366012","https://openalex.org/W4205559380","https://openalex.org/W4234389704","https://openalex.org/W4248546571","https://openalex.org/W4250969944","https://openalex.org/W4365799809","https://openalex.org/W4376453519"],"related_works":["https://openalex.org/W3081187864","https://openalex.org/W151018310","https://openalex.org/W3080136773","https://openalex.org/W4380605396","https://openalex.org/W2584084702","https://openalex.org/W3133352777","https://openalex.org/W2008737763","https://openalex.org/W3012383599","https://openalex.org/W4385611764","https://openalex.org/W172230311"],"abstract_inverted_index":{"In":[0,146],"this":[1,39,147],"paper,":[2],"we":[3],"propose":[4],"to":[5],"replace":[6],"the":[7,21,24,31,43,65,93,130,143,151,177],"classical":[8],"black":[9],"box":[10],"integration":[11],"of":[12,23,113,129,190],"automatic":[13,57,153],"speech":[14,58,103,154,173],"recognition":[15,59,104,155,174],"technology":[16],"in":[17,91],"HRI":[18,25,75,99,149],"applications":[19],"with":[20,64,78,176,186],"incorporation":[22],"environment":[26,44],"representation":[27,45],"and":[28,30,33,36,46,68,119,137,140,167,181],"modeling,":[29],"robot":[32],"user":[34],"states":[35],"contexts.":[37],"Accordingly,":[38],"paper":[40],"focuses":[41],"on":[42,127],"modeling":[47],"by":[48,109],"training":[49,89,191],"a":[50,79,88,117,123,158,187],"deep":[51],"neural":[52],"network-hidden":[53],"Markov":[54],"model":[55],"based":[56],"engine":[60,156],"combining":[61],"clean":[62],"utterances":[63],"acoustic-channel":[66],"responses":[67],"noise":[69],"that":[70,162],"were":[71,107],"obtained":[72],"from":[73,142],"an":[74,98],"testbed":[76],"built":[77],"PR2":[80,131],"mobile":[81],"manipulation":[82],"robot.":[83],"This":[84],"method":[85],"avoids":[86],"recording":[87,110],"database":[90],"all":[92],"possible":[94],"acoustic":[95],"environments":[96],"given":[97],"scenario.":[100],"Moreover,":[101],"different":[102],"testing":[105,183],"conditions":[106],"produced":[108],"two":[111],"types":[112],"acoustics":[114],"sources,":[115],"i.e.":[116],"loudspeaker":[118],"human":[120,182],"speakers,":[121],"using":[122],"Microsoft":[124],"Kinect":[125],"mounted":[126],"top":[128],"robot,":[132],"while":[133],"performing":[134],"head":[135],"rotations":[136],"movements":[138],"towards":[139],"away":[141],"fixed":[144],"sources.":[145],"generic":[148],"scenario,":[150],"resulting":[152],"provided":[157],"word":[159],"error":[160],"rate":[161],"is":[163],"at":[164],"least":[165],"26%":[166],"38%":[168],"lower":[169],"than":[170],"publicly":[171],"available":[172],"APIs":[175],"playback":[178],"(i.e.":[179],"loudspeaker)":[180],"databases,":[184],"respectively,":[185],"limited":[188],"amount":[189],"data.":[192]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":13},{"year":2021,"cited_by_count":9},{"year":2020,"cited_by_count":9},{"year":2019,"cited_by_count":4},{"year":2018,"cited_by_count":5}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
