{"id":"https://openalex.org/W4390481136","doi":"https://doi.org/10.1109/humanoids57100.2023.10375198","title":"An Audio-Video Sensor Fusion Framework To Augment Humanoid Capabilities For Identifying And Interacting With Human Conversational Partners","display_name":"An Audio-Video Sensor Fusion Framework To Augment Humanoid Capabilities For Identifying And Interacting With Human Conversational Partners","publication_year":2023,"publication_date":"2023-12-12","ids":{"openalex":"https://openalex.org/W4390481136","doi":"https://doi.org/10.1109/humanoids57100.2023.10375198"},"language":"en","primary_location":{"id":"doi:10.1109/humanoids57100.2023.10375198","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/humanoids57100.2023.10375198","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE-RAS 22nd International Conference on Humanoid Robots (Humanoids)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5092543513","display_name":"Pranav Barot","orcid":"https://orcid.org/0009-0001-5078-7660"},"institutions":[{"id":"https://openalex.org/I151746483","display_name":"University of Waterloo","ror":"https://ror.org/01aff2v68","country_code":"CA","type":"education","lineage":["https://openalex.org/I151746483"]}],"countries":["CA"],"is_corresponding":true,"raw_author_name":"Pranav Barot","raw_affiliation_strings":["University of Waterloo,Department of Systems Design Engineering,Canada","Department of Systems Design Engineering, University of Waterloo, Canada"],"affiliations":[{"raw_affiliation_string":"University of Waterloo,Department of Systems Design Engineering,Canada","institution_ids":["https://openalex.org/I151746483"]},{"raw_affiliation_string":"Department of Systems Design Engineering, University of Waterloo, Canada","institution_ids":["https://openalex.org/I151746483"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054678574","display_name":"Ewen MacDonald","orcid":"https://orcid.org/0000-0002-6973-2926"},"institutions":[{"id":"https://openalex.org/I151746483","display_name":"University of Waterloo","ror":"https://ror.org/01aff2v68","country_code":"CA","type":"education","lineage":["https://openalex.org/I151746483"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Ewen N. MacDonald","raw_affiliation_strings":["University of Waterloo,Department of Systems Design Engineering,Canada","Department of Systems Design Engineering, University of Waterloo, Canada"],"affiliations":[{"raw_affiliation_string":"University of Waterloo,Department of Systems Design Engineering,Canada","institution_ids":["https://openalex.org/I151746483"]},{"raw_affiliation_string":"Department of Systems Design Engineering, University of Waterloo, Canada","institution_ids":["https://openalex.org/I151746483"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5042406934","display_name":"Katja Mombaur","orcid":"https://orcid.org/0000-0003-1353-0943"},"institutions":[{"id":"https://openalex.org/I4210116723","display_name":"Robotics Research (United States)","ror":"https://ror.org/020w2fr77","country_code":"US","type":"company","lineage":["https://openalex.org/I4210116723"]},{"id":"https://openalex.org/I151746483","display_name":"University of Waterloo","ror":"https://ror.org/01aff2v68","country_code":"CA","type":"education","lineage":["https://openalex.org/I151746483"]},{"id":"https://openalex.org/I102335020","display_name":"Karlsruhe Institute of Technology","ror":"https://ror.org/04t3en479","country_code":"DE","type":"education","lineage":["https://openalex.org/I102335020","https://openalex.org/I1305996414"]}],"countries":["CA","DE","US"],"is_corresponding":false,"raw_author_name":"Katja Mombaur","raw_affiliation_strings":["Karlsruhe Institute of Technology (KIT), Institute of Anthropomatics and Robotics (IAR),Optimization and Biomechanics for Human-Centred Robotics, Karlsruhe, Germany and CERC Human-Centred Robotics and Machine Intelligence,Department of Systems Design Engineering, University of Waterloo,Waterloo,Canada","Department of Systems Design Engineering, University of Waterloo, Optimization and Biomechanics for Human-Centred Robotics, Karlsruhe, Germany and CERC Human-Centred Robotics and Machine Intelligence, Karlsruhe Institute of Technology (KIT), Institute of Anthropomatics and Robotics (IAR), Waterloo, Canada"],"affiliations":[{"raw_affiliation_string":"Karlsruhe Institute of Technology (KIT), Institute of Anthropomatics and Robotics (IAR),Optimization and Biomechanics for Human-Centred Robotics, Karlsruhe, Germany and CERC Human-Centred Robotics and Machine Intelligence,Department of Systems Design Engineering, University of Waterloo,Waterloo,Canada","institution_ids":["https://openalex.org/I4210116723"]},{"raw_affiliation_string":"Department of Systems Design Engineering, University of Waterloo, Optimization and Biomechanics for Human-Centred Robotics, Karlsruhe, Germany and CERC Human-Centred Robotics and Machine Intelligence, Karlsruhe Institute of Technology (KIT), Institute of Anthropomatics and Robotics (IAR), Waterloo, Canada","institution_ids":["https://openalex.org/I102335020","https://openalex.org/I151746483"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5092543513"],"corresponding_institution_ids":["https://openalex.org/I151746483"],"apc_list":null,"apc_paid":null,"fwci":0.2038,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.49170579,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9811000227928162,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9811000227928162,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9460999965667725,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9416000247001648,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/humanoid-robot","display_name":"Humanoid robot","score":0.8835763931274414},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7375834584236145},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.6822522878646851},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.5807895660400391},{"id":"https://openalex.org/keywords/sensor-fusion","display_name":"Sensor fusion","score":0.5347949862480164},{"id":"https://openalex.org/keywords/human\u2013robot-interaction","display_name":"Human\u2013robot interaction","score":0.5048549771308899},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.448851615190506},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3483829200267792}],"concepts":[{"id":"https://openalex.org/C60692881","wikidata":"https://www.wikidata.org/wiki/Q584529","display_name":"Humanoid robot","level":3,"score":0.8835763931274414},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7375834584236145},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.6822522878646851},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.5807895660400391},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.5347949862480164},{"id":"https://openalex.org/C145460709","wikidata":"https://www.wikidata.org/wiki/Q859951","display_name":"Human\u2013robot interaction","level":3,"score":0.5048549771308899},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.448851615190506},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3483829200267792}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/humanoids57100.2023.10375198","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/humanoids57100.2023.10375198","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE-RAS 22nd International Conference on Humanoid Robots (Humanoids)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","score":0.6399999856948853,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":15,"referenced_works":["https://openalex.org/W1558428197","https://openalex.org/W2011502221","https://openalex.org/W2044924490","https://openalex.org/W2077124340","https://openalex.org/W2104484061","https://openalex.org/W2161129698","https://openalex.org/W2188890360","https://openalex.org/W2542505220","https://openalex.org/W2737707020","https://openalex.org/W2802511003","https://openalex.org/W2999527441","https://openalex.org/W3107599441","https://openalex.org/W4385249303","https://openalex.org/W4390496134","https://openalex.org/W6687041400"],"related_works":["https://openalex.org/W1569471492","https://openalex.org/W2978665606","https://openalex.org/W4287179229","https://openalex.org/W4293926484","https://openalex.org/W3205513966","https://openalex.org/W3120459843","https://openalex.org/W4366547574","https://openalex.org/W3200191727","https://openalex.org/W189465620","https://openalex.org/W4366818884"],"abstract_inverted_index":{"Human":[0],"robot":[1],"interaction":[2],"often":[3],"requires":[4],"many":[5],"sub-systems":[6,47],"to":[7,12,52,57],"work":[8],"together":[9],"in":[10,39,61],"order":[11],"facilitate":[13],"more":[14,111],"natural":[15],"and":[16,30,67,110],"intelligent":[17],"interactions":[18],"with":[19],"multiple":[20],"humans.":[21],"For":[22],"this":[23],"work,":[24],"the":[25,87],"relevant":[26,83],"systems":[27],"include":[28],"audio":[29],"visual":[31],"direction":[32],"of":[33,78],"arrival":[34],"estimation":[35],"that":[36],"are":[37,48],"used":[38,49],"an":[40],"encompassing":[41],"sensor":[42],"fusion":[43],"framework.":[44],"The":[45],"presented":[46],"concurrently":[50],"online":[51],"allow":[53],"for":[54,106],"humanoid":[55,108],"robots":[56],"identify":[58,68],"active":[59],"speakers":[60],"a":[62,103],"scene,":[63],"track":[64],"human":[65],"subjects,":[66],"when":[69],"other":[70],"subjects":[71],"may":[72],"require":[73],"attention.":[74],"We":[75],"present":[76],"evaluations":[77],"performance,":[79],"while":[80],"also":[81],"implementing":[82],"humanlike":[84],"behaviours":[85],"on":[86,98],"REEM-C":[88],"Humanoid":[89],"Robot.":[90],"A":[91],"conducted":[92],"user":[93],"study":[94],"delivers":[95],"valuable":[96],"feedback":[97],"these":[99],"systems,":[100],"which":[101],"provide":[102],"strong":[104],"foundation":[105],"improved":[107],"intelligence":[109],"innovative":[112],"human-robot":[113],"interaction.":[114]},"counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2025-12-21T01:58:51.020947","created_date":"2025-10-10T00:00:00"}
