{"id":"https://openalex.org/W7156993178","doi":"https://doi.org/10.48550/arxiv.2604.23927","title":"Towards Localizing Conversation Partners using Head Motion","display_name":"Towards Localizing Conversation Partners using Head Motion","publication_year":2026,"publication_date":"2026-04-27","ids":{"openalex":"https://openalex.org/W7156993178","doi":"https://doi.org/10.48550/arxiv.2604.23927"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.23927","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.23927","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.23927","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5075681305","display_name":"Payal Mohapatra","orcid":"https://orcid.org/0000-0002-3534-9136"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mohapatra, Payal","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071106886","display_name":"Calvin Murdock","orcid":"https://orcid.org/0000-0002-9560-4506"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Murdock, Calvin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058219648","display_name":"Ali Aroudi","orcid":"https://orcid.org/0000-0001-5770-0858"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Aroudi, Ali","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037474835","display_name":"Ishwarya Ananthabhotla","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ananthabhotla, Ishwarya","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042577114","display_name":"Anjali Menon","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Menon, Anjali","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040562171","display_name":"Buye Xu","orcid":"https://orcid.org/0000-0002-3027-7567"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Buye","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5134806765","display_name":"Morteza Khaleghimeybodi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Khaleghimeybodi, Morteza","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.33649998903274536,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.33649998903274536,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.2581000030040741,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10283","display_name":"Hearing Loss and Rehabilitation","score":0.11640000343322754,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/conversation","display_name":"Conversation","score":0.9186000227928162},{"id":"https://openalex.org/keywords/active-listening","display_name":"Active listening","score":0.636900007724762},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.4156999886035919},{"id":"https://openalex.org/keywords/wearable-computer","display_name":"Wearable computer","score":0.3944999873638153},{"id":"https://openalex.org/keywords/inertial-measurement-unit","display_name":"Inertial measurement unit","score":0.382099986076355},{"id":"https://openalex.org/keywords/crowdsourcing","display_name":"Crowdsourcing","score":0.37770000100135803},{"id":"https://openalex.org/keywords/a-priori-and-a-posteriori","display_name":"A priori and a posteriori","score":0.3553999960422516},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.32409998774528503}],"concepts":[{"id":"https://openalex.org/C2777200299","wikidata":"https://www.wikidata.org/wiki/Q52943","display_name":"Conversation","level":2,"score":0.9186000227928162},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7164999842643738},{"id":"https://openalex.org/C177291462","wikidata":"https://www.wikidata.org/wiki/Q423038","display_name":"Active listening","level":2,"score":0.636900007724762},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.420199990272522},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.4156999886035919},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.41499999165534973},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.4140999913215637},{"id":"https://openalex.org/C150594956","wikidata":"https://www.wikidata.org/wiki/Q1334829","display_name":"Wearable computer","level":2,"score":0.3944999873638153},{"id":"https://openalex.org/C79061980","wikidata":"https://www.wikidata.org/wiki/Q941680","display_name":"Inertial measurement unit","level":2,"score":0.382099986076355},{"id":"https://openalex.org/C62230096","wikidata":"https://www.wikidata.org/wiki/Q275969","display_name":"Crowdsourcing","level":2,"score":0.37770000100135803},{"id":"https://openalex.org/C75553542","wikidata":"https://www.wikidata.org/wiki/Q178161","display_name":"A priori and a posteriori","level":2,"score":0.3553999960422516},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.32409998774528503},{"id":"https://openalex.org/C2778707766","wikidata":"https://www.wikidata.org/wiki/Q202064","display_name":"Phone","level":2,"score":0.3151000142097473},{"id":"https://openalex.org/C54290928","wikidata":"https://www.wikidata.org/wiki/Q4845080","display_name":"Wearable technology","level":3,"score":0.2992999851703644},{"id":"https://openalex.org/C2779916870","wikidata":"https://www.wikidata.org/wiki/Q14467155","display_name":"Gaze","level":2,"score":0.2928999960422516},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.2906999886035919},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.2824000120162964},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.27630001306533813},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.27410000562667847},{"id":"https://openalex.org/C112313634","wikidata":"https://www.wikidata.org/wiki/Q7886648","display_name":"Complement (music)","level":5,"score":0.2637999951839447},{"id":"https://openalex.org/C16345878","wikidata":"https://www.wikidata.org/wiki/Q107472979","display_name":"Orientation (vector space)","level":2,"score":0.26170000433921814}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.23927","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.23927","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.23927","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.23927","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Many":[0],"individuals":[1],"struggle":[2],"to":[3,16,27,34,45,50,73,93,140,148],"understand":[4],"conversation":[5,31,149,162,184,241],"partners":[6,185],"in":[7,40,80,124,235],"noisy":[8,81,237],"settings,":[9],"particularly":[10],"amid":[11],"background":[12],"speakers":[13],"or":[14],"due":[15],"hearing":[17],"impairments.":[18],"Emerging":[19],"wearables":[20],"like":[21],"smartglasses":[22],"offer":[23],"a":[24,96,118,130,155,167,194,222],"transformative":[25],"opportunity":[26],"enhance":[28],"speech":[29,225],"from":[30],"partners.":[32,242],"Crucial":[33],"this":[35,176],"is":[36],"identifying":[37],"the":[38,42,52,65,104,159,181],"direction":[39,66],"which":[41,47,179],"user":[43],"wants":[44],"listen,":[46],"we":[48],"refer":[49],"as":[51,117],"user's":[53,97],"acoustic":[54,98,132],"zones":[55,99,123,144],"of":[56,67,100,106,145,158,161,183],"interest.":[57,101],"While":[58],"current":[59],"spatial":[60],"audio-based":[61],"methods":[62],"can":[63],"resolve":[64],"vocal":[68],"input,":[69],"they":[70],"are":[71,91],"agnostic":[72],"listening":[74],"preferences":[75],"and":[76,193,199,210,212],"have":[77],"limited":[78],"functionality":[79],"settings":[82,238],"with":[83,177,239],"interfering":[84],"speakers.":[85],"To":[86],"address":[87],"this,":[88],"behavioral":[89],"cues":[90],"needed":[92],"actively":[94],"infer":[95,142],"We":[102,127,174,203,219],"explore":[103],"effectiveness":[105],"head-orienting":[107],"behavior,":[108],"captured":[109],"by":[110],"Inertial":[111],"Measurement":[112],"Units":[113],"(IMUs)":[114],"on":[115],"smartglasses,":[116],"modality":[119],"for":[120,207],"localizing":[121],"these":[122],"seated":[125],"conversations.":[126],"introduce":[128],"HALo,":[129],"head-orientation-based":[131,230],"zone":[133],"localization":[134,231],"network":[135],"that":[136,229],"leverages":[137],"smartglasses'":[138],"IMUs":[139],"non-invasively":[141],"auditory":[143],"interest":[146],"corresponding":[147],"partner":[150],"locations.":[151],"By":[152],"integrating":[153],"an":[154],"priori":[156],"estimate":[157],"number":[160,182],"partners,":[163],"our":[164],"approach":[165],"yields":[166],"21%":[168],"performance":[169],"improvement":[170],"over":[171,197,216],"existing":[172],"methods.":[173],"complement":[175],"CoCo,":[178],"classifies":[180],"using":[186],"only":[187],"IMU":[188],"data,":[189],"achieving":[190],"0.74":[191],"accuracy":[192],"35%":[195],"gain":[196],"rule-based":[198],"generic":[200],"time-series":[201],"baselines.":[202],"discuss":[204],"practical":[205],"considerations":[206],"feature":[208],"extraction":[209],"inference":[211],"provide":[213],"qualitative":[214],"analyses":[215],"extended":[217],"sessions.":[218],"also":[220],"demonstrate":[221],"minimal":[223],"end-to-end":[224],"enhancement":[226],"system,":[227],"showing":[228],"offers":[232],"clear":[233],"advantages":[234],"extremely":[236],"multiple":[240]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-29T00:00:00"}
