{"id":"https://openalex.org/W4390096820","doi":"https://doi.org/10.1109/taslp.2023.3346297","title":"Binaural Sound Source Distance Estimation and Localization for a Moving Listener","display_name":"Binaural Sound Source Distance Estimation and Localization for a Moving Listener","publication_year":2023,"publication_date":"2023-12-22","ids":{"openalex":"https://openalex.org/W4390096820","doi":"https://doi.org/10.1109/taslp.2023.3346297"},"language":"en","primary_location":{"id":"doi:10.1109/taslp.2023.3346297","is_oa":true,"landing_page_url":"https://doi.org/10.1109/taslp.2023.3346297","pdf_url":"https://ieeexplore.ieee.org/ielx7/6570655/6633080/10372100.pdf","source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://ieeexplore.ieee.org/ielx7/6570655/6633080/10372100.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5025199613","display_name":"Daniel Krause","orcid":"https://orcid.org/0000-0003-2704-636X"},"institutions":[{"id":"https://openalex.org/I166825849","display_name":"Tampere 
University","ror":"https://ror.org/033003e23","country_code":"FI","type":"education","lineage":["https://openalex.org/I166825849"]}],"countries":["FI"],"is_corresponding":false,"raw_author_name":"Daniel Aleksander Krause","raw_affiliation_strings":["Computing Sciences, Tampere University, Tampere, Finland"],"raw_orcid":"https://orcid.org/0000-0003-2704-636X","affiliations":[{"raw_affiliation_string":"Computing Sciences, Tampere University, Tampere, Finland","institution_ids":["https://openalex.org/I166825849"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103280229","display_name":"Guillermo Garc\u00eda-Barrios","orcid":"https://orcid.org/0000-0001-7925-0915"},"institutions":[{"id":"https://openalex.org/I88060688","display_name":"Universidad Polit\u00e9cnica de Madrid","ror":"https://ror.org/03n6nwv02","country_code":"ES","type":"education","lineage":["https://openalex.org/I88060688"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Guillermo Garc\u00eda-Barrios","raw_affiliation_strings":["Group on Acoustics and MultiMedia Applications, Universidad Polit&#x00E9;cnica de Madrid, Madrid, Spain"],"raw_orcid":"https://orcid.org/0000-0001-7925-0915","affiliations":[{"raw_affiliation_string":"Group on Acoustics and MultiMedia Applications, Universidad Polit&#x00E9;cnica de Madrid, Madrid, Spain","institution_ids":["https://openalex.org/I88060688"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010846139","display_name":"Archontis Politis","orcid":"https://orcid.org/0000-0002-0595-2356"},"institutions":[{"id":"https://openalex.org/I166825849","display_name":"Tampere University","ror":"https://ror.org/033003e23","country_code":"FI","type":"education","lineage":["https://openalex.org/I166825849"]}],"countries":["FI"],"is_corresponding":false,"raw_author_name":"Archontis Politis","raw_affiliation_strings":["Computing Sciences, Tampere University, Tampere, 
Finland"],"raw_orcid":"https://orcid.org/0000-0002-0595-2356","affiliations":[{"raw_affiliation_string":"Computing Sciences, Tampere University, Tampere, Finland","institution_ids":["https://openalex.org/I166825849"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5079981416","display_name":"Annamaria Mesaros","orcid":"https://orcid.org/0000-0002-6640-9752"},"institutions":[{"id":"https://openalex.org/I166825849","display_name":"Tampere University","ror":"https://ror.org/033003e23","country_code":"FI","type":"education","lineage":["https://openalex.org/I166825849"]}],"countries":["FI"],"is_corresponding":false,"raw_author_name":"Annamaria Mesaros","raw_affiliation_strings":["Computing Sciences, Tampere University, Tampere, Finland"],"raw_orcid":"https://orcid.org/0000-0002-6640-9752","affiliations":[{"raw_affiliation_string":"Computing Sciences, Tampere University, Tampere, Finland","institution_ids":["https://openalex.org/I166825849"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":{"value":800,"currency":"EUR","value_usd":862},"fwci":4.2495,"has_fulltext":true,"cited_by_count":23,"citation_normalized_percentile":{"value":0.95530519,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":"32","issue":null,"first_page":"996","last_page":"1011"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio 
Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9969000220298767,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11233","display_name":"Advanced Adaptive Filtering Techniques","score":0.9958000183105469,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/binaural-recording","display_name":"Binaural recording","score":0.8614394664764404},{"id":"https://openalex.org/keywords/sound","display_name":"Sound (geography)","score":0.6858760714530945},{"id":"https://openalex.org/keywords/sound-localization","display_name":"Sound localization","score":0.6722195148468018},{"id":"https://openalex.org/keywords/critical-distance","display_name":"Critical distance","score":0.6069751977920532},{"id":"https://openalex.org/keywords/acoustics","display_name":"Acoustics","score":0.5535969734191895},{"id":"https://openalex.org/keywords/acoustic-source-localization","display_name":"Acoustic source localization","score":0.5114794969558716},{"id":"https://openalex.org/keywords/estimation","display_name":"Estimation","score":0.451569527387619},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer 
science","score":0.43337857723236084},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.3126392364501953},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.14608237147331238},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.13777101039886475},{"id":"https://openalex.org/keywords/sound-power","display_name":"Sound power","score":0.07856583595275879}],"concepts":[{"id":"https://openalex.org/C201247586","wikidata":"https://www.wikidata.org/wiki/Q5612967","display_name":"Binaural recording","level":2,"score":0.8614394664764404},{"id":"https://openalex.org/C203718221","wikidata":"https://www.wikidata.org/wiki/Q491713","display_name":"Sound (geography)","level":2,"score":0.6858760714530945},{"id":"https://openalex.org/C68236139","wikidata":"https://www.wikidata.org/wiki/Q765652","display_name":"Sound localization","level":2,"score":0.6722195148468018},{"id":"https://openalex.org/C24723263","wikidata":"https://www.wikidata.org/wiki/Q1571884","display_name":"Critical distance","level":4,"score":0.6069751977920532},{"id":"https://openalex.org/C24890656","wikidata":"https://www.wikidata.org/wiki/Q82811","display_name":"Acoustics","level":1,"score":0.5535969734191895},{"id":"https://openalex.org/C93240960","wikidata":"https://www.wikidata.org/wiki/Q217270","display_name":"Acoustic source localization","level":3,"score":0.5114794969558716},{"id":"https://openalex.org/C96250715","wikidata":"https://www.wikidata.org/wiki/Q965330","display_name":"Estimation","level":2,"score":0.451569527387619},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.43337857723236084},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech 
recognition","level":1,"score":0.3126392364501953},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.14608237147331238},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.13777101039886475},{"id":"https://openalex.org/C67514181","wikidata":"https://www.wikidata.org/wiki/Q1588477","display_name":"Sound power","level":3,"score":0.07856583595275879},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/taslp.2023.3346297","is_oa":true,"landing_page_url":"https://doi.org/10.1109/taslp.2023.3346297","pdf_url":"https://ieeexplore.ieee.org/ielx7/6570655/6633080/10372100.pdf","source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},{"id":"pmh:oai:trepo.tuni.fi:10024/207873","is_oa":true,"landing_page_url":"https://trepo.tuni.fi/handle/10024/207873","pdf_url":null,"source":{"id":"https://openalex.org/S7407055260","display_name":"Trepo - Institutional Repository of Tampere 
University","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/taslp.2023.3346297","is_oa":true,"landing_page_url":"https://doi.org/10.1109/taslp.2023.3346297","pdf_url":"https://ieeexplore.ieee.org/ielx7/6570655/6633080/10372100.pdf","source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2360061192","display_name":"Teaching machines to listen","funder_award_id":"332063","funder_id":"https://openalex.org/F4320321108","funder_display_name":"Academy of Finland"},{"id":"https://openalex.org/G4923903852","display_name":null,"funder_award_id":"332063","funder_id":"https://openalex.org/F4320321108","funder_display_name":"Academy of Finland"}],"funders":[{"id":"https://openalex.org/F4320321108","display_name":"Academy of 
Finland","ror":"https://ror.org/05k73zm37"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4390096820.pdf","grobid_xml":"https://content.openalex.org/works/W4390096820.grobid-xml"},"referenced_works_count":85,"referenced_works":["https://openalex.org/W126779258","https://openalex.org/W1518870451","https://openalex.org/W1555217905","https://openalex.org/W1581848821","https://openalex.org/W1591446137","https://openalex.org/W1635512741","https://openalex.org/W1844944916","https://openalex.org/W1967178846","https://openalex.org/W1978659076","https://openalex.org/W2008955172","https://openalex.org/W2022347952","https://openalex.org/W2043217973","https://openalex.org/W2045608181","https://openalex.org/W2046317813","https://openalex.org/W2075463086","https://openalex.org/W2075562975","https://openalex.org/W2078487085","https://openalex.org/W2086110556","https://openalex.org/W2095425552","https://openalex.org/W2103088716","https://openalex.org/W2109689830","https://openalex.org/W2113638573","https://openalex.org/W2114863372","https://openalex.org/W2120920848","https://openalex.org/W2128131274","https://openalex.org/W2147598479","https://openalex.org/W2152669807","https://openalex.org/W2153248083","https://openalex.org/W2162607306","https://openalex.org/W2166682639","https://openalex.org/W2241211221","https://openalex.org/W2395089112","https://openalex.org/W2402058645","https://openalex.org/W2403149086","https://openalex.org/W2490695385","https://openalex.org/W2541714600","https://openalex.org/W2592109325","https://openalex.org/W2611943505","https://openalex.org/W2617440445","https://openalex.org/W2763188033","https://openalex.org/W2765962757","https://openalex.org/W2772736377","https://openalex.org/W2772956764","https://openalex.org/W2800383133","https://openalex.org/W2810934215","https://openalex.org/W2884424734","https://openalex.org/W2892163332","https://openalex.org/W2898268964","https://openalex.org/W2899564885"
,"https://openalex.org/W2903426563","https://openalex.org/W2917254586","https://openalex.org/W2933305660","https://openalex.org/W2962731344","https://openalex.org/W2982341288","https://openalex.org/W3029436999","https://openalex.org/W3104196160","https://openalex.org/W3104757150","https://openalex.org/W3105684258","https://openalex.org/W3113688134","https://openalex.org/W3117312351","https://openalex.org/W3134150402","https://openalex.org/W3186050523","https://openalex.org/W3197097128","https://openalex.org/W3206552727","https://openalex.org/W4206633762","https://openalex.org/W4229050860","https://openalex.org/W4236344233","https://openalex.org/W4283759342","https://openalex.org/W4295312788","https://openalex.org/W4307782669","https://openalex.org/W4311648872","https://openalex.org/W4312654700","https://openalex.org/W4312920378","https://openalex.org/W6633378904","https://openalex.org/W6662704774","https://openalex.org/W6676895149","https://openalex.org/W6684354967","https://openalex.org/W6729017730","https://openalex.org/W6731619450","https://openalex.org/W6766975602","https://openalex.org/W6766978945","https://openalex.org/W6772220224","https://openalex.org/W6796629309","https://openalex.org/W6801320650","https://openalex.org/W6846841993"],"related_works":["https://openalex.org/W1991848873","https://openalex.org/W3004570917","https://openalex.org/W4389240440","https://openalex.org/W2084430325","https://openalex.org/W2317500761","https://openalex.org/W2809056180","https://openalex.org/W4372260199","https://openalex.org/W1578934236","https://openalex.org/W2329131175","https://openalex.org/W61728244"],"abstract_inverted_index":{"In":[0],"this":[1],"paper,":[2],"we":[3,36],"investigate":[4],"the":[5,42,93,101,106],"tasks":[6,32],"of":[7,29,40,45,103,114,128,183],"binaural":[8],"source":[9,47],"distance":[10,48,133,164,190],"estimation":[11,15,49,165],"(SDE)":[12],"and":[13,50,74,86,99,130,163,187,199],"direction-of-arrival":[14],"(DOAE)":[16],"using":[17],"motion-base
d":[18,171],"cues":[19,172],"in":[20,160,185,189],"a":[21,24,54,64,67,71,75,80,125,131,167,176,181,193],"scenario":[22],"with":[23,53,70,142,175],"walking":[25,147],"listener.":[26],"On":[27],"top":[28],"performing":[30],"both":[31,161],"as":[33,149,151,173],"separate":[34,202],"problems,":[35],"study":[37,83],"two":[38],"methods":[39],"solving":[41],"joint":[43,194],"task":[44],"simultaneous":[46],"localization":[51],"(SDEL),":[52],"single":[55],"model.":[56],"Experiments":[57],"are":[58,139],"conducted":[59],"for":[60,121,166,192,201],"three":[61,115],"different":[62],"scenarios:":[63],"static":[65,68,177],"receiver;":[66],"receiver":[69],"rotating":[72],"head;":[73],"freely":[76],"moving":[77],"listener":[78],"inside":[79],"room.":[81],"The":[82,109,154],"proposes":[84],"rotation":[85],"translation":[87],"features":[88],"to":[89,135,144],"include":[90,180],"information":[91],"about":[92],"receiver's":[94],"motion":[95],"during":[96],"model":[97,168],"training":[98],"studies":[100],"effects":[102],"these":[104],"on":[105],"final":[107],"performance.":[108],"work":[110],"includes":[111],"extended":[112],"simulation":[113],"datasets":[116],"containing":[117],"numerous":[118],"testing":[119],"scenarios":[120],"sound":[122],"sources,":[123],"covering":[124],"wide":[126],"range":[127],"DOAs":[129],"source-to-receiver":[132,152],"up":[134],"15":[136],"m.":[137],"Results":[138],"further":[140],"analyzed":[141],"respect":[143],"room":[145],"reverberation,":[146],"speed,":[148],"well":[150],"distance.":[153],"presented":[155],"outcomes":[156],"show":[157],"large":[158],"improvements":[159],"DOA":[162,186],"that":[169],"uses":[170],"compared":[174],"scenario.":[178],"These":[179],"decrease":[182],"9.50\u00b0":[184],"1.56m":[188],"errors":[191],"model,":[195],"followed":[196],"by":[197],"16.17\u00b0":[198],"0.17m":[200],"models.":[203]},"counts_by_year":[{"year":2026,"cited_by_count":6},{"year":2025,"cited_by_count":15},{"year":2024,"cited_by_count":2}],"updated_
date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
