{"id":"https://openalex.org/W4408345590","doi":"https://doi.org/10.1109/icassp49660.2025.10890756","title":"BiCG: Binaural Cue Generation from Unified HRTF Datasets","display_name":"BiCG: Binaural Cue Generation from Unified HRTF Datasets","publication_year":2025,"publication_date":"2025-03-12","ids":{"openalex":"https://openalex.org/W4408345590","doi":"https://doi.org/10.1109/icassp49660.2025.10890756"},"language":"en","primary_location":{"id":"doi:10.1109/icassp49660.2025.10890756","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49660.2025.10890756","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5039514709","display_name":"Xikun Lu","orcid":"https://orcid.org/0000-0003-0156-8805"},"institutions":[{"id":"https://openalex.org/I66867065","display_name":"East China Normal University","ror":"https://ror.org/02n96ep67","country_code":"CN","type":"education","lineage":["https://openalex.org/I66867065"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xikun Lu","raw_affiliation_strings":["East China Normal University,Lab of Artificial Intelligence for Education,China"],"affiliations":[{"raw_affiliation_string":"East China Normal University,Lab of Artificial Intelligence for Education,China","institution_ids":["https://openalex.org/I66867065"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100781540","display_name":"Yilei Wang","orcid":"https://orcid.org/0009-0000-2743-4595"},"institutions":[{"id":"https://openalex.org/I66867065","display_name":"East China Normal University","ror":"https://ror.org/02n96ep67","country_code":"CN","type":"education","lineage":["https://openalex.org/I66867065"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yilei Wang","raw_affiliation_strings":["East China Normal University,Lab of Artificial Intelligence for Education,China"],"affiliations":[{"raw_affiliation_string":"East China Normal University,Lab of Artificial Intelligence for Education,China","institution_ids":["https://openalex.org/I66867065"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004094994","display_name":"Jinqiu Sang","orcid":"https://orcid.org/0000-0002-4368-8787"},"institutions":[{"id":"https://openalex.org/I66867065","display_name":"East China Normal University","ror":"https://ror.org/02n96ep67","country_code":"CN","type":"education","lineage":["https://openalex.org/I66867065"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jinqiu Sang","raw_affiliation_strings":["East China Normal University,Lab of Artificial Intelligence for Education,China"],"affiliations":[{"raw_affiliation_string":"East China Normal University,Lab of Artificial Intelligence for Education,China","institution_ids":["https://openalex.org/I66867065"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5070266277","display_name":"Chengshi Zheng","orcid":"https://orcid.org/0000-0001-5656-994X"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210099069","display_name":"Institute of Acoustics","ror":"https://ror.org/00v8rqv75","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210099069"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chengshi Zheng","raw_affiliation_strings":["Institute of Acoustics Chinese Academy of Sciences,Key Laboratory of Noise and Vibration Research,Beijing,China"],"affiliations":[{"raw_affiliation_string":"Institute of Acoustics Chinese Academy of Sciences,Key Laboratory of Noise and Vibration Research,Beijing,China","institution_ids":["https://openalex.org/I4210099069","https://openalex.org/I19820366"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5039514709"],"corresponding_institution_ids":["https://openalex.org/I66867065"],"apc_list":null,"apc_paid":null,"fwci":2.6381,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.88322182,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9416000247001648,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9416000247001648,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9223999977111816,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9190999865531921,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/binaural-recording","display_name":"Binaural recording","score":0.7800220251083374},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5774143934249878},{"id":"https://openalex.org/keywords/acoustics","display_name":"Acoustics","score":0.4989032745361328},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.45497772097587585},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.06472879648208618}],"concepts":[{"id":"https://openalex.org/C201247586","wikidata":"https://www.wikidata.org/wiki/Q5612967","display_name":"Binaural recording","level":2,"score":0.7800220251083374},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5774143934249878},{"id":"https://openalex.org/C24890656","wikidata":"https://www.wikidata.org/wiki/Q82811","display_name":"Acoustics","level":1,"score":0.4989032745361328},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.45497772097587585},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.06472879648208618}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp49660.2025.10890756","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49660.2025.10890756","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320322370","display_name":"East China Normal University","ror":"https://ror.org/02n96ep67"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":28,"referenced_works":["https://openalex.org/W1677820382","https://openalex.org/W1792834816","https://openalex.org/W1976125225","https://openalex.org/W2013020033","https://openalex.org/W2028115554","https://openalex.org/W2064394144","https://openalex.org/W2067042811","https://openalex.org/W2096439661","https://openalex.org/W2108668360","https://openalex.org/W2119613492","https://openalex.org/W2622609602","https://openalex.org/W2795721446","https://openalex.org/W2898527280","https://openalex.org/W2942039225","https://openalex.org/W3044194010","https://openalex.org/W4280592948","https://openalex.org/W4297846303","https://openalex.org/W4316037400","https://openalex.org/W4372185154","https://openalex.org/W4372266895","https://openalex.org/W4372348473","https://openalex.org/W4386764115","https://openalex.org/W4392667195","https://openalex.org/W4392902990","https://openalex.org/W4392910510","https://openalex.org/W6677656871","https://openalex.org/W6740650116","https://openalex.org/W6779753539"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2766995619","https://openalex.org/W4224270619","https://openalex.org/W2579722767","https://openalex.org/W2168148781","https://openalex.org/W1991848873","https://openalex.org/W2026165661","https://openalex.org/W1979944951"],"abstract_inverted_index":{"Head-related":[0],"transfer":[1],"functions":[2],"(HRTFs)":[3],"are":[4,35],"important":[5],"for":[6,37],"spatial":[7],"audio":[8],"reproduction":[9,39],"in":[10,50,100],"immersive":[11],"systems.":[12],"Most":[13],"existing":[14,96],"data-driven":[15,60],"methods":[16,27,99],"focus":[17],"on":[18],"personalized":[19],"HRTF":[20,48,137],"estimation":[21],"of":[22,31,59,102],"monaural":[23],"spectral":[24],"factors.":[25],"These":[26],"ignore":[28],"the":[29,43,57],"importance":[30],"binaural":[32,38,66,103,124],"cues,":[33],"which":[34,71],"essential":[36],"and":[40,84,116],"perception.":[41],"Moreover,":[42],"significant":[44],"differences":[45,82,87],"among":[46],"various":[47,112],"datasets":[49],"aspects":[51],"such":[52],"as":[53],"measurement":[54],"setup":[55],"limit":[56],"potential":[58],"methods.":[61],"This":[62],"paper":[63],"proposes":[64],"a":[65],"cue":[67,104,125],"generation":[68,105,126],"method":[69,94],"(BiCG),":[70],"utilizes":[72],"an":[73],"implicit":[74],"neural":[75,97],"network":[76],"(INN)":[77],"to":[78],"estimate":[79],"interaural":[80,85],"level":[81],"(ILDs)":[83],"time":[86],"(ITDs).":[88],"Experimental":[89],"results":[90,118],"show":[91,119],"that":[92,120],"our":[93],"outperforms":[95],"field":[98],"terms":[101],"quality":[106],"across":[107,128],"datasets.":[108,129],"We":[109],"also":[110],"evaluate":[111],"data":[113],"preprocessing":[114],"methods,":[115],"experimental":[117],"extreme":[121],"smoothing":[122],"improves":[123],"performance":[127],"The":[130],"work":[131],"provides":[132],"new":[133],"insights":[134],"into":[135],"enhancing":[136],"modeling.":[138]},"counts_by_year":[{"year":2025,"cited_by_count":2}],"updated_date":"2025-12-28T23:10:05.387466","created_date":"2025-10-10T00:00:00"}
