{"id":"https://openalex.org/W4387869670","doi":"https://doi.org/10.1109/mlsp55844.2023.10285936","title":"Voice Direction-Of-Arrival Conversion","display_name":"Voice Direction-Of-Arrival Conversion","publication_year":2023,"publication_date":"2023-09-17","ids":{"openalex":"https://openalex.org/W4387869670","doi":"https://doi.org/10.1109/mlsp55844.2023.10285936"},"language":"en","primary_location":{"id":"doi:10.1109/mlsp55844.2023.10285936","is_oa":false,"landing_page_url":"https://doi.org/10.1109/mlsp55844.2023.10285936","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE 33rd International Workshop on Machine Learning for Signal Processing (MLSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5074950328","display_name":"I-Chun Chern","orcid":null},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"I-Chun Chern","raw_affiliation_strings":["Carnegie Mellon University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033466933","display_name":"Steffi Chern","orcid":null},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Steffi Chern","raw_affiliation_strings":["Carnegie Mellon University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031290759","display_name":"Heng-Cheng Kuo","orcid":null},"institutions":[{"id":"https://openalex.org/I84653119","display_name":"Academia Sinica","ror":"https://ror.org/05bxb3784","country_code":"TW","type":"facility","lineage":["https://openalex.org/I84653119"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Heng-Cheng Kuo","raw_affiliation_strings":["Academia Sinica"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Academia Sinica","institution_ids":["https://openalex.org/I84653119"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034788095","display_name":"H. Eric Tseng","orcid":"https://orcid.org/0000-0001-9544-4226"},"institutions":[{"id":"https://openalex.org/I200870766","display_name":"Brookhaven National Laboratory","ror":"https://ror.org/02ex6cf31","country_code":"US","type":"facility","lineage":["https://openalex.org/I1330989302","https://openalex.org/I200870766","https://openalex.org/I39565521","https://openalex.org/I4210142672"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Huan-Hsin Tseng","raw_affiliation_strings":["Brookhaven National Laboratory"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Brookhaven National Laboratory","institution_ids":["https://openalex.org/I200870766"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064333828","display_name":"Kuo-Hsuan Hung","orcid":"https://orcid.org/0000-0002-6298-5269"},"institutions":[{"id":"https://openalex.org/I84653119","display_name":"Academia Sinica","ror":"https://ror.org/05bxb3784","country_code":"TW","type":"facility","lineage":["https://openalex.org/I84653119"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Kuo-Hsuan Hung","raw_affiliation_strings":["Academia Sinica"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Academia Sinica","institution_ids":["https://openalex.org/I84653119"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5044008055","display_name":"Yu Tsao","orcid":"https://orcid.org/0000-0001-6956-0418"},"institutions":[{"id":"https://openalex.org/I84653119","display_name":"Academia Sinica","ror":"https://ror.org/05bxb3784","country_code":"TW","type":"facility","lineage":["https://openalex.org/I84653119"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Yu Tsao","raw_affiliation_strings":["Academia Sinica"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Academia Sinica","institution_ids":["https://openalex.org/I84653119"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5074950328"],"corresponding_institution_ids":["https://openalex.org/I74973139"],"apc_list":null,"apc_paid":null,"fwci":0.1915,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.45256513,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11233","display_name":"Advanced Adaptive Filtering Techniques","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10283","display_name":"Hearing Loss and Rehabilitation","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7625919580459595},{"id":"https://openalex.org/keywords/direction-of-arrival","display_name":"Direction of arrival","score":0.6824199557304382},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6363385319709778},{"id":"https://openalex.org/keywords/avatar","display_name":"Avatar","score":0.5793941020965576},{"id":"https://openalex.org/keywords/intelligibility","display_name":"Intelligibility (philosophy)","score":0.5022552013397217},{"id":"https://openalex.org/keywords/distortion","display_name":"Distortion (music)","score":0.47723105549812317},{"id":"https://openalex.org/keywords/channel","display_name":"Channel (broadcasting)","score":0.4296301007270813},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.410910964012146},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.2788664698600769},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.17822042107582092},{"id":"https://openalex.org/keywords/bandwidth","display_name":"Bandwidth (computing)","score":0.15047407150268555},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.14433318376541138}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7625919580459595},{"id":"https://openalex.org/C172051844","wikidata":"https://www.wikidata.org/wiki/Q5280438","display_name":"Direction of arrival","level":3,"score":0.6824199557304382},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6363385319709778},{"id":"https://openalex.org/C2777365542","wikidata":"https://www.wikidata.org/wiki/Q83090","display_name":"Avatar","level":2,"score":0.5793941020965576},{"id":"https://openalex.org/C60048801","wikidata":"https://www.wikidata.org/wiki/Q1433889","display_name":"Intelligibility (philosophy)","level":2,"score":0.5022552013397217},{"id":"https://openalex.org/C126780896","wikidata":"https://www.wikidata.org/wiki/Q899871","display_name":"Distortion (music)","level":4,"score":0.47723105549812317},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.4296301007270813},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.410910964012146},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.2788664698600769},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.17822042107582092},{"id":"https://openalex.org/C2776257435","wikidata":"https://www.wikidata.org/wiki/Q1576430","display_name":"Bandwidth (computing)","level":2,"score":0.15047407150268555},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.14433318376541138},{"id":"https://openalex.org/C21822782","wikidata":"https://www.wikidata.org/wiki/Q131214","display_name":"Antenna (radio)","level":2,"score":0.0},{"id":"https://openalex.org/C194257627","wikidata":"https://www.wikidata.org/wiki/Q211554","display_name":"Amplifier","level":3,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/mlsp55844.2023.10285936","is_oa":false,"landing_page_url":"https://doi.org/10.1109/mlsp55844.2023.10285936","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE 33rd International Workshop on Machine Learning for Signal Processing (MLSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":30,"referenced_works":["https://openalex.org/W658204242","https://openalex.org/W1603075283","https://openalex.org/W1969146847","https://openalex.org/W1979972347","https://openalex.org/W1988655689","https://openalex.org/W1990048725","https://openalex.org/W2045740791","https://openalex.org/W2057077708","https://openalex.org/W2061074721","https://openalex.org/W2066218102","https://openalex.org/W2109958193","https://openalex.org/W2113638573","https://openalex.org/W2128131274","https://openalex.org/W2166117654","https://openalex.org/W2194775991","https://openalex.org/W2298224832","https://openalex.org/W2398042854","https://openalex.org/W2611943505","https://openalex.org/W2640112133","https://openalex.org/W2763188033","https://openalex.org/W2767071179","https://openalex.org/W2810871807","https://openalex.org/W2952350176","https://openalex.org/W2962896155","https://openalex.org/W3095333614","https://openalex.org/W3104757150","https://openalex.org/W3162341667","https://openalex.org/W4205742757","https://openalex.org/W6645056189","https://openalex.org/W6784285862"],"related_works":["https://openalex.org/W3138471234","https://openalex.org/W4247958311","https://openalex.org/W4396832849","https://openalex.org/W2785089443","https://openalex.org/W2265117524","https://openalex.org/W4312431072","https://openalex.org/W1467576422","https://openalex.org/W4220730560","https://openalex.org/W2969390373","https://openalex.org/W2604471456"],"abstract_inverted_index":{"The":[0,100],"demand":[1],"for":[2],"augmented":[3],"reality":[4,8],"(AR)":[5],"and":[6,31,121],"virtual":[7,21],"(VR)":[9],"is":[10],"steadily":[11],"rising.":[12],"To":[13],"provide":[14],"the":[15,29,36,48,52,72,79,108],"best":[16],"user":[17],"experience":[18],"in":[19],"a":[20,60,87],"environment,":[22],"their":[23],"applications":[24],"must":[25],"ensure":[26],"consistency":[27],"between":[28],"visual":[30],"audio":[32],"signals":[33,76,113],"perceived":[34],"by":[35],"users.":[37],"For":[38],"example,":[39],"when":[40],"an":[41],"avatar":[42,53],"(sound":[43],"source)":[44],"speaks":[45],"while":[46,77,117],"moving,":[47],"arrival":[49,64],"direction":[50,62],"of":[51,63,74,110],"changes.":[54],"In":[55],"this":[56],"paper,":[57],"we":[58,84],"introduce":[59],"voice":[61],"(DOA)":[65],"conversion":[66,91],"task":[67],"that":[68,93,103],"aims":[69],"to":[70],"change":[71],"DOA":[73,90,98,109],"speech":[75,89,97,112,119],"keeping":[78],"remaining":[80],"components":[81],"unaltered.":[82],"Furthermore,":[83],"propose":[85],"DOAC-Net,":[86],"novel":[88],"system":[92],"can":[94,105],"perform":[95],"causal":[96],"conversion.":[99],"results":[101],"show":[102],"DOAC-Net":[104],"effectively":[106],"convert":[107],"multi-channel":[111],"with":[114],"little":[115],"distortion,":[116],"maintaining":[118],"quality":[120],"intelligibility.":[122]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-04-28T14:05:53.105641","created_date":"2025-10-10T00:00:00"}
