{"id":"https://openalex.org/W4408345790","doi":"https://doi.org/10.1109/icassp49660.2025.10889894","title":"Enhancing Low-Resource ASR through Versatile TTS: Bridging the Data Gap","display_name":"Enhancing Low-Resource ASR through Versatile TTS: Bridging the Data Gap","publication_year":2025,"publication_date":"2025-03-12","ids":{"openalex":"https://openalex.org/W4408345790","doi":"https://doi.org/10.1109/icassp49660.2025.10889894"},"language":"en","primary_location":{"id":"doi:10.1109/icassp49660.2025.10889894","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49660.2025.10889894","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5111310847","display_name":"Guanrou Yang","orcid":null},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Guanrou Yang","raw_affiliation_strings":["Shanghai Jiao Tong University,MoE Key Lab of Artificial Intelligence, AI Institute, X-LANCE Lab,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University,MoE Key Lab of Artificial Intelligence, AI Institute, X-LANCE Lab,China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016098560","display_name":"Yu Fan","orcid":"https://orcid.org/0000-0003-3743-3988"},"institutions":[{"id":"https://openalex.org/I45928872","display_name":"Alibaba Group (China)","ror":"https://ror.org/00k642b80","country_code":"CN","type":"company","lineage":["https://openalex.org/I45928872"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Fan Yu","raw_affiliation_strings":["Alibaba Group,Institute for Intelligent Computing,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Alibaba Group,Institute for Intelligent Computing,China","institution_ids":["https://openalex.org/I45928872"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100438492","display_name":"Ziyang Ma","orcid":"https://orcid.org/0000-0002-0623-9114"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ziyang Ma","raw_affiliation_strings":["Shanghai Jiao Tong University,MoE Key Lab of Artificial Intelligence, AI Institute, X-LANCE Lab,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University,MoE Key Lab of Artificial Intelligence, AI Institute, X-LANCE Lab,China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001133136","display_name":"Zhihao Du","orcid":"https://orcid.org/0000-0003-3509-9322"},"institutions":[{"id":"https://openalex.org/I45928872","display_name":"Alibaba Group (China)","ror":"https://ror.org/00k642b80","country_code":"CN","type":"company","lineage":["https://openalex.org/I45928872"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhihao Du","raw_affiliation_strings":["Alibaba Group,Institute for Intelligent Computing,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Alibaba Group,Institute for Intelligent Computing,China","institution_ids":["https://openalex.org/I45928872"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109593343","display_name":"Zhifu Gao","orcid":null},"institutions":[{"id":"https://openalex.org/I45928872","display_name":"Alibaba Group (China)","ror":"https://ror.org/00k642b80","country_code":"CN","type":"company","lineage":["https://openalex.org/I45928872"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhifu Gao","raw_affiliation_strings":["Alibaba Group,Institute for Intelligent Computing,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Alibaba Group,Institute for Intelligent Computing,China","institution_ids":["https://openalex.org/I45928872"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055433405","display_name":"Shiliang Zhang","orcid":"https://orcid.org/0000-0001-9053-9314"},"institutions":[{"id":"https://openalex.org/I45928872","display_name":"Alibaba Group (China)","ror":"https://ror.org/00k642b80","country_code":"CN","type":"company","lineage":["https://openalex.org/I45928872"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shiliang Zhang","raw_affiliation_strings":["Alibaba Group,Institute for Intelligent Computing,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Alibaba Group,Institute for Intelligent Computing,China","institution_ids":["https://openalex.org/I45928872"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101644122","display_name":"Xie Chen","orcid":"https://orcid.org/0000-0003-1295-9166"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xie Chen","raw_affiliation_strings":["Shanghai Jiao Tong University,MoE Key Lab of Artificial Intelligence, AI Institute, X-LANCE Lab,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University,MoE Key Lab of Artificial Intelligence, AI Institute, X-LANCE Lab,China","institution_ids":["https://openalex.org/I183067930"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5111310847"],"corresponding_institution_ids":["https://openalex.org/I183067930"],"apc_list":null,"apc_paid":null,"fwci":9.3032,"has_fulltext":false,"cited_by_count":9,"citation_normalized_percentile":{"value":0.98057501,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10876","display_name":"Fault Detection and Control Systems","score":0.9027000069618225,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10876","display_name":"Fault Detection and Control Systems","score":0.9027000069618225,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/bridging","display_name":"Bridging (networking)","score":0.9296509027481079},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6548376083374023},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.11990749835968018}],"concepts":[{"id":"https://openalex.org/C174348530","wikidata":"https://www.wikidata.org/wiki/Q188635","display_name":"Bridging (networking)","level":2,"score":0.9296509027481079},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6548376083374023},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.11990749835968018}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp49660.2025.10889894","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49660.2025.10889894","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Decent work and economic growth","id":"https://metadata.un.org/sdg/8","score":0.5199999809265137}],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":34,"referenced_works":["https://openalex.org/W2890964092","https://openalex.org/W2936774411","https://openalex.org/W2963609956","https://openalex.org/W2983434507","https://openalex.org/W3015522062","https://openalex.org/W3015654635","https://openalex.org/W3024464021","https://openalex.org/W3095350795","https://openalex.org/W3097206152","https://openalex.org/W3097777922","https://openalex.org/W3208049241","https://openalex.org/W3211278025","https://openalex.org/W4252812408","https://openalex.org/W4380047557","https://openalex.org/W4385572536","https://openalex.org/W4385822824","https://openalex.org/W4391833199","https://openalex.org/W4392904157","https://openalex.org/W4392909810","https://openalex.org/W4402111804","https://openalex.org/W4403653255","https://openalex.org/W4403653755","https://openalex.org/W4403653940","https://openalex.org/W4406417959","https://openalex.org/W6771467084","https://openalex.org/W6777694618","https://openalex.org/W6795261426","https://openalex.org/W6847363464","https://openalex.org/W6848735303","https://openalex.org/W6850334629","https://openalex.org/W6852653005","https://openalex.org/W6869301554","https://openalex.org/W6869471027","https://openalex.org/W6870225445"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W4388870064","https://openalex.org/W2210139803","https://openalex.org/W4235186151","https://openalex.org/W2054685365","https://openalex.org/W2056057048","https://openalex.org/W2667588871","https://openalex.org/W2272354214"],"abstract_inverted_index":{"While":[0],"automatic":[1],"speech":[2,46,118],"recognition":[3],"(ASR)":[4],"systems":[5],"have":[6],"achieved":[7],"remarkable":[8],"performance":[9,85],"with":[10,29,47,139],"large-scale":[11],"datasets,":[12],"their":[13],"efficacy":[14],"remains":[15],"inadequate":[16],"in":[17,148],"low-resource":[18,79,94,173],"settings,":[19],"encompassing":[20],"dialects,":[21],"accents,":[22],"minority":[23],"languages,":[24],"and":[25,38,51,64,83,104,133,158,168],"long-tail":[26],"hotwords,":[27],"domains":[28],"significant":[30],"practical":[31,65,162],"relevance.":[32],"With":[33],"the":[34,89,134,145,161,170],"advent":[35],"of":[36,44,78,92,116,136,164,172],"versatile":[37,98],"powerful":[39],"text-to-speech":[40],"(TTS)":[41],"models,":[42],"capable":[43],"generating":[45],"human-level":[48],"naturalness,":[49],"expressiveness,":[50],"diverse":[52],"speaker":[53,131],"profiles,":[54],"leveraging":[55],"TTS":[56,99],"for":[57,144,160],"ASR":[58,69,95,123,174],"data":[59,119,166],"augmentation":[60,167],"provides":[61],"a":[62,97],"cost-effective":[63],"approach":[66],"to":[67,122],"enhancing":[68,93],"performance.":[70],"Comprehensive":[71],"experiments":[72],"on":[73],"an":[74],"unprecedentedly":[75],"rich":[76],"variety":[77],"datasets":[80],"demonstrate":[81],"consistent":[82],"substantial":[84],"improvements,":[86],"proving":[87],"that":[88,120],"proposed":[90],"method":[91],"through":[96],"model":[100],"is":[101],"highly":[102],"effective":[103],"has":[105],"broad":[106],"application":[107,163],"prospects.":[108],"Furthermore,":[109],"we":[110],"delve":[111],"deeper":[112],"into":[113],"key":[114],"characteristics":[115],"synthesized":[117,137],"contribute":[121],"improvement,":[124],"examining":[125],"factors":[126],"such":[127],"as":[128],"text":[129,140],"diversity,":[130,132],"volume":[135],"data,":[138],"diversity":[141],"being":[142],"studied":[143],"first":[146],"time":[147],"this":[149],"work.":[150],"We":[151],"hope":[152],"our":[153],"findings":[154],"provide":[155],"helpful":[156],"guidance":[157],"reference":[159],"TTS-based":[165],"push":[169],"advancement":[171],"one":[175],"step":[176],"further.":[177]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":6}],"updated_date":"2026-05-10T08:33:47.465468","created_date":"2025-10-10T00:00:00"}
