{"id":"https://openalex.org/W4391021723","doi":"https://doi.org/10.1109/asru57964.2023.10389644","title":"Improving Multilingual and Code-Switching ASR Using Large Language Model Generated Text","display_name":"Improving Multilingual and Code-Switching ASR Using Large Language Model Generated Text","publication_year":2023,"publication_date":"2023-12-16","ids":{"openalex":"https://openalex.org/W4391021723","doi":"https://doi.org/10.1109/asru57964.2023.10389644"},"language":"en","primary_location":{"id":"doi:10.1109/asru57964.2023.10389644","is_oa":false,"landing_page_url":"https://doi.org/10.1109/asru57964.2023.10389644","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100691013","display_name":"Ke Hu","orcid":"https://orcid.org/0000-0001-7501-0420"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Ke Hu","raw_affiliation_strings":["Google LLC,USA","Google LLC, USA"],"affiliations":[{"raw_affiliation_string":"Google LLC,USA","institution_ids":["https://openalex.org/I1291425158"]},{"raw_affiliation_string":"Google LLC, USA","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070513394","display_name":"Tara N. Sainath","orcid":"https://orcid.org/0000-0002-4126-6556"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Tara N. Sainath","raw_affiliation_strings":["Google LLC,USA","Google LLC, USA"],"affiliations":[{"raw_affiliation_string":"Google LLC,USA","institution_ids":["https://openalex.org/I1291425158"]},{"raw_affiliation_string":"Google LLC, USA","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100374448","display_name":"Bo Li","orcid":"https://orcid.org/0000-0002-6711-3603"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Bo Li","raw_affiliation_strings":["Google LLC,USA","Google LLC, USA"],"affiliations":[{"raw_affiliation_string":"Google LLC,USA","institution_ids":["https://openalex.org/I1291425158"]},{"raw_affiliation_string":"Google LLC, USA","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100433648","display_name":"Yu Zhang","orcid":"https://orcid.org/0000-0002-9505-1833"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yu Zhang","raw_affiliation_strings":["Google LLC,USA","Google LLC, USA"],"affiliations":[{"raw_affiliation_string":"Google LLC,USA","institution_ids":["https://openalex.org/I1291425158"]},{"raw_affiliation_string":"Google LLC, USA","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100349974","display_name":"Yong Cheng","orcid":"https://orcid.org/0000-0001-9043-8302"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yong Cheng","raw_affiliation_strings":["Google LLC,USA","Google LLC, USA"],"affiliations":[{"raw_affiliation_string":"Google LLC,USA","institution_ids":["https://openalex.org/I1291425158"]},{"raw_affiliation_string":"Google LLC, USA","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100453544","display_name":"Tao Wang","orcid":"https://orcid.org/0000-0002-5121-0599"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Tao Wang","raw_affiliation_strings":["Google LLC,USA","Google LLC, USA"],"affiliations":[{"raw_affiliation_string":"Google LLC,USA","institution_ids":["https://openalex.org/I1291425158"]},{"raw_affiliation_string":"Google LLC, USA","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100326151","display_name":"Yujing Zhang","orcid":"https://orcid.org/0000-0003-3878-0690"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yujing Zhang","raw_affiliation_strings":["Google LLC,USA","Google LLC, USA"],"affiliations":[{"raw_affiliation_string":"Google LLC,USA","institution_ids":["https://openalex.org/I1291425158"]},{"raw_affiliation_string":"Google LLC, USA","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5015466440","display_name":"Frederick Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Frederick Liu","raw_affiliation_strings":["Google LLC,USA","Google LLC, USA"],"affiliations":[{"raw_affiliation_string":"Google LLC,USA","institution_ids":["https://openalex.org/I1291425158"]},{"raw_affiliation_string":"Google LLC, USA","institution_ids":["https://openalex.org/I1291425158"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5100691013"],"corresponding_institution_ids":["https://openalex.org/I1291425158"],"apc_list":null,"apc_paid":null,"fwci":0.8526,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.79814428,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"7"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.996399998664856,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9962000250816345,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/code-switching","display_name":"Code-switching","score":0.8483890295028687},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7947555780410767},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.6084420680999756},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.5683177709579468},{"id":"https://openalex.org/keywords/mandarin-chinese","display_name":"Mandarin Chinese","score":0.4963684678077698},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4824724495410919},{"id":"https://openalex.org/keywords/word-error-rate","display_name":"Word error rate","score":0.46608230471611023},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.45552217960357666},{"id":"https://openalex.org/keywords/reduction","display_name":"Reduction (mathematics)","score":0.43618762493133545},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.3818933367729187},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.36363720893859863},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.17663386464118958},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.1346781849861145},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.07117977738380432}],"concepts":[{"id":"https://openalex.org/C18552078","wikidata":"https://www.wikidata.org/wiki/Q255615","display_name":"Code-switching","level":2,"score":0.8483890295028687},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7947555780410767},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.6084420680999756},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.5683177709579468},{"id":"https://openalex.org/C138954614","wikidata":"https://www.wikidata.org/wiki/Q9192","display_name":"Mandarin Chinese","level":2,"score":0.4963684678077698},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4824724495410919},{"id":"https://openalex.org/C40969351","wikidata":"https://www.wikidata.org/wiki/Q3516228","display_name":"Word error rate","level":2,"score":0.46608230471611023},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.45552217960357666},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.43618762493133545},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.3818933367729187},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.36363720893859863},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.17663386464118958},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.1346781849861145},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.07117977738380432},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/asru57964.2023.10389644","is_oa":false,"landing_page_url":"https://doi.org/10.1109/asru57964.2023.10389644","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.6399999856948853,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":48,"referenced_works":["https://openalex.org/W1828163288","https://openalex.org/W2577366047","https://openalex.org/W2791281350","https://openalex.org/W2899073901","https://openalex.org/W2939069254","https://openalex.org/W2963240019","https://openalex.org/W2963431393","https://openalex.org/W2972417954","https://openalex.org/W3016234571","https://openalex.org/W3034724424","https://openalex.org/W3097961301","https://openalex.org/W3163203022","https://openalex.org/W3168867926","https://openalex.org/W3171500670","https://openalex.org/W3174770825","https://openalex.org/W3176614736","https://openalex.org/W3198442913","https://openalex.org/W3207222250","https://openalex.org/W4205991051","https://openalex.org/W4223622550","https://openalex.org/W4224308101","https://openalex.org/W4225295099","https://openalex.org/W4225319488","https://openalex.org/W4226120743","https://openalex.org/W4281770669","https://openalex.org/W4296069150","https://openalex.org/W4319862474","https://openalex.org/W4319862717","https://openalex.org/W4322718191","https://openalex.org/W4322825254","https://openalex.org/W4372259777","https://openalex.org/W4372266937","https://openalex.org/W4375958083","https://openalex.org/W4381827575","https://openalex.org/W4385245566","https://openalex.org/W4385823078","https://openalex.org/W6638749077","https://openalex.org/W6739901393","https://openalex.org/W6755461288","https://openalex.org/W6796581206","https://openalex.org/W6803092890","https://openalex.org/W6805239564","https://openalex.org/W6810081322","https://openalex.org/W6850477478","https://openalex.org/W6850625674","https://openalex.org/W6852326057","https://openalex.org/W6852800892","https://openalex.org/W6853998256"],"related_works":["https://openalex.org/W2163874654","https://openalex.org/W1566315437","https://openalex.org/W4221142855","https://openalex.org/W2594897229","https://openalex.org/W2151348424","https://openalex.org/W2050138804","https://openalex.org/W767271433","https://openalex.org/W4290708361","https://openalex.org/W2129812225","https://openalex.org/W2523799048"],"abstract_inverted_index":{"We":[0,77],"investigate":[1],"using":[2,43],"large":[3],"language":[4],"models":[5],"(LLMs)":[6],"to":[7,39,62,66,109,113,123,139],"generate":[8,40,67,140],"text-only":[9],"training":[10],"data":[11,42,54,73],"for":[12,74,127,151,181],"improving":[13],"multilingual":[14,28,69,89,94,188],"and":[15,90,144,164,170,184],"code-switching":[16,91,133,142,153,190],"automatic":[17],"speech":[18],"recognition":[19],"(ASR)":[20],"through":[21],"a":[22,27,31,97,114,146,152],"text":[23,41,53,72,75,117,143,182],"injection":[24,186],"method.":[25],"In":[26],"setup":[29],"or":[30,70,189],"low-resource":[32],"scenario":[33],"such":[34],"as":[35,156,158],"code-switching,":[36],"we":[37,58,135],"propose":[38],"the":[44,51,132],"state-of-the-art":[45],"PaLM":[46,64],"2.":[47],"To":[48],"better":[49],"match":[50],"generated":[52],"with":[55],"specific":[56],"tasks,":[57],"use":[59,136],"prompt":[60],"tuning":[61],"adapt":[63],"2":[65],"domain-relevant":[68],"code-switched":[71],"injection.":[76,118],"can":[78],"achieve":[79,145],"significant":[80],"improvements":[81],"in":[82,87,131,161],"Word":[83],"Error":[84],"Rate":[85],"(WER)":[86],"both":[88,162],"scenarios.":[92],"The":[93,119],"experiment":[95],"shows":[96],"$6.2":[98],"\\%$":[99,108,125,169,172],"relative":[100,148],"WER":[101,149,159],"reduction":[102,150],"on":[103],"average,":[104],"i.e.,":[105],"from":[106],"$11.25":[107],"$10.55":[110],"\\%$,":[111],"compared":[112],"baseline":[115],"without":[116],"improvement":[120,126],"is":[121],"up":[122],"$23.1":[124],"certain":[128],"languages.":[129],"While":[130],"scenario,":[134],"English-only":[137],"prompts":[138],"Mandarin-English":[141],"3.6%":[147],"test":[154],"set,":[155],"well":[157],"reductions":[160],"English":[163],"Mandarin":[165],"monolingual":[166],"scenarios,":[167],"$5.3":[168],"$8.5":[171],"relative,":[173],"respectively.":[174],"Our":[175],"findings":[176],"demonstrate":[177],"that":[178],"leveraging":[179],"LLMs":[180],"generation":[183],"then":[185],"benefits":[187],"ASR":[191],"tasks.":[192]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":2}],"updated_date":"2026-04-23T09:07:50.710637","created_date":"2025-10-10T00:00:00"}
