{"id":"https://openalex.org/W4406461663","doi":"https://doi.org/10.1109/slt61566.2024.10832265","title":"Enhancing Code-Switching Speech Recognition With LID-Based Collaborative Mixture of Experts Model","display_name":"Enhancing Code-Switching Speech Recognition With LID-Based Collaborative Mixture of Experts Model","publication_year":2024,"publication_date":"2024-12-02","ids":{"openalex":"https://openalex.org/W4406461663","doi":"https://doi.org/10.1109/slt61566.2024.10832265"},"language":"en","primary_location":{"id":"doi:10.1109/slt61566.2024.10832265","is_oa":false,"landing_page_url":"https://doi.org/10.1109/slt61566.2024.10832265","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE Spoken Language Technology Workshop (SLT)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5109692702","display_name":"Hukai Huang","orcid":null},"institutions":[{"id":"https://openalex.org/I191208505","display_name":"Xiamen University","ror":"https://ror.org/00mcjh785","country_code":"CN","type":"education","lineage":["https://openalex.org/I191208505"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Hukai Huang","raw_affiliation_strings":["Xiamen University,School of Informatics,China"],"affiliations":[{"raw_affiliation_string":"Xiamen University,School of Informatics,China","institution_ids":["https://openalex.org/I191208505"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111094266","display_name":"Jiayan Lin","orcid":"https://orcid.org/0000-0002-0305-2784"},"institutions":[{"id":"https://openalex.org/I191208505","display_name":"Xiamen University","ror":"https://ror.org/00mcjh785","country_code":"CN","type":"education","lineage":["https://openalex.org/I191208505"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiayan Lin","raw_affiliation_strings":["Xiamen University,School of Informatics,China"],"affiliations":[{"raw_affiliation_string":"Xiamen University,School of Informatics,China","institution_ids":["https://openalex.org/I191208505"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113251188","display_name":"Kaidi Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I191208505","display_name":"Xiamen University","ror":"https://ror.org/00mcjh785","country_code":"CN","type":"education","lineage":["https://openalex.org/I191208505"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kaidi Wang","raw_affiliation_strings":["Xiamen University,School of Informatics,China"],"affiliations":[{"raw_affiliation_string":"Xiamen University,School of Informatics,China","institution_ids":["https://openalex.org/I191208505"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112932714","display_name":"Yishuang Li","orcid":"https://orcid.org/0009-0003-3466-0701"},"institutions":[{"id":"https://openalex.org/I191208505","display_name":"Xiamen University","ror":"https://ror.org/00mcjh785","country_code":"CN","type":"education","lineage":["https://openalex.org/I191208505"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yishuang Li","raw_affiliation_strings":["Xiamen University,Institute of Artificial Intelligence,China"],"affiliations":[{"raw_affiliation_string":"Xiamen University,Institute of Artificial Intelligence,China","institution_ids":["https://openalex.org/I191208505"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111310824","display_name":"Wenhao Guan","orcid":null},"institutions":[{"id":"https://openalex.org/I191208505","display_name":"Xiamen University","ror":"https://ror.org/00mcjh785","country_code":"CN","type":"education","lineage":["https://openalex.org/I191208505"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenhao Guan","raw_affiliation_strings":["Xiamen University,School of Informatics,China"],"affiliations":[{"raw_affiliation_string":"Xiamen University,School of Informatics,China","institution_ids":["https://openalex.org/I191208505"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100412926","display_name":"Lin Li","orcid":"https://orcid.org/0000-0003-0426-6546"},"institutions":[{"id":"https://openalex.org/I191208505","display_name":"Xiamen University","ror":"https://ror.org/00mcjh785","country_code":"CN","type":"education","lineage":["https://openalex.org/I191208505"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lin Li","raw_affiliation_strings":["Xiamen University,School of Electronic Science and Engineering,China"],"affiliations":[{"raw_affiliation_string":"Xiamen University,School of Electronic Science and Engineering,China","institution_ids":["https://openalex.org/I191208505"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5011997254","display_name":"Qingyang Hong","orcid":"https://orcid.org/0000-0001-7380-8690"},"institutions":[{"id":"https://openalex.org/I191208505","display_name":"Xiamen University","ror":"https://ror.org/00mcjh785","country_code":"CN","type":"education","lineage":["https://openalex.org/I191208505"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qingyang Hong","raw_affiliation_strings":["Xiamen University,School of Informatics,China"],"affiliations":[{"raw_affiliation_string":"Xiamen University,School of Informatics,China","institution_ids":["https://openalex.org/I191208505"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5109692702"],"corresponding_institution_ids":["https://openalex.org/I191208505"],"apc_list":null,"apc_paid":null,"fwci":0.7274,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.78373592,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"30","last_page":"36"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9972000122070312,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9951000213623047,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7816150188446045},{"id":"https://openalex.org/keywords/code-switching","display_name":"Code-switching","score":0.7627357244491577},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6696460843086243},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.4856361448764801},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.33591973781585693},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.33172452449798584},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.23830446600914001},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.09774747490882874}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7816150188446045},{"id":"https://openalex.org/C18552078","wikidata":"https://www.wikidata.org/wiki/Q255615","display_name":"Code-switching","level":2,"score":0.7627357244491577},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6696460843086243},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.4856361448764801},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.33591973781585693},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.33172452449798584},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.23830446600914001},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.09774747490882874},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/slt61566.2024.10832265","is_oa":false,"landing_page_url":"https://doi.org/10.1109/slt61566.2024.10832265","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE Spoken Language Technology Workshop (SLT)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":36,"referenced_works":["https://openalex.org/W854541894","https://openalex.org/W1494198834","https://openalex.org/W2127141656","https://openalex.org/W2150884987","https://openalex.org/W2327501763","https://openalex.org/W2526425061","https://openalex.org/W2889124873","https://openalex.org/W2892009249","https://openalex.org/W2896558859","https://openalex.org/W2936774411","https://openalex.org/W2938792232","https://openalex.org/W2939069254","https://openalex.org/W2964156075","https://openalex.org/W2971840980","https://openalex.org/W2972384088","https://openalex.org/W2972954451","https://openalex.org/W2973082572","https://openalex.org/W3016010032","https://openalex.org/W3042170933","https://openalex.org/W3096032230","https://openalex.org/W3096122506","https://openalex.org/W3097777922","https://openalex.org/W3156323585","https://openalex.org/W4221167707","https://openalex.org/W4281770669","https://openalex.org/W4287391717","https://openalex.org/W4288408927","https://openalex.org/W4297841499","https://openalex.org/W4372269995","https://openalex.org/W4385822813","https://openalex.org/W4385822875","https://openalex.org/W4385823078","https://openalex.org/W6623517193","https://openalex.org/W6760937267","https://openalex.org/W6780815891","https://openalex.org/W6788811087"],"related_works":["https://openalex.org/W2771594921","https://openalex.org/W2432897346","https://openalex.org/W2181336723","https://openalex.org/W4389976243","https://openalex.org/W3158134258","https://openalex.org/W3138119129","https://openalex.org/W2940588741","https://openalex.org/W2293063924","https://openalex.org/W2974240475","https://openalex.org/W3204019825"],"abstract_inverted_index":{"Due":[0],"to":[1,63,84,105,125],"the":[2,64,89,115,132],"inherent":[3],"difficulty":[4],"in":[5],"modeling":[6],"phonetic":[7],"similarities":[8],"across":[9],"different":[10],"languages,":[11],"code-switching":[12],"speech":[13],"recognition":[14],"presents":[15],"a":[16,22,24,32,39,100],"formidable":[17],"challenge.":[18],"This":[19,57],"study":[20],"proposes":[21],"Collaborative-MoE,":[23],"Mixture":[25],"of":[26,91,117,137],"Experts":[27],"(MoE)":[28],"model":[29],"that":[30],"leverages":[31],"collaborative":[33],"mechanism":[34],"among":[35],"expert":[36,74,98],"groups.":[37],"Initially,":[38],"preceding":[40],"routing":[41,61],"network":[42,75,102],"explicitly":[43],"learns":[44],"Language":[45],"Identification":[46],"(LID)":[47],"tasks":[48],"and":[49],"selects":[50],"experts":[51],"based":[52],"on":[53,73,108],"acquired":[54],"LID":[55,79],"weights.":[56],"process":[58],"ensures":[59],"robust":[60],"information":[62],"MoE":[65,138],"layer,":[66],"mitigating":[67],"interference":[68],"from":[69],"diverse":[70],"language":[71,97],"domains":[72],"parameter":[76],"updates.":[77],"The":[78],"weights":[80],"are":[81],"also":[82],"employed":[83],"facilitate":[85],"inter-group":[86],"collaboration,":[87],"enabling":[88],"integration":[90],"language-specific":[92],"representations.":[93],"Furthermore,":[94],"within":[95],"each":[96],"group,":[99],"gating":[101],"operates":[103],"unsupervised":[104],"foster":[106],"collaboration":[107],"attributes":[109],"beyond":[110],"language.":[111],"Extensive":[112],"experiments":[113],"demonstrate":[114],"efficacy":[116],"our":[118,129],"approach,":[119],"achieving":[120],"significant":[121],"performance":[122],"enhancements":[123],"compared":[124],"alternative":[126],"methods.":[127],"Importantly,":[128],"method":[130],"preserves":[131],"efficient":[133],"inference":[134],"capabilities":[135],"characteristic":[136],"models":[139],"without":[140],"necessitating":[141],"additional":[142],"pre-training.":[143]},"counts_by_year":[{"year":2025,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
