{"id":"https://openalex.org/W3217003515","doi":"https://doi.org/10.1109/icassp43922.2022.9747537","title":"Joint Modeling of Code-Switched and Monolingual ASR via Conditional Factorization","display_name":"Joint Modeling of Code-Switched and Monolingual ASR via Conditional Factorization","publication_year":2022,"publication_date":"2022-04-27","ids":{"openalex":"https://openalex.org/W3217003515","doi":"https://doi.org/10.1109/icassp43922.2022.9747537","mag":"3217003515"},"language":"en","primary_location":{"id":"doi:10.1109/icassp43922.2022.9747537","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp43922.2022.9747537","pdf_url":null,"source":{"id":"https://openalex.org/S4363607702","display_name":"ICASSP 2022 - 2022 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2022 - 2022 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5021201726","display_name":"Brian Yan","orcid":null},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Brian Yan","raw_affiliation_strings":["Carnegie Mellon University,USA","Carnegie Mellon University, USA"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University,USA","institution_ids":["https://openalex.org/I74973139"]},{"raw_affiliation_string":"Carnegie Mellon University, USA","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005304261","display_name":"Chunlei Zhang","orcid":"https://orcid.org/0000-0002-3851-2357"},"institutions":[{"id":"https://openalex.org/I70745867","display_name":"KLA (United States)","ror":"https://ror.org/02rqhpa98","country_code":"US","type":"company","lineage":["https://openalex.org/I70745867"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Chunlei Zhang","raw_affiliation_strings":["Tencent AI Lab,USA","Tencent AI Lab, USA"],"affiliations":[{"raw_affiliation_string":"Tencent AI Lab,USA","institution_ids":["https://openalex.org/I70745867"]},{"raw_affiliation_string":"Tencent AI Lab, USA","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100770786","display_name":"Meng Yu","orcid":"https://orcid.org/0000-0003-2554-2888"},"institutions":[{"id":"https://openalex.org/I70745867","display_name":"KLA (United States)","ror":"https://ror.org/02rqhpa98","country_code":"US","type":"company","lineage":["https://openalex.org/I70745867"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Meng Yu","raw_affiliation_strings":["Tencent AI Lab,USA","Tencent AI Lab, USA"],"affiliations":[{"raw_affiliation_string":"Tencent AI Lab,USA","institution_ids":["https://openalex.org/I70745867"]},{"raw_affiliation_string":"Tencent AI Lab, USA","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101785327","display_name":"Shi-Xiong Zhang","orcid":"https://orcid.org/0009-0007-7803-2407"},"institutions":[{"id":"https://openalex.org/I70745867","display_name":"KLA (United States)","ror":"https://ror.org/02rqhpa98","country_code":"US","type":"company","lineage":["https://openalex.org/I70745867"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Shi-Xiong Zhang","raw_affiliation_strings":["Tencent AI Lab,USA","Tencent AI Lab, USA"],"affiliations":[{"raw_affiliation_string":"Tencent AI Lab,USA","institution_ids":["https://openalex.org/I70745867"]},{"raw_affiliation_string":"Tencent AI Lab, USA","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068873086","display_name":"Siddharth Dalmia","orcid":"https://orcid.org/0000-0003-0437-5988"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Siddharth Dalmia","raw_affiliation_strings":["Carnegie Mellon University,USA","Carnegie Mellon University, USA"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University,USA","institution_ids":["https://openalex.org/I74973139"]},{"raw_affiliation_string":"Carnegie Mellon University, USA","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024324721","display_name":"Dan Berrebbi","orcid":null},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Dan Berrebbi","raw_affiliation_strings":["Carnegie Mellon University,USA","Carnegie Mellon University, USA"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University,USA","institution_ids":["https://openalex.org/I74973139"]},{"raw_affiliation_string":"Carnegie Mellon University, USA","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5106404246","display_name":"Chao Weng","orcid":null},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chao Weng","raw_affiliation_strings":["Tencent AI Lab,China","Tencent AI Lab, China"],"affiliations":[{"raw_affiliation_string":"Tencent AI Lab,China","institution_ids":["https://openalex.org/I2250653659"]},{"raw_affiliation_string":"Tencent AI Lab, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001291873","display_name":"Shinji Watanabe","orcid":"https://orcid.org/0000-0002-5970-8631"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Shinji Watanabe","raw_affiliation_strings":["Carnegie Mellon University,USA","Carnegie Mellon University, USA"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University,USA","institution_ids":["https://openalex.org/I74973139"]},{"raw_affiliation_string":"Carnegie Mellon University, USA","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5034476404","display_name":"Dong Yu","orcid":"https://orcid.org/0000-0003-0520-6844"},"institutions":[{"id":"https://openalex.org/I70745867","display_name":"KLA (United States)","ror":"https://ror.org/02rqhpa98","country_code":"US","type":"company","lineage":["https://openalex.org/I70745867"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Dong Yu","raw_affiliation_strings":["Tencent AI Lab,USA","Tencent AI Lab, USA"],"affiliations":[{"raw_affiliation_string":"Tencent AI Lab,USA","institution_ids":["https://openalex.org/I70745867"]},{"raw_affiliation_string":"Tencent AI Lab, USA","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5021201726"],"corresponding_institution_ids":["https://openalex.org/I74973139"],"apc_list":null,"apc_paid":null,"fwci":1.1434,"has_fulltext":false,"cited_by_count":11,"citation_normalized_percentile":{"value":0.7918552,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"6412","last_page":"6416"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8252497911453247},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.6478205919265747},{"id":"https://openalex.org/keywords/joint","display_name":"Joint (building)","score":0.573533296585083},{"id":"https://openalex.org/keywords/frame","display_name":"Frame (networking)","score":0.570501446723938},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5514130592346191},{"id":"https://openalex.org/keywords/synchronization","display_name":"Synchronization (alternating current)","score":0.5286106467247009},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.49389082193374634},{"id":"https://openalex.org/keywords/factorization","display_name":"Factorization","score":0.4714297652244568},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4417656660079956},{"id":"https://openalex.org/keywords/code-switching","display_name":"Code-switching","score":0.414181113243103},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.17997294664382935},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.13304725289344788},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.0891348123550415},{"id":"https://openalex.org/keywords/channel","display_name":"Channel (broadcasting)","score":0.06189310550689697}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8252497911453247},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.6478205919265747},{"id":"https://openalex.org/C18555067","wikidata":"https://www.wikidata.org/wiki/Q8375051","display_name":"Joint (building)","level":2,"score":0.573533296585083},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.570501446723938},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5514130592346191},{"id":"https://openalex.org/C2778562939","wikidata":"https://www.wikidata.org/wiki/Q1298791","display_name":"Synchronization (alternating current)","level":3,"score":0.5286106467247009},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.49389082193374634},{"id":"https://openalex.org/C187834632","wikidata":"https://www.wikidata.org/wiki/Q188804","display_name":"Factorization","level":2,"score":0.4714297652244568},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4417656660079956},{"id":"https://openalex.org/C18552078","wikidata":"https://www.wikidata.org/wiki/Q255615","display_name":"Code-switching","level":2,"score":0.414181113243103},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.17997294664382935},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.13304725289344788},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0891348123550415},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.06189310550689697},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0},{"id":"https://openalex.org/C170154142","wikidata":"https://www.wikidata.org/wiki/Q150737","display_name":"Architectural engineering","level":1,"score":0.0},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp43922.2022.9747537","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp43922.2022.9747537","pdf_url":null,"source":{"id":"https://openalex.org/S4363607702","display_name":"ICASSP 2022 - 2022 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2022 - 2022 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.7599999904632568}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":64,"referenced_works":["https://openalex.org/W308745112","https://openalex.org/W1524333225","https://openalex.org/W1543365580","https://openalex.org/W1828163288","https://openalex.org/W2049032416","https://openalex.org/W2064675550","https://openalex.org/W2084543186","https://openalex.org/W2114569717","https://openalex.org/W2127141656","https://openalex.org/W2130466720","https://openalex.org/W2176263492","https://openalex.org/W2345986601","https://openalex.org/W2578893474","https://openalex.org/W2740286348","https://openalex.org/W2766219058","https://openalex.org/W2789353687","https://openalex.org/W2798348125","https://openalex.org/W2809978471","https://openalex.org/W2811159785","https://openalex.org/W2891616026","https://openalex.org/W2899073901","https://openalex.org/W2936774411","https://openalex.org/W2938792232","https://openalex.org/W2939069254","https://openalex.org/W2939111082","https://openalex.org/W2939757332","https://openalex.org/W2948974868","https://openalex.org/W2962704885","https://openalex.org/W2962780374","https://openalex.org/W2962784628","https://openalex.org/W2963248296","https://openalex.org/W2963431393","https://openalex.org/W2964002616","https://openalex.org/W2970776961","https://openalex.org/W2972702443","https://openalex.org/W2989224798","https://openalex.org/W3015615177","https://openalex.org/W3025165719","https://openalex.org/W3029522047","https://openalex.org/W3042170933","https://openalex.org/W3096032230","https://openalex.org/W3096122506","https://openalex.org/W3097306574","https://openalex.org/W3097777922","https://openalex.org/W3160201895","https://openalex.org/W3163793923","https://openalex.org/W3178647810","https://openalex.org/W3196485121","https://openalex.org/W4240060192","https://openalex.org/W4288408927","https://openalex.org/W6610887377","https://openalex.org/W6631362777","https://openalex.org/W6638575559","https://openalex.org/W6638749077","https://openalex.org/W6685322675","https://openalex.org/W6732557975","https://openalex.org/W6755193724","https://openalex.org/W6755461288","https://openalex.org/W6756296142","https://openalex.org/W6760937267","https://openalex.org/W6770250107","https://openalex.org/W6777856084","https://openalex.org/W6780815891","https://openalex.org/W6797726355"],"related_works":["https://openalex.org/W2771594921","https://openalex.org/W2432897346","https://openalex.org/W2181336723","https://openalex.org/W4389976243","https://openalex.org/W3158134258","https://openalex.org/W3138119129","https://openalex.org/W2940588741","https://openalex.org/W2293063924","https://openalex.org/W2974240475","https://openalex.org/W2379610230"],"abstract_inverted_index":{"Conversational":[0],"bilingual":[1,38,61,102],"speech":[2,39,104],"encompasses":[3],"three":[4],"types":[5,11],"of":[6,30,97],"utterances:":[7],"two":[8],"purely":[9],"monolingual":[10,32,44,74,108],"and":[12,33,109],"one":[13],"intra-sententially":[14],"code-switched":[15,110],"type.":[16],"In":[17],"this":[18,79],"work,":[19],"we":[20],"propose":[21],"a":[22],"general":[23],"framework":[24,52,83],"to":[25],"jointly":[26],"model":[27,100],"the":[28,31,43,59,95],"likelihoods":[29],"code-switch":[34],"sub-tasks":[35,45],"that":[36,58,78],"comprise":[37],"recognition.":[40],"By":[41],"defining":[42],"with":[46],"label-to-frame":[47],"synchronization,":[48],"our":[49,98],"joint":[50,82],"modeling":[51],"can":[53,84],"be":[54,68,85],"conditionally":[55,80],"factorized":[56,81],"such":[57],"final":[60],"output,":[62],"which":[63],"may":[64,66],"or":[65],"not":[67],"code-switched,":[69],"is":[70],"obtained":[71],"given":[72],"only":[73],"information.":[75],"We":[76,93],"show":[77],"modeled":[86],"by":[87],"an":[88],"end-to-end":[89],"differentiable":[90],"neural":[91],"network.":[92],"demonstrate":[94],"efficacy":[96],"proposed":[99],"on":[101],"Mandarin-English":[103],"recognition":[105],"across":[106],"both":[107],"corpora.":[111]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":4}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
