{"id":"https://openalex.org/W7139928972","doi":"https://doi.org/10.1016/j.procs.2026.01.037","title":"Confidence Gated Fusion: Dynamic Language Model Integration for Adapting Pretrained Multilingual ASR Models with Text-Only Data","display_name":"Confidence Gated Fusion: Dynamic Language Model Integration for Adapting Pretrained Multilingual ASR Models with Text-Only Data","publication_year":2026,"publication_date":"2026-01-01","ids":{"openalex":"https://openalex.org/W7139928972","doi":"https://doi.org/10.1016/j.procs.2026.01.037"},"language":"en","primary_location":{"id":"doi:10.1016/j.procs.2026.01.037","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.procs.2026.01.037","pdf_url":null,"source":{"id":"https://openalex.org/S120348307","display_name":"Procedia Computer Science","issn_l":"1877-0509","issn":["1877-0509"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Procedia Computer Science","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://doi.org/10.1016/j.procs.2026.01.037","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5084315604","display_name":"Nader Essam","orcid":null},"institutions":[{"id":"https://openalex.org/I145487455","display_name":"Cairo University","ror":"https://ror.org/03q21mh05","country_code":"EG","type":"education","lineage":["https://openalex.org/I145487455"]}],"countries":["EG"],"is_corresponding":true,"raw_author_name":"Nader Essam","raw_affiliation_strings":["Faculty of Computers and Artificial Intelligence, Cairo University, Giza, Egypt"],"affiliations":[{"raw_affiliation_string":"Faculty of Computers and Artificial Intelligence, Cairo University, Giza, Egypt","institution_ids":["https://openalex.org/I145487455"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130228301","display_name":"Wael Ali","orcid":null},"institutions":[{"id":"https://openalex.org/I207547235","display_name":"Benha University","ror":"https://ror.org/03tn5ee41","country_code":"EG","type":"education","lineage":["https://openalex.org/I207547235"]}],"countries":["EG"],"is_corresponding":false,"raw_author_name":"Wael Ali","raw_affiliation_strings":["Faculty of Engineering at Benha, Benha University, Benha, Egypt"],"affiliations":[{"raw_affiliation_string":"Faculty of Engineering at Benha, Benha University, Benha, Egypt","institution_ids":["https://openalex.org/I207547235"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027622725","display_name":"Khaled Wassif","orcid":"https://orcid.org/0000-0002-7401-5219"},"institutions":[{"id":"https://openalex.org/I145487455","display_name":"Cairo University","ror":"https://ror.org/03q21mh05","country_code":"EG","type":"education","lineage":["https://openalex.org/I145487455"]}],"countries":["EG"],"is_corresponding":false,"raw_author_name":"Khaled Wassif","raw_affiliation_strings":["Faculty of Computers and Artificial Intelligence, Cairo University, Giza, Egypt"],"affiliations":[{"raw_affiliation_string":"Faculty of Computers and Artificial Intelligence, Cairo University, Giza, Egypt","institution_ids":["https://openalex.org/I145487455"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130216032","display_name":"Sherif Mahdy Abdou Essawy","orcid":null},"institutions":[{"id":"https://openalex.org/I145487455","display_name":"Cairo University","ror":"https://ror.org/03q21mh05","country_code":"EG","type":"education","lineage":["https://openalex.org/I145487455"]}],"countries":["EG"],"is_corresponding":false,"raw_author_name":"Sherif Mahdy Abdou Essawy","raw_affiliation_strings":["Faculty of Computers and Artificial Intelligence, Cairo University, Giza, Egypt"],"affiliations":[{"raw_affiliation_string":"Faculty of Computers and Artificial Intelligence, Cairo University, Giza, Egypt","institution_ids":["https://openalex.org/I145487455"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5130229986","display_name":"Hanaa Mobarz","orcid":null},"institutions":[{"id":"https://openalex.org/I145487455","display_name":"Cairo University","ror":"https://ror.org/03q21mh05","country_code":"EG","type":"education","lineage":["https://openalex.org/I145487455"]},{"id":"https://openalex.org/I186217134","display_name":"Future University in Egypt","ror":"https://ror.org/03s8c2x09","country_code":"EG","type":"education","lineage":["https://openalex.org/I186217134"]}],"countries":["EG"],"is_corresponding":false,"raw_author_name":"Hanaa Mobarz","raw_affiliation_strings":["Faculty of Computers and Artificial Intelligence, Cairo University, Giza, Egypt","Faculty of Computers and Information Technology, Future University, Cairo, Egypt"],"affiliations":[{"raw_affiliation_string":"Faculty of Computers and Artificial Intelligence, Cairo University, Giza, Egypt","institution_ids":["https://openalex.org/I145487455"]},{"raw_affiliation_string":"Faculty of Computers and Information Technology, Future University, Cairo, Egypt","institution_ids":["https://openalex.org/I186217134"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5084315604"],"corresponding_institution_ids":["https://openalex.org/I145487455"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.93188838,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":null,"biblio":{"volume":"275","issue":null,"first_page":"301","last_page":"308"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.5788999795913696,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.5788999795913696,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.14630000293254852,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.12880000472068787,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.6345000267028809},{"id":"https://openalex.org/keywords/language-understanding","display_name":"Language understanding","score":0.33410000801086426},{"id":"https://openalex.org/keywords/data-modeling","display_name":"Data modeling","score":0.29280000925064087},{"id":"https://openalex.org/keywords/dynamic-data","display_name":"Dynamic data","score":0.2881999909877777}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.9330999851226807},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.6345000267028809},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5530999898910522},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5306000113487244},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4456000030040741},{"id":"https://openalex.org/C2983448237","wikidata":"https://www.wikidata.org/wiki/Q1078276","display_name":"Language understanding","level":2,"score":0.33410000801086426},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.29280000925064087},{"id":"https://openalex.org/C197298091","wikidata":"https://www.wikidata.org/wiki/Q5318963","display_name":"Dynamic data","level":2,"score":0.2881999909877777},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2662000060081482},{"id":"https://openalex.org/C100463513","wikidata":"https://www.wikidata.org/wiki/Q5227322","display_name":"Data model (GIS)","level":2,"score":0.23280000686645508}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1016/j.procs.2026.01.037","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.procs.2026.01.037","pdf_url":null,"source":{"id":"https://openalex.org/S120348307","display_name":"Procedia Computer Science","issn_l":"1877-0509","issn":["1877-0509"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Procedia Computer Science","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1016/j.procs.2026.01.037","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.procs.2026.01.037","pdf_url":null,"source":{"id":"https://openalex.org/S120348307","display_name":"Procedia Computer Science","issn_l":"1877-0509","issn":["1877-0509"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Procedia Computer Science","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":9,"referenced_works":["https://openalex.org/W2577366047","https://openalex.org/W2766219058","https://openalex.org/W2799800213","https://openalex.org/W3008037978","https://openalex.org/W3198439131","https://openalex.org/W4297347714","https://openalex.org/W4322732039","https://openalex.org/W4388017359","https://openalex.org/W4404792897"],"related_works":[],"abstract_inverted_index":{"Pretrained":[0],"multilingual":[1],"End-to-End":[2],"(E2E)":[3],"Automatic":[4],"Speech":[5],"Recognition":[6],"(ASR)":[7],"models":[8,156],"demonstrate":[9],"remarkable":[10],"capabilities":[11],"but":[12],"struggle":[13],"with":[14,141],"domain-specific":[15,109],"terminologies":[16],"and":[17,102,121,153],"underrepresented":[18],"dialects.":[19],"Fine-tuning":[20],"requires":[21],"expensive":[22,71],"paired":[23],"audio-transcript":[24],"data,":[25],"creating":[26],"barriers":[27],"to":[28,113,133],"practical":[29],"adaptation.":[30],"This":[31],"paper":[32],"investigates":[33],"language":[34],"model":[35,67,89],"(LM)":[36],"integration":[37],"via":[38],"shallow":[39,78],"fusion":[40],"as":[41],"an":[42],"efficient,":[43],"text-only":[44],"adaptation":[45],"method.":[46],"We":[47,80],"introduce":[48],"Confidence":[49],"Gated":[50],"Fusion":[51],"(CGF),":[52],"a":[53,103,108],"novel":[54],"approach":[55,83],"that":[56],"dynamically":[57],"determines":[58],"the":[59,70,124],"LM":[60,110],"weight":[61],"during":[62],"decoding":[63],"based":[64],"on":[65,91,118,123,151,154],"ASR":[66],"uncertainty,":[68],"eliminating":[69],"validation-set-dependent":[72],"grid":[73],"search":[74],"required":[75],"by":[76],"traditional":[77],"fusion.":[79],"validate":[81],"our":[82],"using":[84],"OpenAI\u2019s":[85],"Whisper":[86],"across":[87],"multiple":[88],"sizes":[90],"Arabic":[92,97],"ASR,":[93],"evaluating":[94],"Modern":[95],"Standard":[96],"(MSA),":[98],"Egyptian":[99],"dialect":[100],"(EGY),":[101],"specialized":[104,145],"judiciary":[105,125],"domain.":[106,126],"Integrating":[107],"achieved":[111,130],"up":[112],"40.92%":[114],"relative":[115,148],"WER":[116,149],"reduction":[117,150],"dialectal":[119],"speech":[120],"32.96%":[122],"Our":[127],"CGF":[128],"method":[129],"comparable":[131],"performance":[132],"tuned":[134],"baselines":[135],"while":[136],"requiring":[137],"no":[138],"hyperparameter":[139],"optimization,":[140],"particular":[142],"advantages":[143],"in":[144],"domains":[146],"(28.92%":[147],"judiciary)":[152],"smaller":[155],"where":[157],"static":[158],"weights":[159],"often":[160],"lack":[161],"robustness.":[162]},"counts_by_year":[],"updated_date":"2026-03-22T06:25:25.174409","created_date":"2026-03-21T00:00:00"}
