{"id":"https://openalex.org/W4372259807","doi":"https://doi.org/10.1109/icassp49357.2023.10095469","title":"CB-Conformer: Contextual Biasing Conformer for Biased Word Recognition","display_name":"CB-Conformer: Contextual Biasing Conformer for Biased Word Recognition","publication_year":2023,"publication_date":"2023-05-05","ids":{"openalex":"https://openalex.org/W4372259807","doi":"https://doi.org/10.1109/icassp49357.2023.10095469"},"language":"en","primary_location":{"id":"doi:10.1109/icassp49357.2023.10095469","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49357.2023.10095469","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2023 - 2023 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5015396622","display_name":"Yaoxun Xu","orcid":null},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]},{"id":"https://openalex.org/I3131625388","display_name":"University Town of Shenzhen","ror":"https://ror.org/05f5j6225","country_code":"CN","type":"education","lineage":["https://openalex.org/I3131625388"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yaoxun Xu","raw_affiliation_strings":["Tsinghua University,Shenzhen International Graduate School,Shenzhen,China","Shenzhen International Graduate School, Tsinghua University, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University,Shenzhen International Graduate School,Shenzhen,China","institution_ids":["https://openalex.org/I99065089"]},{"raw_affiliation_string":"Shenzhen International Graduate School, Tsinghua University, Shenzhen, China","institution_ids":["https://openalex.org/I3131625388","https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010728849","display_name":"Baiji Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210152717","display_name":"Mavenir (Israel)","ror":"https://ror.org/0507wc250","country_code":"IL","type":"company","lineage":["https://openalex.org/I4210152717"]}],"countries":["IL"],"is_corresponding":false,"raw_author_name":"Baiji Liu","raw_affiliation_strings":["XVerse Inc,Shenzhen,China","XVerse Inc, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"XVerse Inc,Shenzhen,China","institution_ids":["https://openalex.org/I4210152717"]},{"raw_affiliation_string":"XVerse Inc, Shenzhen, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008169830","display_name":"Qiaochu Huang","orcid":"https://orcid.org/0009-0004-8113-6459"},"institutions":[{"id":"https://openalex.org/I3131625388","display_name":"University Town of Shenzhen","ror":"https://ror.org/05f5j6225","country_code":"CN","type":"education","lineage":["https://openalex.org/I3131625388"]},{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qiaochu Huang","raw_affiliation_strings":["Tsinghua University,Shenzhen International Graduate School,Shenzhen,China","Shenzhen International Graduate School, Tsinghua University, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University,Shenzhen International Graduate School,Shenzhen,China","institution_ids":["https://openalex.org/I99065089"]},{"raw_affiliation_string":"Shenzhen International Graduate School, Tsinghua University, Shenzhen, China","institution_ids":["https://openalex.org/I3131625388","https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074833963","display_name":"Xingchen Song","orcid":"https://orcid.org/0009-0009-9516-5361"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]},{"id":"https://openalex.org/I3131625388","display_name":"University Town of Shenzhen","ror":"https://ror.org/05f5j6225","country_code":"CN","type":"education","lineage":["https://openalex.org/I3131625388"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xingchen Song","raw_affiliation_strings":["Tsinghua University,Shenzhen International Graduate School,Shenzhen,China","Shenzhen International Graduate School, Tsinghua University, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University,Shenzhen International Graduate School,Shenzhen,China","institution_ids":["https://openalex.org/I99065089"]},{"raw_affiliation_string":"Shenzhen International Graduate School, Tsinghua University, Shenzhen, China","institution_ids":["https://openalex.org/I3131625388","https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102869280","display_name":"Zhiyong Wu","orcid":"https://orcid.org/0000-0001-8533-0524"},"institutions":[{"id":"https://openalex.org/I4210136793","display_name":"Peng Cheng Laboratory","ror":"https://ror.org/03qdqbt06","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210136793"]},{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633"]},{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]},{"id":"https://openalex.org/I3131625388","display_name":"University Town of Shenzhen","ror":"https://ror.org/05f5j6225","country_code":"CN","type":"education","lineage":["https://openalex.org/I3131625388"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhiyong Wu","raw_affiliation_strings":["Tsinghua University,Shenzhen International Graduate School,Shenzhen,China","Shenzhen International Graduate School, Tsinghua University, Shenzhen, China","The Chinese University of Hong Kong, Hong Kong SAR, China","Peng Cheng Lab, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University,Shenzhen International Graduate School,Shenzhen,China","institution_ids":["https://openalex.org/I99065089"]},{"raw_affiliation_string":"Shenzhen International Graduate School, Tsinghua University, Shenzhen, China","institution_ids":["https://openalex.org/I3131625388","https://openalex.org/I99065089"]},{"raw_affiliation_string":"The Chinese University of Hong Kong, Hong Kong SAR, China","institution_ids":["https://openalex.org/I177725633"]},{"raw_affiliation_string":"Peng Cheng Lab, Shenzhen, China","institution_ids":["https://openalex.org/I4210136793"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083463839","display_name":"Shiyin Kang","orcid":"https://orcid.org/0000-0001-8304-5260"},"institutions":[{"id":"https://openalex.org/I4210152717","display_name":"Mavenir (Israel)","ror":"https://ror.org/0507wc250","country_code":"IL","type":"company","lineage":["https://openalex.org/I4210152717"]}],"countries":["IL"],"is_corresponding":false,"raw_author_name":"Shiyin Kang","raw_affiliation_strings":["XVerse Inc,Shenzhen,China","XVerse Inc, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"XVerse Inc,Shenzhen,China","institution_ids":["https://openalex.org/I4210152717"]},{"raw_affiliation_string":"XVerse Inc, Shenzhen, China","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5019458385","display_name":"Helen Meng","orcid":"https://orcid.org/0000-0002-4427-3532"},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Helen Meng","raw_affiliation_strings":["The Chinese University of Hong Kong,Hong Kong SAR,China","The Chinese University of Hong Kong, Hong Kong SAR, China"],"affiliations":[{"raw_affiliation_string":"The Chinese University of Hong Kong,Hong Kong SAR,China","institution_ids":["https://openalex.org/I177725633"]},{"raw_affiliation_string":"The Chinese University of Hong Kong, Hong Kong SAR, China","institution_ids":["https://openalex.org/I177725633"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5015396622"],"corresponding_institution_ids":["https://openalex.org/I3131625388","https://openalex.org/I99065089"],"apc_list":null,"apc_paid":null,"fwci":1.2166,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.82781598,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.749970555305481},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.6600707173347473},{"id":"https://openalex.org/keywords/biasing","display_name":"Biasing","score":0.6570928692817688},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.6497114300727844},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5835519433021545},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5538250803947449},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5300678610801697},{"id":"https://openalex.org/keywords/word-error-rate","display_name":"Word error rate","score":0.5270441174507141},{"id":"https://openalex.org/keywords/precision-and-recall","display_name":"Precision and recall","score":0.5248416066169739},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5144384503364563},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.4851565957069397},{"id":"https://openalex.org/keywords/recall","display_name":"Recall","score":0.44692322611808777},{"id":"https://openalex.org/keywords/conformational-isomerism","display_name":"Conformational isomerism","score":0.4118383526802063},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.1677328646183014},{"id":"https://openalex.org/keywords/cognitive-psychology","display_name":"Cognitive psychology","score":0.16485583782196045},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.15349560976028442},{"id":"https://openalex.org/keywords/voltage","display_name":"Voltage","score":0.10214495658874512}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.749970555305481},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.6600707173347473},{"id":"https://openalex.org/C20254490","wikidata":"https://www.wikidata.org/wiki/Q719550","display_name":"Biasing","level":3,"score":0.6570928692817688},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.6497114300727844},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5835519433021545},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5538250803947449},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5300678610801697},{"id":"https://openalex.org/C40969351","wikidata":"https://www.wikidata.org/wiki/Q3516228","display_name":"Word error rate","level":2,"score":0.5270441174507141},{"id":"https://openalex.org/C81669768","wikidata":"https://www.wikidata.org/wiki/Q2359161","display_name":"Precision and recall","level":2,"score":0.5248416066169739},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5144384503364563},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.4851565957069397},{"id":"https://openalex.org/C100660578","wikidata":"https://www.wikidata.org/wiki/Q18733","display_name":"Recall","level":2,"score":0.44692322611808777},{"id":"https://openalex.org/C18705241","wikidata":"https://www.wikidata.org/wiki/Q1128023","display_name":"Conformational isomerism","level":3,"score":0.4118383526802063},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.1677328646183014},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.16485583782196045},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.15349560976028442},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.10214495658874512},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C178790620","wikidata":"https://www.wikidata.org/wiki/Q11351","display_name":"Organic chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C32909587","wikidata":"https://www.wikidata.org/wiki/Q11369","display_name":"Molecule","level":2,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp49357.2023.10095469","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49357.2023.10095469","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2023 - 2023 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W2046932483","https://openalex.org/W2962760690","https://openalex.org/W2963240019","https://openalex.org/W2963364041","https://openalex.org/W2972625221","https://openalex.org/W3006752097","https://openalex.org/W3008174054","https://openalex.org/W3015927303","https://openalex.org/W3097777922","https://openalex.org/W3140235797","https://openalex.org/W3152221657","https://openalex.org/W3163462603","https://openalex.org/W3197478142","https://openalex.org/W3197661863","https://openalex.org/W3198439131","https://openalex.org/W3202725408","https://openalex.org/W3203407300","https://openalex.org/W3205201903","https://openalex.org/W3211278025","https://openalex.org/W4220871331","https://openalex.org/W4224918838","https://openalex.org/W4225289150","https://openalex.org/W4319862695","https://openalex.org/W4385245566","https://openalex.org/W6739901393","https://openalex.org/W6810422493"],"related_works":["https://openalex.org/W2594897229","https://openalex.org/W2151348424","https://openalex.org/W4221142855","https://openalex.org/W2050138804","https://openalex.org/W2129812225","https://openalex.org/W4290708361","https://openalex.org/W2523799048","https://openalex.org/W2155620340","https://openalex.org/W1494910745","https://openalex.org/W2114358883"],"abstract_inverted_index":{"Due":[0],"to":[1,11,18,55,67,83],"the":[2,5,14,20,23,29,74,79,102,110,135,141,188],"mismatch":[3],"between":[4],"source":[6],"and":[7,58,78,93,120,130,150,179],"target":[8,30],"domains,":[9],"how":[10],"better":[12],"utilize":[13],"biased":[15,69,114,128,175,182],"word":[16,70,176,183],"information":[17],"improve":[19,68],"performance":[21],"of":[22,101,113],"automatic":[24,136],"speech":[25,137],"recognition":[26,71,138],"model":[27,46,99,139],"in":[28,123],"domain":[31],"becomes":[32],"a":[33,42,49,124,167,173,180],"hot":[34],"research":[35],"topic.":[36],"Previous":[37],"approaches":[38],"either":[39],"decode":[40],"with":[41,96,134,187],"fixed":[43,143],"external":[44],"language":[45,144],"or":[47],"introduce":[48],"sizeable":[50],"biasing":[51],"module,":[52],"which":[53],"leads":[54],"poor":[56],"adaptability":[57],"slow":[59],"inference.":[60],"In":[61,146],"this":[62],"work,":[63],"we":[64,148],"propose":[65],"CB-Conformer":[66],"by":[72],"introducing":[73],"Contextual":[75,87],"Biasing":[76,88],"Module":[77,89],"Self-Adaptive":[80,106],"Language":[81,107],"Model":[82,108],"vanilla":[84],"Conformer.":[85,104,190],"The":[86,105],"combines":[90],"audio":[91],"fragments":[92],"contextual":[94],"information,":[95],"only":[97],"0.2%":[98],"parameters":[100],"original":[103],"modifies":[109],"internal":[111],"weights":[112],"words":[115,129],"based":[116,157],"on":[117,127,158],"their":[118],"recall":[119,177],"precision,":[121],"resulting":[122],"greater":[125],"focus":[126],"more":[131],"successful":[132],"integration":[133],"than":[140],"standard":[142],"model.":[145],"addition,":[147],"construct":[149],"release":[151],"an":[152],"open-source":[153],"Mandarin":[154],"biased-word":[155],"dataset":[156],"WenetSpeech.":[159],"Experiments":[160],"indicate":[161],"that":[162],"our":[163],"proposed":[164],"method":[165],"brings":[166],"15.34%":[168],"character":[169],"error":[170],"rate":[171],"reduction,":[172],"14.13%":[174],"increase,":[178],"6.80%":[181],"F1-score":[184],"increase":[185],"compared":[186],"base":[189]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":2}],"updated_date":"2026-04-03T22:45:19.894376","created_date":"2025-10-10T00:00:00"}
