{"id":"https://openalex.org/W4403869528","doi":"https://doi.org/10.3390/make6040120","title":"Lexical Error Guard: Leveraging Large Language Models for Enhanced ASR Error Correction","display_name":"Lexical Error Guard: Leveraging Large Language Models for Enhanced ASR Error Correction","publication_year":2024,"publication_date":"2024-10-29","ids":{"openalex":"https://openalex.org/W4403869528","doi":"https://doi.org/10.3390/make6040120"},"language":"en","primary_location":{"id":"doi:10.3390/make6040120","is_oa":true,"landing_page_url":"https://doi.org/10.3390/make6040120","pdf_url":"https://www.mdpi.com/2504-4990/6/4/120/pdf?version=1730205508","source":{"id":"https://openalex.org/S4210213891","display_name":"Machine Learning and Knowledge Extraction","issn_l":"2504-4990","issn":["2504-4990"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Machine Learning and Knowledge Extraction","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.mdpi.com/2504-4990/6/4/120/pdf?version=1730205508","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5008865789","display_name":"Mei Si","orcid":"https://orcid.org/0000-0001-8642-8806"},"institutions":[{"id":"https://openalex.org/I165799507","display_name":"Rensselaer Polytechnic Institute","ror":"https://ror.org/01rtyzb94","country_code":"US","type":"education","lineage":["https://openalex.org/I165799507"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Mei Si","raw_affiliation_strings":["Department of Cognitive Science, Rensselaer Polytechnic Institute, Troy, NY 12180, USA"],"raw_orcid":"https://orcid.org/0000-0001-8642-8806","affiliations":[{"raw_affiliation_string":"Department of Cognitive Science, Rensselaer Polytechnic Institute, Troy, NY 12180, USA","institution_ids":["https://openalex.org/I165799507"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114446297","display_name":"Omar Cobas","orcid":null},"institutions":[{"id":"https://openalex.org/I165799507","display_name":"Rensselaer Polytechnic Institute","ror":"https://ror.org/01rtyzb94","country_code":"US","type":"education","lineage":["https://openalex.org/I165799507"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Omar Cobas","raw_affiliation_strings":["Department of Cognitive Science, Rensselaer Polytechnic Institute, Troy, NY 12180, USA","Department of Computer Science, Rensselaer Polytechnic Institute, Troy, NY 12180, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Cognitive Science, Rensselaer Polytechnic Institute, Troy, NY 12180, USA","institution_ids":["https://openalex.org/I165799507"]},{"raw_affiliation_string":"Department of Computer Science, Rensselaer Polytechnic Institute, Troy, NY 12180, USA","institution_ids":["https://openalex.org/I165799507"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5114446298","display_name":"Michael Fababeir","orcid":null},"institutions":[{"id":"https://openalex.org/I165799507","display_name":"Rensselaer Polytechnic Institute","ror":"https://ror.org/01rtyzb94","country_code":"US","type":"education","lineage":["https://openalex.org/I165799507"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Michael Fababeir","raw_affiliation_strings":["Department of Cognitive Science, Rensselaer Polytechnic Institute, Troy, NY 12180, USA","Department of Computer Science, Rensselaer Polytechnic Institute, Troy, NY 12180, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Cognitive Science, Rensselaer Polytechnic Institute, Troy, NY 12180, USA","institution_ids":["https://openalex.org/I165799507"]},{"raw_affiliation_string":"Department of Computer Science, Rensselaer Polytechnic Institute, Troy, NY 12180, USA","institution_ids":["https://openalex.org/I165799507"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5008865789"],"corresponding_institution_ids":["https://openalex.org/I165799507"],"apc_list":{"value":1400,"currency":"CHF","value_usd":1515},"apc_paid":{"value":1400,"currency":"CHF","value_usd":1515},"fwci":0.6508,"has_fulltext":true,"cited_by_count":2,"citation_normalized_percentile":{"value":0.75616257,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":96},"biblio":{"volume":"6","issue":"4","first_page":"2435","last_page":"2446"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7660396099090576},{"id":"https://openalex.org/keywords/guard","display_name":"Guard (computer science)","score":0.6981226801872253},{"id":"https://openalex.org/keywords/error-detection-and-correction","display_name":"Error detection and correction","score":0.6212997436523438},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5025613307952881},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4851711392402649},{"id":"https://openalex.org/keywords/error-analysis","display_name":"Error analysis","score":0.42364221811294556},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.36542218923568726},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.2516319155693054},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.20996850728988647},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.08700883388519287}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7660396099090576},{"id":"https://openalex.org/C141141315","wikidata":"https://www.wikidata.org/wiki/Q2379942","display_name":"Guard (computer science)","level":2,"score":0.6981226801872253},{"id":"https://openalex.org/C103088060","wikidata":"https://www.wikidata.org/wiki/Q1062839","display_name":"Error detection and correction","level":2,"score":0.6212997436523438},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5025613307952881},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4851711392402649},{"id":"https://openalex.org/C3018824978","wikidata":"https://www.wikidata.org/wiki/Q2894891","display_name":"Error analysis","level":2,"score":0.42364221811294556},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.36542218923568726},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.2516319155693054},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.20996850728988647},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.08700883388519287},{"id":"https://openalex.org/C28826006","wikidata":"https://www.wikidata.org/wiki/Q33521","display_name":"Applied mathematics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.3390/make6040120","is_oa":true,"landing_page_url":"https://doi.org/10.3390/make6040120","pdf_url":"https://www.mdpi.com/2504-4990/6/4/120/pdf?version=1730205508","source":{"id":"https://openalex.org/S4210213891","display_name":"Machine Learning and Knowledge Extraction","issn_l":"2504-4990","issn":["2504-4990"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Machine Learning and Knowledge Extraction","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:64b3c367946b4d8a859eba821ff4e19d","is_oa":false,"landing_page_url":"https://doaj.org/article/64b3c367946b4d8a859eba821ff4e19d","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Machine Learning and Knowledge Extraction, Vol 6, Iss 4, Pp 2435-2446 (2024)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.3390/make6040120","is_oa":true,"landing_page_url":"https://doi.org/10.3390/make6040120","pdf_url":"https://www.mdpi.com/2504-4990/6/4/120/pdf?version=1730205508","source":{"id":"https://openalex.org/S4210213891","display_name":"Machine Learning and Knowledge Extraction","issn_l":"2504-4990","issn":["2504-4990"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Machine Learning and Knowledge Extraction","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.75}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4403869528.pdf","grobid_xml":"https://content.openalex.org/works/W4403869528.grobid-xml"},"referenced_works_count":19,"referenced_works":["https://openalex.org/W38194800","https://openalex.org/W1494198834","https://openalex.org/W3024308166","https://openalex.org/W3034775979","https://openalex.org/W3036601975","https://openalex.org/W3097777922","https://openalex.org/W3158699857","https://openalex.org/W3197797812","https://openalex.org/W4200629210","https://openalex.org/W4221160683","https://openalex.org/W4292779060","https://openalex.org/W4311000453","https://openalex.org/W4385822949","https://openalex.org/W4385823363","https://openalex.org/W4391021773","https://openalex.org/W4392931626","https://openalex.org/W4402112422","https://openalex.org/W6778883912","https://openalex.org/W6780218876"],"related_works":["https://openalex.org/W4254637722","https://openalex.org/W2980401999","https://openalex.org/W3016483420","https://openalex.org/W2331628363","https://openalex.org/W2393030234","https://openalex.org/W2379730136","https://openalex.org/W2380243770","https://openalex.org/W2377495875","https://openalex.org/W2390973415","https://openalex.org/W2074837817"],"abstract_inverted_index":{"Error":[0,43],"correction":[1,19,66],"is":[2,21,78],"a":[3,74,119],"vital":[4],"element":[5],"in":[6,114],"modern":[7],"automatic":[8],"speech":[9],"recognition":[10],"(ASR)":[11],"systems.":[12],"A":[13],"significant":[14],"portion":[15],"of":[16,52,89],"ASR":[17,26,37,71,104],"error":[18,65],"work":[20],"closely":[22],"integrated":[23],"within":[24],"specific":[25],"systems,":[27],"which":[28,46],"creates":[29],"challenges":[30],"for":[31,130,142],"adapting":[32],"these":[33],"solutions":[34],"to":[35,61,85,123,153],"different":[36],"frameworks.":[38],"This":[39],"research":[40],"introduces":[41],"Lexical":[42],"Guard":[44],"(LEG),":[45],"leverages":[47],"the":[48,90,94,98,126,138],"extensive":[49],"pre-trained":[50],"knowledge":[51],"large":[53],"language":[54],"models":[55],"(LLMs)":[56],"and":[57],"employs":[58],"instructional":[59],"learning":[60],"create":[62],"an":[63],"adaptable":[64],"system":[67],"compatible":[68],"with":[69,108,118,133,145],"various":[70,109],"platforms.":[72],"Additionally,":[73],"parameter-efficient":[75],"fine-tuning":[76],"method":[77],"utilized":[79],"using":[80],"quantized":[81],"low-rank":[82],"adaptation":[83],"(QLoRA)":[84],"facilitate":[86],"fast":[87],"training":[88],"system.":[91],"Tested":[92],"on":[93,125,137],"LibriSpeech":[95],"data":[96],"corpus,":[97],"results":[99,105],"indicate":[100],"that":[101],"LEG":[102],"improves":[103],"when":[106],"used":[107],"Whisper":[110,131,143],"model":[111],"sizes.":[112],"Improvements":[113,136],"WER":[115],"are":[116,148],"made,":[117,150],"decrease":[120],"from":[121,151],"2.27%":[122],"2.21%":[124],"\u201cTest":[127,139],"Clean\u201d":[128],"dataset":[129,141],"Large":[132,144],"beam":[134,146],"search.":[135],"Other\u201d":[140],"search":[147],"also":[149],"4.93%":[152],"4.72%.":[154]},"counts_by_year":[{"year":2025,"cited_by_count":2}],"updated_date":"2026-05-06T08:25:59.206177","created_date":"2025-10-10T00:00:00"}
