{"id":"https://openalex.org/W4408358330","doi":"https://doi.org/10.1109/access.2025.3550855","title":"Advancements in Speech Recognition: A Systematic Review of Deep Learning Transformer Models, Trends, Innovations, and Future Directions","display_name":"Advancements in Speech Recognition: A Systematic Review of Deep Learning Transformer Models, Trends, Innovations, and Future Directions","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4408358330","doi":"https://doi.org/10.1109/access.2025.3550855"},"language":"en","primary_location":{"id":"doi:10.1109/access.2025.3550855","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2025.3550855","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"review","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1109/access.2025.3550855","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5070704695","display_name":"Yousef Sharrab","orcid":"https://orcid.org/0000-0002-8710-7999"},"institutions":[{"id":"https://openalex.org/I92449659","display_name":"Isra University","ror":"https://ror.org/04d4bt482","country_code":"JO","type":"education","lineage":["https://openalex.org/I92449659"]}],"countries":["JO"],"is_corresponding":true,"raw_author_name":"Yousef O. Sharrab","raw_affiliation_strings":["Department of Data Science and Artificial Intelligence, Isra University, Amman, Jordan","Depatment of Data Science and Artificial Intelligence, Isra University, Amman, Jordan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Data Science and Artificial Intelligence, Isra University, Amman, Jordan","institution_ids":["https://openalex.org/I92449659"]},{"raw_affiliation_string":"Depatment of Data Science and Artificial Intelligence, Isra University, Amman, Jordan","institution_ids":["https://openalex.org/I92449659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049069083","display_name":"Hani Attar","orcid":"https://orcid.org/0000-0001-8028-7918"},"institutions":[{"id":"https://openalex.org/I153687341","display_name":"Zarqa University","ror":"https://ror.org/01wf1es90","country_code":"JO","type":"education","lineage":["https://openalex.org/I153687341"]}],"countries":["JO"],"is_corresponding":false,"raw_author_name":"Hani Attar","raw_affiliation_strings":["Faculty of Engineering, Zarqa University, Zarqa, Jordan","Faculty of Engineering, Zarqa university, Zarqa, Jordan"],"raw_orcid":"https://orcid.org/0000-0001-8028-7918","affiliations":[{"raw_affiliation_string":"Faculty of Engineering, Zarqa University, Zarqa, Jordan","institution_ids":["https://openalex.org/I153687341"]},{"raw_affiliation_string":"Faculty of Engineering, Zarqa university, Zarqa, Jordan","institution_ids":["https://openalex.org/I153687341"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006234643","display_name":"Mohammad Ali H. Eljinini","orcid":"https://orcid.org/0000-0003-1680-2801"},"institutions":[{"id":"https://openalex.org/I92449659","display_name":"Isra University","ror":"https://ror.org/04d4bt482","country_code":"JO","type":"education","lineage":["https://openalex.org/I92449659"]}],"countries":["JO"],"is_corresponding":false,"raw_author_name":"Mohammad Ali H. Eljinini","raw_affiliation_strings":["Department of Computer Information Systems, Isra University, Amman, Jordan"],"raw_orcid":"https://orcid.org/0000-0003-1680-2801","affiliations":[{"raw_affiliation_string":"Department of Computer Information Systems, Isra University, Amman, Jordan","institution_ids":["https://openalex.org/I92449659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082813744","display_name":"Yasmin Al-Omary","orcid":null},"institutions":[{"id":"https://openalex.org/I156983542","display_name":"Jordan University of Science and Technology","ror":"https://ror.org/03y8mtb59","country_code":"JO","type":"education","lineage":["https://openalex.org/I156983542"]}],"countries":["JO"],"is_corresponding":false,"raw_author_name":"Yasmin Al-Omary","raw_affiliation_strings":["Department of Computer Science, Jordan University of Science and Technology, Irbid, Jordan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science, Jordan University of Science and Technology, Irbid, Jordan","institution_ids":["https://openalex.org/I156983542"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5116595233","display_name":"Wala\u2019a Al-Momani","orcid":null},"institutions":[{"id":"https://openalex.org/I156983542","display_name":"Jordan University of Science and Technology","ror":"https://ror.org/03y8mtb59","country_code":"JO","type":"education","lineage":["https://openalex.org/I156983542"]}],"countries":["JO"],"is_corresponding":false,"raw_author_name":"Wala\u2019A E. Al-Momani","raw_affiliation_strings":["Department of Computer Science, Jordan University of Science and Technology, Irbid, Jordan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science, Jordan University of Science and Technology, Irbid, Jordan","institution_ids":["https://openalex.org/I156983542"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5070704695"],"corresponding_institution_ids":["https://openalex.org/I92449659"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":27.1047,"has_fulltext":false,"cited_by_count":15,"citation_normalized_percentile":{"value":0.99492732,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":"13","issue":null,"first_page":"46925","last_page":"46940"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9125999808311462,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9125999808311462,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6584194302558899},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.5210944414138794},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.5030292868614197},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3908722400665283},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.3792659044265747},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.1652611792087555},{"id":"https://openalex.org/keywords/electrical-engineering","display_name":"Electrical engineering","score":0.10204023122787476}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6584194302558899},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.5210944414138794},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5030292868614197},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3908722400665283},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.3792659044265747},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.1652611792087555},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.10204023122787476},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2025.3550855","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2025.3550855","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:466372c5c584488a87757a3cb9373e3f","is_oa":true,"landing_page_url":"https://doaj.org/article/466372c5c584488a87757a3cb9373e3f","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 13, Pp 46925-46940 (2025)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2025.3550855","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2025.3550855","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320326306","display_name":"Zarqa University","ror":"https://ror.org/01wf1es90"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":38,"referenced_works":["https://openalex.org/W2781626870","https://openalex.org/W2981857663","https://openalex.org/W3015747801","https://openalex.org/W3015810689","https://openalex.org/W3016010032","https://openalex.org/W3157175643","https://openalex.org/W3162313915","https://openalex.org/W3206114047","https://openalex.org/W3207595101","https://openalex.org/W4205608408","https://openalex.org/W4210463634","https://openalex.org/W4221165942","https://openalex.org/W4223945715","https://openalex.org/W4224925623","https://openalex.org/W4225808286","https://openalex.org/W4226380987","https://openalex.org/W4226420874","https://openalex.org/W4283818106","https://openalex.org/W4317881096","https://openalex.org/W4327500526","https://openalex.org/W4379805013","https://openalex.org/W4385245566","https://openalex.org/W4385822429","https://openalex.org/W4385822766","https://openalex.org/W4385822815","https://openalex.org/W4391021542","https://openalex.org/W4391021623","https://openalex.org/W4392904027","https://openalex.org/W4393863141","https://openalex.org/W4399426355","https://openalex.org/W4400771889","https://openalex.org/W4412474694","https://openalex.org/W6770514103","https://openalex.org/W6853611000","https://openalex.org/W6857228344","https://openalex.org/W6857421307","https://openalex.org/W6866150908","https://openalex.org/W6866711220"],"related_works":["https://openalex.org/W2731899572","https://openalex.org/W3215138031","https://openalex.org/W3009238340","https://openalex.org/W4360585206","https://openalex.org/W4321369474","https://openalex.org/W4285208911","https://openalex.org/W3082895349","https://openalex.org/W4213079790","https://openalex.org/W2248239756","https://openalex.org/W3086377361"],"abstract_inverted_index":{"The":[0,46,80],"transformer":[1,58,160,233],"is":[2,223],"a":[3,117],"Deep":[4],"Learning":[5],"(DL)":[6],"model":[7,21,167,174],"that":[8,98],"revolutionized":[9],"language":[10],"processing":[11,18],"with":[12,183],"its":[13],"self-attention":[14],"mechanism,":[15],"enabling":[16],"parallel":[17],"and":[19,41,94,176,203],"improving":[20],"efficiency,":[22,168],"which":[23],"dramatically":[24],"reshaped":[25],"the":[26,34,39,55,64,68,88,129,142,150,159,169,194,201],"landscape":[27],"of":[28,44,57,82,109,153,158,171,197,205],"speech":[29,61,206,227],"recognition":[30,207,228],"technology,":[31],"based":[32],"on":[33,60,136,173],"ability":[35],"to":[36,76,86,123,128,186,225],"efficiently":[37],"manage":[38],"dynamic":[40],"context-rich":[42],"nature":[43],"speech.":[45],"proposed":[47],"systematic":[48],"review":[49,130,187,217],"in":[50,166,178,188,199,210],"this":[51,83,189,216],"article":[52,84],"critically":[53],"examines":[54],"impact":[56],"models":[59,161],"recognition,":[62],"covering":[63],"published":[65],"research":[66,96,222],"over":[67],"past":[69],"seven":[70,137],"years":[71],"(from":[72],"January":[73],"1,":[74],"2017,":[75],"May":[77],"15,":[78],"2024).":[79],"goals":[81],"are":[85],"synthesize":[87],"current":[89],"knowledge,":[90],"pinpoint":[91],"emerging":[92],"trends,":[93],"identify":[95],"gaps":[97],"could":[99],"be":[100],"beneficial":[101],"for":[102],"future":[103],"investigations.":[104],"From":[105],"an":[106],"initial":[107],"pool":[108],"2,838":[110],"publications":[111],"sourced":[112],"from":[113],"leading":[114],"digital":[115],"libraries,":[116],"rigorous":[118],"two-step":[119],"screening":[120],"process":[121],"applied":[122],"distill":[124],"high-quality":[125],"studies":[126],"relevant":[127],"criteria.":[131],"We":[132],"concentrated":[133],"our":[134],"analysis":[135],"pivotal":[138],"areas":[139,219],"as":[140],"following:":[141],"environmental":[143],"conditions":[144],"(neutral":[145],"versus":[146],"noisy)":[147],"addressed":[148],"by":[149,231],"studies,":[151],"methods":[152],"feature":[154],"extraction":[155],"employed,":[156],"characteristics":[157],"used,":[162],"datasets":[163],"utilized,":[164],"variations":[165],"influence":[170],"noise":[172],"generalizability,":[175],"trends":[177],"self-supervised":[179],"learning,":[180],"ending":[181],"up":[182],"37":[184],"articles":[185],"paper.":[190],"Our":[191],"findings":[192],"underscore":[193],"transformative":[195],"potential":[196],"transformers":[198],"enhancing":[200],"accuracy":[202],"robustness":[204],"systems,":[208],"especially":[209],"challenging":[211],"acoustic":[212],"environments.":[213],"In":[214],"addition,":[215],"highlights":[218],"where":[220],"more":[221],"needed":[224],"make":[226],"even":[229],"better":[230],"using":[232],"technology.":[234]},"counts_by_year":[{"year":2026,"cited_by_count":5},{"year":2025,"cited_by_count":10}],"updated_date":"2026-06-05T09:01:59.212387","created_date":"2025-10-10T00:00:00"}
