{"id":"https://openalex.org/W7139926358","doi":"https://doi.org/10.1016/j.procs.2026.01.063","title":"End-to-End Conformer Neural Networks for Multilingual Automatic Speech Recognition and Understanding","display_name":"End-to-End Conformer Neural Networks for Multilingual Automatic Speech Recognition and Understanding","publication_year":2026,"publication_date":"2026-01-01","ids":{"openalex":"https://openalex.org/W7139926358","doi":"https://doi.org/10.1016/j.procs.2026.01.063"},"language":"en","primary_location":{"id":"doi:10.1016/j.procs.2026.01.063","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.procs.2026.01.063","pdf_url":null,"source":{"id":"https://openalex.org/S120348307","display_name":"Procedia Computer Science","issn_l":"1877-0509","issn":["1877-0509"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Procedia Computer Science","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://doi.org/10.1016/j.procs.2026.01.063","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5130227432","display_name":"Hassan AlMashhadani","orcid":null},"institutions":[{"id":"https://openalex.org/I12150220","display_name":"University of Mosul","ror":"https://ror.org/039cf4q47","country_code":"IQ","type":"education","lineage":["https://openalex.org/I12150220"]}],"countries":["IQ"],"is_corresponding":true,"raw_author_name":"Hassan AlMashhadani","raw_affiliation_strings":["Dept. Of Artificial Intelligence. College of Computer science and Mathematics, University of Mosul-Iraq"],"affiliations":[{"raw_affiliation_string":"Dept. Of Artificial Intelligence. College of Computer science and Mathematics, University of Mosul-Iraq","institution_ids":["https://openalex.org/I12150220"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128499731","display_name":"Alaa Alsaffar","orcid":null},"institutions":[{"id":"https://openalex.org/I4210145266","display_name":"Southern Technical University","ror":"https://ror.org/03sax3264","country_code":"IQ","type":"education","lineage":["https://openalex.org/I4210145266"]}],"countries":["IQ"],"is_corresponding":false,"raw_author_name":"Alaa A. Alsaffar","raw_affiliation_strings":["AlKunooze University College of Technical Engineering, Basrah, Iraq"],"affiliations":[{"raw_affiliation_string":"AlKunooze University College of Technical Engineering, Basrah, Iraq","institution_ids":["https://openalex.org/I4210145266"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130218001","display_name":"Hillal Ali AlMaqbali","orcid":null},"institutions":[{"id":"https://openalex.org/I45998257","display_name":"Sohar University","ror":"https://ror.org/02ftvf862","country_code":"OM","type":"education","lineage":["https://openalex.org/I45998257"]}],"countries":["OM"],"is_corresponding":false,"raw_author_name":"Hillal Ali AlMaqbali","raw_affiliation_strings":["College of Computing and IT, University of Technology and Applied Sciences, Suhar, Oman"],"affiliations":[{"raw_affiliation_string":"College of Computing and IT, University of Technology and Applied Sciences, Suhar, Oman","institution_ids":["https://openalex.org/I45998257"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5130213842","display_name":"Ahmed Al-Amayreh","orcid":null},"institutions":[{"id":"https://openalex.org/I45998257","display_name":"Sohar University","ror":"https://ror.org/02ftvf862","country_code":"OM","type":"education","lineage":["https://openalex.org/I45998257"]}],"countries":["OM"],"is_corresponding":false,"raw_author_name":"Ahmed Al-Amayreh","raw_affiliation_strings":["College of Computing and IT, University of Technology and Applied Sciences, Suhar, Oman"],"affiliations":[{"raw_affiliation_string":"College of Computing and IT, University of Technology and Applied Sciences, Suhar, Oman","institution_ids":["https://openalex.org/I45998257"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5130227432"],"corresponding_institution_ids":["https://openalex.org/I12150220"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.93147051,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":null,"biblio":{"volume":"275","issue":null,"first_page":"541","last_page":"549"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.48910000920295715,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.48910000920295715,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.05689999833703041,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.052799999713897705,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5175999999046326},{"id":"https://openalex.org/keywords/deep-neural-networks","display_name":"Deep neural networks","score":0.3630000054836273},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.2953999936580658},{"id":"https://openalex.org/keywords/speech-processing","display_name":"Speech processing","score":0.2705000042915344},{"id":"https://openalex.org/keywords/emotion-recognition","display_name":"Emotion recognition","score":0.2596000134944916}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.9107000231742859},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6018999814987183},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5307999849319458},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5175999999046326},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5058000087738037},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.3630000054836273},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2953999936580658},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.2705000042915344},{"id":"https://openalex.org/C2777438025","wikidata":"https://www.wikidata.org/wiki/Q1339090","display_name":"Emotion recognition","level":2,"score":0.2596000134944916},{"id":"https://openalex.org/C175202392","wikidata":"https://www.wikidata.org/wiki/Q2434543","display_name":"Time delay neural network","level":3,"score":0.2371000051498413}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1016/j.procs.2026.01.063","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.procs.2026.01.063","pdf_url":null,"source":{"id":"https://openalex.org/S120348307","display_name":"Procedia Computer Science","issn_l":"1877-0509","issn":["1877-0509"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Procedia Computer Science","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1016/j.procs.2026.01.063","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.procs.2026.01.063","pdf_url":null,"source":{"id":"https://openalex.org/S120348307","display_name":"Procedia Computer Science","issn_l":"1877-0509","issn":["1877-0509"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Procedia Computer Science","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10","score":0.4197138845920563}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":44,"referenced_works":["https://openalex.org/W3183219652","https://openalex.org/W4200313634","https://openalex.org/W4206037047","https://openalex.org/W4210475104","https://openalex.org/W4304013688","https://openalex.org/W4319660698","https://openalex.org/W4320060058","https://openalex.org/W4320498290","https://openalex.org/W4376141778","https://openalex.org/W4378227633","https://openalex.org/W4379387938","https://openalex.org/W4385994195","https://openalex.org/W4389104939","https://openalex.org/W4391402564","https://openalex.org/W4398197972","https://openalex.org/W4398199915","https://openalex.org/W4398199933","https://openalex.org/W4398199977","https://openalex.org/W4399457811","https://openalex.org/W4401948251","https://openalex.org/W4403104615","https://openalex.org/W4403111421","https://openalex.org/W4403111444","https://openalex.org/W4403267782","https://openalex.org/W4403558103","https://openalex.org/W4404186213","https://openalex.org/W4405062006","https://openalex.org/W4405065223","https://openalex.org/W4406125273","https://openalex.org/W4406416056","https://openalex.org/W4406435604","https://openalex.org/W4406525077","https://openalex.org/W4407040299","https://openalex.org/W4407382954","https://openalex.org/W4407383828","https://openalex.org/W4407775092","https://openalex.org/W4407955656","https://openalex.org/W4408059677","https://openalex.org/W4408128024","https://openalex.org/W4408164402","https://openalex.org/W4408313718","https://openalex.org/W4408589440","https://openalex.org/W4409426354","https://openalex.org/W4410045251"],"related_works":[],"abstract_inverted_index":{"Educational":[0],"and":[1,10,19,30,53,76,90,100,113,123,131,141,161],"e-learning":[2,111,154],"environments":[3],"must":[4],"incorporate":[5],"Spoken":[6],"Language":[7],"Understanding":[8],"(SLU)":[9],"Automatic":[11],"Speech":[12],"Recognition":[13],"(ASR)":[14],"to":[15],"ensure":[16],"accessible,":[17],"scalable,":[18],"inclusive":[20],"digital":[21],"learning.":[22],"Existing":[23],"algorithms":[24],"struggle":[25],"with":[26],"low-resource":[27,138],"languages,":[28,81],"accents,":[29],"linguistic":[31],"variety,":[32],"making":[33],"them":[34],"unsuitable":[35],"for":[36,50,73,86,92,148],"real-world":[37],"multilingual":[38,104,158],"educational":[39,105],"environments.":[40],"Therefore,":[41],"this":[42],"study":[43],"proposes":[44],"EduLinguaNet,":[45],"a":[46],"Multilingual":[47],"Conformer":[48,69],"Network":[49],"online":[51],"classes":[52],"schools,":[54],"which":[55],"solves":[56],"these":[57],"issues":[58],"in":[59,128,137],"accurate":[60],"speech":[61,159],"detection.":[62],"The":[63,95],"proposed":[64,96],"EduLinguaNet":[65,120,152],"employs":[66],"an":[67],"end-to-end":[68],"Neural":[70,125],"network":[71],"architecture":[72],"precise":[74],"translation":[75],"semantic":[77],"comprehension":[78],"across":[79],"multiple":[80],"utilizing":[82,102],"layer-by-layer":[83],"neural":[84],"networks":[85],"local":[87],"feature":[88],"modeling":[89],"self-attention":[91],"long-distance":[93],"interactions.":[94],"model":[97],"is":[98],"trained":[99],"assessed":[101],"large-scale":[103],"corpora,":[106],"language":[107,139],"learning":[108],"platforms,":[109],"interactive":[110],"sessions,":[112],"lecture":[114],"recordings.":[115],"Experimental":[116],"data":[117],"show":[118],"that":[119],"outperforms":[121],"Transformers":[122],"Recurrent":[124],"Networks":[126],"(RNNs)":[127],"intent":[129],"recognition":[130],"Word":[132],"Error":[133],"Rate":[134],"(WER).":[135],"Robustness":[136],"settings":[140],"code-switching":[142],"performance":[143],"indicate":[144],"the":[145],"system\u2019s":[146],"adaptability":[147],"diverse":[149],"learners.":[150],"Finally,":[151],"improves":[153],"via":[155],"accurate,":[156],"real-time,":[157],"detection":[160],"interpretation.":[162]},"counts_by_year":[],"updated_date":"2026-03-22T06:25:25.174409","created_date":"2026-03-21T00:00:00"}
