{"id":"https://openalex.org/W7140369410","doi":"https://doi.org/10.48550/arxiv.2603.23654","title":"Ethio-ASR: Joint Multilingual Speech Recognition and Language Identification for Ethiopian Languages","display_name":"Ethio-ASR: Joint Multilingual Speech Recognition and Language Identification for Ethiopian Languages","publication_year":2026,"publication_date":"2026-03-24","ids":{"openalex":"https://openalex.org/W7140369410","doi":"https://doi.org/10.48550/arxiv.2603.23654"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.23654","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.23654","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.23654","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5111310853","display_name":"Badr M. Abdullah","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Abdullah, Badr M.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013873474","display_name":"Israel Abebe Azime","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Azime, Israel Abebe","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130701434","display_name":"Atnafu Lambebo Tonja","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tonja, Atnafu Lambebo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055769964","display_name":"Jesujoba O. Alabi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Alabi, Jesujoba O.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130675508","display_name":"Abel Mulat Alemu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Alemu, Abel Mulat","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130655806","display_name":"Eyob G. Hagos","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hagos, Eyob G.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5099096832","display_name":"Bontu Fufa Balcha","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Balcha, Bontu Fufa","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130710134","display_name":"Mulubrhan A. Nerea","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nerea, Mulubrhan A.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114653388","display_name":"Debela Desalegn Yadeta","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yadeta, Debela Desalegn","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5120308310","display_name":"Dagnachew Mekonnen Marilign","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Marilign, Dagnachew Mekonnen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130685317","display_name":"Amanuel Temesgen Fentahun","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fentahun, Amanuel Temesgen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130631618","display_name":"Tadesse Kebede","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kebede, Tadesse","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072548521","display_name":"Israel D. Gebru","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gebru, Israel D.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077821129","display_name":"Michael Melese Woldeyohannis","orcid":"https://orcid.org/0000-0002-1532-6885"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Woldeyohannis, Michael Melese","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011399695","display_name":"Walelign Tewabe Sewunetie","orcid":"https://orcid.org/0000-0003-2787-8019"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sewunetie, Walelign Tewabe","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047761609","display_name":"Bernd M\u00f6bius","orcid":"https://orcid.org/0000-0003-3065-9984"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"M\u00f6bius, Bernd","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5130638257","display_name":"Dietrich Klakow","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Klakow, Dietrich","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":17,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9465000033378601,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9465000033378601,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.018400000408291817,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10403","display_name":"Phonetics and Phonology Research","score":0.005100000184029341,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/joint","display_name":"Joint (building)","score":0.5771999955177307},{"id":"https://openalex.org/keywords/consonant","display_name":"Consonant","score":0.4505000114440918},{"id":"https://openalex.org/keywords/suite","display_name":"Suite","score":0.4287000000476837},{"id":"https://openalex.org/keywords/speech-corpus","display_name":"Speech corpus","score":0.412200003862381},{"id":"https://openalex.org/keywords/identification","display_name":"Identification (biology)","score":0.4108999967575073},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.3944000005722046},{"id":"https://openalex.org/keywords/vowel","display_name":"Vowel","score":0.3750999867916107},{"id":"https://openalex.org/keywords/speech-technology","display_name":"Speech technology","score":0.3424000144004822}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.755299985408783},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6330999732017517},{"id":"https://openalex.org/C18555067","wikidata":"https://www.wikidata.org/wiki/Q8375051","display_name":"Joint (building)","level":2,"score":0.5771999955177307},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5496000051498413},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.49470001459121704},{"id":"https://openalex.org/C2778203577","wikidata":"https://www.wikidata.org/wiki/Q38035","display_name":"Consonant","level":3,"score":0.4505000114440918},{"id":"https://openalex.org/C79581498","wikidata":"https://www.wikidata.org/wiki/Q1367530","display_name":"Suite","level":2,"score":0.4287000000476837},{"id":"https://openalex.org/C91863865","wikidata":"https://www.wikidata.org/wiki/Q4349497","display_name":"Speech corpus","level":3,"score":0.412200003862381},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.4108999967575073},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.3944000005722046},{"id":"https://openalex.org/C2779581591","wikidata":"https://www.wikidata.org/wiki/Q36244","display_name":"Vowel","level":2,"score":0.3750999867916107},{"id":"https://openalex.org/C504749915","wikidata":"https://www.wikidata.org/wiki/Q9010971","display_name":"Speech technology","level":3,"score":0.3424000144004822},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.3375999927520752},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.32019999623298645},{"id":"https://openalex.org/C129792486","wikidata":"https://www.wikidata.org/wiki/Q1050419","display_name":"Language identification","level":3,"score":0.3003999888896942},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.2644999921321869},{"id":"https://openalex.org/C51929080","wikidata":"https://www.wikidata.org/wiki/Q2425187","display_name":"Codebase","level":3,"score":0.260699987411499},{"id":"https://openalex.org/C2776230583","wikidata":"https://www.wikidata.org/wiki/Q1322198","display_name":"Spoken language","level":2,"score":0.2590000033378601},{"id":"https://openalex.org/C155635449","wikidata":"https://www.wikidata.org/wiki/Q4674699","display_name":"Acoustic model","level":3,"score":0.25209999084472656},{"id":"https://openalex.org/C155092808","wikidata":"https://www.wikidata.org/wiki/Q182557","display_name":"Computational linguistics","level":2,"score":0.2515000104904175}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.23654","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.23654","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.23654","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.23654","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.5294681787490845},{"id":"https://metadata.un.org/sdg/5","display_name":"Gender equality","score":0.40948420763015747}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"We":[0,56,102],"present":[1],"Ethio-ASR,":[2],"a":[3,105],"suite":[4],"of":[5,35,53,86,108,113,126],"multilingual":[6,75,127],"CTC-based":[7],"automatic":[8],"speech":[9,44,69],"recognition":[10],"(ASR)":[11],"models":[12,59,131],"jointly":[13],"trained":[14],"on":[15,60,88],"five":[16],"Ethiopian":[17],"languages:":[18],"Amharic,":[19],"Tigrinya,":[20],"Oromo,":[21],"Sidaama,":[22],"and":[23,32,39,71,116,122,132],"Wolaytta.":[24],"These":[25],"languages":[26],"belong":[27],"to":[28,119,137],"the":[29,36,50,61,89,94,111,123,138],"Semitic,":[30],"Cushitic,":[31],"Omotic":[33],"branches":[34],"Afroasiatic":[37],"family,":[38],"remain":[40],"severely":[41],"underrepresented":[42],"in":[43],"technology":[45],"despite":[46],"being":[47],"spoken":[48],"by":[49],"vast":[51],"majority":[52],"Ethiopia's":[54],"population.":[55],"train":[57],"our":[58],"recently":[62],"released":[63],"WAXAL":[64,90],"corpus":[65],"using":[66],"several":[67],"pre-trained":[68],"encoders":[70],"evaluate":[72],"against":[73],"strong":[74],"baselines,":[76],"including":[77],"OmniASR.":[78],"Our":[79,130],"best":[80,95],"model":[81,97],"achieves":[82],"an":[83],"average":[84],"WER":[85],"30.48%":[87],"test":[91],"set,":[92],"outperforming":[93],"OmniASR":[96],"with":[98],"substantially":[99],"fewer":[100],"parameters.":[101],"further":[103],"provide":[104],"comprehensive":[106],"analysis":[107],"gender":[109],"bias,":[110],"contribution":[112],"vowel":[114],"length":[115],"consonant":[117],"gemination":[118],"ASR":[120],"errors,":[121],"training":[124],"dynamics":[125],"CTC":[128],"models.":[129],"codebase":[133],"are":[134],"publicly":[135],"available":[136],"research":[139],"community.":[140]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-27T00:00:00"}
