{"id":"https://openalex.org/W4377298277","doi":"https://doi.org/10.48550/arxiv.2305.11244","title":"A Parameter-Efficient Learning Approach to Arabic Dialect Identification with Pre-Trained General-Purpose Speech Model","display_name":"A Parameter-Efficient Learning Approach to Arabic Dialect Identification with Pre-Trained General-Purpose Speech Model","publication_year":2023,"publication_date":"2023-05-18","ids":{"openalex":"https://openalex.org/W4377298277","doi":"https://doi.org/10.48550/arxiv.2305.11244"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2305.11244","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2305.11244","pdf_url":"https://arxiv.org/pdf/2305.11244","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2305.11244","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5027982192","display_name":"Srijith Radhakrishnan","orcid":null},"institutions":[{"id":"https://openalex.org/I71920554","display_name":"King Abdullah University of Science and Technology","ror":"https://ror.org/01q3tbs38","country_code":"SA","type":"education","lineage":["https://openalex.org/I71920554"]},{"id":"https://openalex.org/I164861460","display_name":"Manipal Academy of Higher Education","ror":"https://ror.org/02xzytt36","country_code":"IN","type":"education","lineage":["https://openalex.org/I164861460"]}],"countries":["IN","SA"],"is_corresponding":true,"raw_author_name":"Radhakrishnan, Srijith","raw_affiliation_strings":["SDAIA-KAUST Center of Excellence in Data Science and Artificial Intelligence;","Manipal Institute of Technology, India;","King Abdullah University of Science and Technology, Saudi Arabia"],"affiliations":[{"raw_affiliation_string":"SDAIA-KAUST Center of Excellence in Data Science and Artificial Intelligence;","institution_ids":[]},{"raw_affiliation_string":"Manipal Institute of Technology, India;","institution_ids":["https://openalex.org/I164861460"]},{"raw_affiliation_string":"King Abdullah University of Science and Technology, Saudi Arabia","institution_ids":["https://openalex.org/I71920554"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020376803","display_name":"Chao-Han Huck Yang","orcid":"https://orcid.org/0000-0003-2879-8811"},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]},{"id":"https://openalex.org/I71920554","display_name":"King Abdullah University of Science and Technology","ror":"https://ror.org/01q3tbs38","country_code":"SA","type":"education","lineage":["https://openalex.org/I71920554"]}],"countries":["SA","US"],"is_corresponding":false,"raw_author_name":"Yang, Chao-Han Huck","raw_affiliation_strings":["King Abdullah University of Science and Technology, Saudi Arabia","Georgia Institute of Technology, USA;"],"affiliations":[{"raw_affiliation_string":"King Abdullah University of Science and Technology, Saudi Arabia","institution_ids":["https://openalex.org/I71920554"]},{"raw_affiliation_string":"Georgia Institute of Technology, USA;","institution_ids":["https://openalex.org/I130701444"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000405517","display_name":"Sumeer Ahmad Khan","orcid":null},"institutions":[{"id":"https://openalex.org/I71920554","display_name":"King Abdullah University of Science and Technology","ror":"https://ror.org/01q3tbs38","country_code":"SA","type":"education","lineage":["https://openalex.org/I71920554"]}],"countries":["SA"],"is_corresponding":false,"raw_author_name":"Khan, Sumeer Ahmad","raw_affiliation_strings":["SDAIA-KAUST Center of Excellence in Data Science and Artificial Intelligence;","King Abdullah University of Science and Technology, Saudi Arabia"],"affiliations":[{"raw_affiliation_string":"SDAIA-KAUST Center of Excellence in Data Science and Artificial Intelligence;","institution_ids":[]},{"raw_affiliation_string":"King Abdullah University of Science and Technology, Saudi Arabia","institution_ids":["https://openalex.org/I71920554"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055536778","display_name":"Narsis A. Kiani","orcid":"https://orcid.org/0000-0002-0949-046X"},"institutions":[{"id":"https://openalex.org/I28166907","display_name":"Karolinska Institutet","ror":"https://ror.org/056d84691","country_code":"SE","type":"education","lineage":["https://openalex.org/I28166907"]}],"countries":["SE"],"is_corresponding":false,"raw_author_name":"Kiani, Narsis A.","raw_affiliation_strings":["Karolinska Institutet, Sweden"],"affiliations":[{"raw_affiliation_string":"Karolinska Institutet, Sweden","institution_ids":["https://openalex.org/I28166907"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078466508","display_name":"David G\u00f3mez-Cabrero","orcid":"https://orcid.org/0000-0003-4186-3788"},"institutions":[{"id":"https://openalex.org/I71920554","display_name":"King Abdullah University of Science and Technology","ror":"https://ror.org/01q3tbs38","country_code":"SA","type":"education","lineage":["https://openalex.org/I71920554"]}],"countries":["SA"],"is_corresponding":false,"raw_author_name":"Gomez-Cabrero, David","raw_affiliation_strings":["King Abdullah University of Science and Technology, Saudi Arabia"],"affiliations":[{"raw_affiliation_string":"King Abdullah University of Science and Technology, Saudi Arabia","institution_ids":["https://openalex.org/I71920554"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5035252549","display_name":"Jesper Tegn\u00e9r","orcid":"https://orcid.org/0000-0002-9568-5588"},"institutions":[{"id":"https://openalex.org/I71920554","display_name":"King Abdullah University of Science and Technology","ror":"https://ror.org/01q3tbs38","country_code":"SA","type":"education","lineage":["https://openalex.org/I71920554"]},{"id":"https://openalex.org/I28166907","display_name":"Karolinska Institutet","ror":"https://ror.org/056d84691","country_code":"SE","type":"education","lineage":["https://openalex.org/I28166907"]}],"countries":["SA","SE"],"is_corresponding":false,"raw_author_name":"Tegner, Jesper N.","raw_affiliation_strings":["Karolinska Institutet, Sweden","King Abdullah University of Science and Technology, Saudi Arabia","SDAIA-KAUST Center of Excellence in Data Science and Artificial Intelligence;"],"affiliations":[{"raw_affiliation_string":"Karolinska Institutet, Sweden","institution_ids":["https://openalex.org/I28166907"]},{"raw_affiliation_string":"King Abdullah University of Science and Technology, Saudi Arabia","institution_ids":["https://openalex.org/I71920554"]},{"raw_affiliation_string":"SDAIA-KAUST Center of Excellence in Data Science and Artificial Intelligence;","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":4,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5027982192"],"corresponding_institution_ids":["https://openalex.org/I164861460","https://openalex.org/I71920554"],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9969000220298767,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12380","display_name":"Authorship Attribution and Profiling","score":0.934499979019165,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7759705781936646},{"id":"https://openalex.org/keywords/pronunciation","display_name":"Pronunciation","score":0.676705002784729},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5885533690452576},{"id":"https://openalex.org/keywords/gsm","display_name":"GSM","score":0.5205988883972168},{"id":"https://openalex.org/keywords/identification","display_name":"Identification (biology)","score":0.51285719871521},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5042012929916382},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.5014314651489258},{"id":"https://openalex.org/keywords/adapter","display_name":"Adapter (computing)","score":0.48065435886383057},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4410959780216217},{"id":"https://openalex.org/keywords/vocabulary","display_name":"Vocabulary","score":0.4324640929698944},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.4220244288444519}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7759705781936646},{"id":"https://openalex.org/C2780844864","wikidata":"https://www.wikidata.org/wiki/Q184377","display_name":"Pronunciation","level":2,"score":0.676705002784729},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5885533690452576},{"id":"https://openalex.org/C59201141","wikidata":"https://www.wikidata.org/wiki/Q46904","display_name":"GSM","level":2,"score":0.5205988883972168},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.51285719871521},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5042012929916382},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.5014314651489258},{"id":"https://openalex.org/C177284502","wikidata":"https://www.wikidata.org/wiki/Q1005390","display_name":"Adapter (computing)","level":2,"score":0.48065435886383057},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4410959780216217},{"id":"https://openalex.org/C2777601683","wikidata":"https://www.wikidata.org/wiki/Q6499736","display_name":"Vocabulary","level":2,"score":0.4324640929698944},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.4220244288444519},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C59822182","wikidata":"https://www.wikidata.org/wiki/Q441","display_name":"Botany","level":1,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2305.11244","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2305.11244","pdf_url":"https://arxiv.org/pdf/2305.11244","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2305.11244","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2305.11244","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article-journal"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2305.11244","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2305.11244","pdf_url":"https://arxiv.org/pdf/2305.11244","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"score":0.6800000071525574,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320322320","display_name":"King Abdullah University of Science and Technology","ror":"https://ror.org/01q3tbs38"}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4377298277.pdf"},"referenced_works_count":35,"referenced_works":["https://openalex.org/W2008056655","https://openalex.org/W2091409162","https://openalex.org/W2130721836","https://openalex.org/W2157075408","https://openalex.org/W2160802179","https://openalex.org/W2786835190","https://openalex.org/W2899663614","https://openalex.org/W2962858109","https://openalex.org/W2963211188","https://openalex.org/W2963446712","https://openalex.org/W2963466763","https://openalex.org/W2963486098","https://openalex.org/W2964303773","https://openalex.org/W3016021175","https://openalex.org/W3101609372","https://openalex.org/W3119835585","https://openalex.org/W3168867926","https://openalex.org/W3172443934","https://openalex.org/W3176828726","https://openalex.org/W3201225328","https://openalex.org/W3205949070","https://openalex.org/W3207955791","https://openalex.org/W4205394650","https://openalex.org/W4210491685","https://openalex.org/W4224979832","https://openalex.org/W4225410153","https://openalex.org/W4226162428","https://openalex.org/W4289673860","https://openalex.org/W4297663785","https://openalex.org/W4298312696","https://openalex.org/W4311000453","https://openalex.org/W4372268294","https://openalex.org/W4372346241","https://openalex.org/W4385245566","https://openalex.org/W4385484947"],"related_works":["https://openalex.org/W2133028525","https://openalex.org/W4306381730","https://openalex.org/W4229060448","https://openalex.org/W2981692913","https://openalex.org/W2183593636","https://openalex.org/W2350724007","https://openalex.org/W2355751417","https://openalex.org/W3044188621","https://openalex.org/W3184035966","https://openalex.org/W2423284978"],"abstract_inverted_index":{"In":[0],"this":[1],"work,":[2],"we":[3,20],"explore":[4],"Parameter-Efficient-Learning":[5],"(PEL)":[6],"techniques":[7],"to":[8,24,53,66,106,120],"repurpose":[9],"a":[10,29,49,125],"General-Purpose-Speech":[11],"(GSM)":[12],"model":[13,44],"for":[14,57],"Arabic":[15,58,122],"dialect":[16],"identification":[17],"(ADI).":[18,61],"Specifically,":[19],"investigate":[21],"different":[22],"setups":[23],"incorporate":[25],"trainable":[26,114],"features":[27],"into":[28],"multi-layer":[30],"encoder-decoder":[31],"GSM":[32,56],"formulation":[33],"under":[34],"frozen":[35],"pre-trained":[36,136],"settings.":[37],"Our":[38,116],"architecture":[39],"includes":[40],"residual":[41],"adapter":[42],"and":[43,72,128,135],"reprogramming":[45],"(input-prompting).":[46],"We":[47,79,91],"design":[48],"token-level":[50],"label":[51],"mapping":[52],"condition":[54],"the":[55,67,75,85,94,98],"Dialect":[59],"Identification":[60],"This":[62],"is":[63],"challenging":[64],"due":[65],"high":[68],"variation":[69],"in":[70],"vocabulary":[71],"pronunciation":[73],"among":[74],"numerous":[76],"regional":[77],"dialects.":[78],"achieve":[80],"new":[81],"state-of-the-art":[82],"accuracy":[83,105],"on":[84],"ADI-17":[86],"dataset":[87,127],"by":[88],"vanilla":[89],"fine-tuning.":[90],"further":[92],"reduce":[93],"training":[95],"budgets":[96],"with":[97,131],"PEL":[99],"method,":[100],"which":[101],"performs":[102],"within":[103],"1.86%":[104],"fine-tuning":[107],"using":[108,124],"only":[109],"2.5%":[110],"of":[111],"(extra)":[112],"network":[113],"parameters.":[115],"study":[117],"demonstrates":[118],"how":[119],"identify":[121],"dialects":[123],"small":[126],"limited":[129],"computation":[130],"open":[132],"source":[133],"code":[134],"models.":[137]},"counts_by_year":[],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
