{"id":"https://openalex.org/W4400747285","doi":"https://doi.org/10.1186/s13636-024-00361-7","title":"Exploring task-diverse meta-learning on Tibetan multi-dialect speech recognition","display_name":"Exploring task-diverse meta-learning on Tibetan multi-dialect speech recognition","publication_year":2024,"publication_date":"2024-07-17","ids":{"openalex":"https://openalex.org/W4400747285","doi":"https://doi.org/10.1186/s13636-024-00361-7"},"language":"en","primary_location":{"id":"doi:10.1186/s13636-024-00361-7","is_oa":true,"landing_page_url":"http://dx.doi.org/10.1186/s13636-024-00361-7","pdf_url":"https://link.springer.com/content/pdf/10.1186/s13636-024-00361-7.pdf","source":{"id":"https://openalex.org/S19605986","display_name":"EURASIP Journal on Audio Speech and Music Processing","issn_l":"1687-4714","issn":["1687-4714","1687-4722"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319965","host_organization_name":"Springer Nature","host_organization_lineage":["https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EURASIP Journal on Audio, Speech, and Music Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://link.springer.com/content/pdf/10.1186/s13636-024-00361-7.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5110451996","display_name":"Y. Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I145897649","display_name":"Minzu University of China","ror":"https://ror.org/0044e2g62","country_code":"CN","type":"education","lineage":["https://openalex.org/I145897649"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yigang Liu","raw_affiliation_strings":["Key Laboratory of Ethnic Language Intelligent Analysis and Security Governance of MOE, Minzu University of China, Beijing, 100081, China","School of Information Engineering, Minzu University of China, Beijing, 100081, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Ethnic Language Intelligent Analysis and Security Governance of MOE, Minzu University of China, Beijing, 100081, China","institution_ids":["https://openalex.org/I145897649"]},{"raw_affiliation_string":"School of Information Engineering, Minzu University of China, Beijing, 100081, China","institution_ids":["https://openalex.org/I145897649"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108956725","display_name":"Yue Zhao","orcid":null},"institutions":[{"id":"https://openalex.org/I145897649","display_name":"Minzu University of China","ror":"https://ror.org/0044e2g62","country_code":"CN","type":"education","lineage":["https://openalex.org/I145897649"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yue Zhao","raw_affiliation_strings":["Key Laboratory of Ethnic Language Intelligent Analysis and Security Governance of MOE, Minzu University of China, Beijing, 100081, China","School of Information Engineering, Minzu University of China, Beijing, 100081, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Ethnic Language Intelligent Analysis and Security Governance of MOE, Minzu University of China, Beijing, 100081, China","institution_ids":["https://openalex.org/I145897649"]},{"raw_affiliation_string":"School of Information Engineering, Minzu University of China, Beijing, 100081, China","institution_ids":["https://openalex.org/I145897649"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045844800","display_name":"Xiaona Xu","orcid":"https://orcid.org/0000-0001-8715-1618"},"institutions":[{"id":"https://openalex.org/I145897649","display_name":"Minzu University of China","ror":"https://ror.org/0044e2g62","country_code":"CN","type":"education","lineage":["https://openalex.org/I145897649"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaona Xu","raw_affiliation_strings":["Key Laboratory of Ethnic Language Intelligent Analysis and Security Governance of MOE, Minzu University of China, Beijing, 100081, China","School of Information Engineering, Minzu University of China, Beijing, 100081, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Ethnic Language Intelligent Analysis and Security Governance of MOE, Minzu University of China, Beijing, 100081, China","institution_ids":["https://openalex.org/I145897649"]},{"raw_affiliation_string":"School of Information Engineering, Minzu University of China, Beijing, 100081, China","institution_ids":["https://openalex.org/I145897649"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100673719","display_name":"Liang Xu","orcid":"https://orcid.org/0000-0001-8171-0247"},"institutions":[{"id":"https://openalex.org/I145897649","display_name":"Minzu University of China","ror":"https://ror.org/0044e2g62","country_code":"CN","type":"education","lineage":["https://openalex.org/I145897649"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Liang Xu","raw_affiliation_strings":["Key Laboratory of Ethnic Language Intelligent Analysis and Security Governance of MOE, Minzu University of China, Beijing, 100081, China","School of Information Engineering, Minzu University of China, Beijing, 100081, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Ethnic Language Intelligent Analysis and Security Governance of MOE, Minzu University of China, Beijing, 100081, China","institution_ids":["https://openalex.org/I145897649"]},{"raw_affiliation_string":"School of Information Engineering, Minzu University of China, Beijing, 100081, China","institution_ids":["https://openalex.org/I145897649"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5073899717","display_name":"Xubei Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I111088046","display_name":"Boston University","ror":"https://ror.org/05qwgg493","country_code":"US","type":"education","lineage":["https://openalex.org/I111088046"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xubei Zhang","raw_affiliation_strings":["Linguistics & Computer Science, Boston University, Boston, 02215, USA"],"affiliations":[{"raw_affiliation_string":"Linguistics & Computer Science, Boston University, Boston, 02215, USA","institution_ids":["https://openalex.org/I111088046"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5076346273","display_name":"Qiang Ji","orcid":"https://orcid.org/0000-0002-4302-2889"},"institutions":[{"id":"https://openalex.org/I165799507","display_name":"Rensselaer Polytechnic Institute","ror":"https://ror.org/01rtyzb94","country_code":"US","type":"education","lineage":["https://openalex.org/I165799507"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Qiang Ji","raw_affiliation_strings":["Department of Electrical, Computer, and Systems Engineering, Rensselaer Polytechnic Institute, Troy, NY, 12180-3590, USA"],"affiliations":[{"raw_affiliation_string":"Department of Electrical, Computer, and Systems Engineering, Rensselaer Polytechnic Institute, Troy, NY, 12180-3590, USA","institution_ids":["https://openalex.org/I165799507"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5110451996"],"corresponding_institution_ids":["https://openalex.org/I145897649"],"apc_list":{"value":1115,"currency":"GBP","value_usd":1367},"apc_paid":{"value":1115,"currency":"GBP","value_usd":1367},"fwci":0.7071,"has_fulltext":true,"cited_by_count":2,"citation_normalized_percentile":{"value":0.74734386,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"2024","issue":"1","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9945999979972839,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9854000210762024,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7750080823898315},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6828296780586243},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.6747559905052185},{"id":"https://openalex.org/keywords/phonetics","display_name":"Phonetics","score":0.4972074329853058},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4551633596420288},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.44342318177223206},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.37042778730392456},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.3098875880241394},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.16332119703292847}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7750080823898315},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6828296780586243},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.6747559905052185},{"id":"https://openalex.org/C137584468","wikidata":"https://www.wikidata.org/wiki/Q35395","display_name":"Phonetics","level":2,"score":0.4972074329853058},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4551633596420288},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.44342318177223206},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.37042778730392456},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.3098875880241394},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.16332119703292847},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1186/s13636-024-00361-7","is_oa":true,"landing_page_url":"http://dx.doi.org/10.1186/s13636-024-00361-7","pdf_url":"https://link.springer.com/content/pdf/10.1186/s13636-024-00361-7.pdf","source":{"id":"https://openalex.org/S19605986","display_name":"EURASIP Journal on Audio Speech and Music Processing","issn_l":"1687-4714","issn":["1687-4714","1687-4722"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319965","host_organization_name":"Springer Nature","host_organization_lineage":["https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EURASIP Journal on Audio, Speech, and Music Processing","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:aca1be2657d9409b9fc2a5c900804861","is_oa":true,"landing_page_url":"https://doaj.org/article/aca1be2657d9409b9fc2a5c900804861","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"EURASIP Journal on Audio, Speech, and Music Processing, Vol 2024, Iss 1, Pp 1-8 (2024)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1186/s13636-024-00361-7","is_oa":true,"landing_page_url":"http://dx.doi.org/10.1186/s13636-024-00361-7","pdf_url":"https://link.springer.com/content/pdf/10.1186/s13636-024-00361-7.pdf","source":{"id":"https://openalex.org/S19605986","display_name":"EURASIP Journal on Audio Speech and Music Processing","issn_l":"1687-4714","issn":["1687-4714","1687-4722"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319965","host_organization_name":"Springer Nature","host_organization_lineage":["https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EURASIP Journal on Audio, Speech, and Music Processing","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.7200000286102295,"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10"}],"awards":[{"id":"https://openalex.org/G1660390292","display_name":null,"funder_award_id":"61976236","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2087396116","display_name":null,"funder_award_id":"China","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3317480652","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5994120800","display_name":null,"funder_award_id":"Natural","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4400747285.pdf","grobid_xml":"https://content.openalex.org/works/W4400747285.grobid-xml"},"referenced_works_count":17,"referenced_works":["https://openalex.org/W1494198834","https://openalex.org/W2888541716","https://openalex.org/W2963043696","https://openalex.org/W2963242190","https://openalex.org/W2963292011","https://openalex.org/W2971840980","https://openalex.org/W2984865357","https://openalex.org/W3015585292","https://openalex.org/W3097777922","https://openalex.org/W3120988557","https://openalex.org/W3210277894","https://openalex.org/W3213544594","https://openalex.org/W4225739182","https://openalex.org/W4285603108","https://openalex.org/W4296068994","https://openalex.org/W4296840126","https://openalex.org/W4393973323"],"related_works":["https://openalex.org/W2373696876","https://openalex.org/W2302349196","https://openalex.org/W2038248067","https://openalex.org/W2392602970","https://openalex.org/W2351370781","https://openalex.org/W2372700028","https://openalex.org/W2353456508","https://openalex.org/W2377459180","https://openalex.org/W2367325839","https://openalex.org/W2997567050"],"abstract_inverted_index":{"Abstract":[0],"The":[1,103],"disparities":[2],"in":[3,95,114,137],"phonetics":[4],"and":[5,45,64,86,123],"corpuses":[6],"across":[7],"the":[8,15,52,69,78,81,92,121,131],"three":[9],"major":[10],"dialects":[11],"of":[12,17,80,125,133],"Tibetan":[13,60,65,96,115],"exacerbate":[14],"difficulty":[16],"a":[18],"single":[19],"task":[20],"model":[21,40,82],"for":[22,72],"one":[23],"dialect":[24,61],"to":[25,51,76,83,111,130],"accommodate":[26],"other":[27],"different":[28,55,89],"dialects.":[29,56,90],"To":[30],"address":[31],"this":[32,34],"issue,":[33],"paper":[35],"proposes":[36],"task-diverse":[37,108,126],"meta-learning.":[38],"Our":[39],"can":[41],"acquire":[42],"more":[43],"comprehensive":[44],"robust":[46],"features,":[47],"facilitating":[48],"its":[49],"adaptation":[50],"variations":[53,85],"among":[54,88],"This":[57,119],"study":[58],"uses":[59],"ID":[62],"recognition":[63,67,99,135],"speaker":[66],"as":[68],"source":[70],"tasks":[71,100],"meta-learning,":[73,127],"which":[74],"aims":[75],"augment":[77],"ability":[79],"discriminate":[84],"differences":[87],"Consequently,":[91],"model\u2019s":[93],"performance":[94,113],"multi-dialect":[97,116,138],"speech":[98,117,134],"is":[101],"enhanced.":[102],"experimental":[104],"results":[105],"show":[106],"that":[107],"meta-learning":[109],"leads":[110],"improved":[112],"recognition.":[118],"demonstrates":[120],"effectiveness":[122],"applicability":[124],"thereby":[128],"contributing":[129],"advancement":[132],"techniques":[136],"environments.":[139]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2024,"cited_by_count":1}],"updated_date":"2026-03-22T08:09:32.410652","created_date":"2025-10-10T00:00:00"}
