{"id":"https://openalex.org/W4321015971","doi":"https://doi.org/10.29007/1ppr","title":"Design and Evaluation of a Cross-Lingual ML-based Automatic Speech Recognition System Fine-tuned for the Galician Language","display_name":"Design and Evaluation of a Cross-Lingual ML-based Automatic Speech Recognition System Fine-tuned for the Galician Language","publication_year":2023,"publication_date":"2023-02-16","ids":{"openalex":"https://openalex.org/W4321015971","doi":"https://doi.org/10.29007/1ppr"},"language":"en","primary_location":{"id":"doi:10.29007/1ppr","is_oa":true,"landing_page_url":"https://doi.org/10.29007/1ppr","pdf_url":"https://easychair.org/publications/open/hdqh","source":{"id":"https://openalex.org/S4220650884","display_name":"Kalpa publications in computing","issn_l":"2515-1762","issn":["2515-1762"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Kalpa Publications in Computing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://easychair.org/publications/open/hdqh","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5020925290","display_name":"Iv\u00e1n Froiz-M\u00edguez","orcid":"https://orcid.org/0000-0003-4068-8842"},"institutions":[{"id":"https://openalex.org/I11019714","display_name":"Universidade da Coru\u00f1a","ror":"https://ror.org/01qckj285","country_code":"ES","type":"education","lineage":["https://openalex.org/I11019714"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Iv\u00e1n Froiz-M\u00edguez","raw_affiliation_strings":["Centro de investigaci\u00f3n CITIC, Universidade da Coru\u00f1a, 15071 A Coru\u00f1a, Spain","Department of Computer Engineering, Faculty of Computer Science, Universidade da Coru\u00f1a, 15071 A Coru\u00f1a, Spain"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Centro de investigaci\u00f3n CITIC, Universidade da Coru\u00f1a, 15071 A Coru\u00f1a, Spain","institution_ids":["https://openalex.org/I11019714"]},{"raw_affiliation_string":"Department of Computer Engineering, Faculty of Computer Science, Universidade da Coru\u00f1a, 15071 A Coru\u00f1a, Spain","institution_ids":["https://openalex.org/I11019714"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038858572","display_name":"\u00d3scar Blanco-Novoa","orcid":"https://orcid.org/0000-0002-8608-1088"},"institutions":[{"id":"https://openalex.org/I11019714","display_name":"Universidade da Coru\u00f1a","ror":"https://ror.org/01qckj285","country_code":"ES","type":"education","lineage":["https://openalex.org/I11019714"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"\u00d3scar Blanco-Novoa","raw_affiliation_strings":["Centro de investigaci\u00f3n CITIC, Universidade da Coru\u00f1a, 15071 A Coru\u00f1a, Spain","Department of Computer Engineering, Faculty of Computer Science, Universidade da Coru\u00f1a, 15071 A Coru\u00f1a, Spain"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Centro de investigaci\u00f3n CITIC, Universidade da Coru\u00f1a, 15071 A Coru\u00f1a, Spain","institution_ids":["https://openalex.org/I11019714"]},{"raw_affiliation_string":"Department of Computer Engineering, Faculty of Computer Science, Universidade da Coru\u00f1a, 15071 A Coru\u00f1a, Spain","institution_ids":["https://openalex.org/I11019714"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090443440","display_name":"Paula Fraga\u2010Lamas","orcid":"https://orcid.org/0000-0002-4991-6808"},"institutions":[{"id":"https://openalex.org/I11019714","display_name":"Universidade da Coru\u00f1a","ror":"https://ror.org/01qckj285","country_code":"ES","type":"education","lineage":["https://openalex.org/I11019714"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Paula Fraga-Lamas","raw_affiliation_strings":["Department of Computer Engineering, Faculty of Computer Science, Universidade da Coru\u00f1a, 15071 A Coru\u00f1a, Spain","Centro de investigaci\u00f3n CITIC, Universidade da Coru\u00f1a, 15071 A Coru\u00f1a, Spain"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Engineering, Faculty of Computer Science, Universidade da Coru\u00f1a, 15071 A Coru\u00f1a, Spain","institution_ids":["https://openalex.org/I11019714"]},{"raw_affiliation_string":"Centro de investigaci\u00f3n CITIC, Universidade da Coru\u00f1a, 15071 A Coru\u00f1a, Spain","institution_ids":["https://openalex.org/I11019714"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075104449","display_name":"Diego Fustes","orcid":null},"institutions":[{"id":"https://openalex.org/I11019714","display_name":"Universidade da Coru\u00f1a","ror":"https://ror.org/01qckj285","country_code":"ES","type":"education","lineage":["https://openalex.org/I11019714"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Diego Fustes","raw_affiliation_strings":["Centro de investigaci\u00f3n CITIC, Universidade da Coru\u00f1a, 15071 A Coru\u00f1a, Spain"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Centro de investigaci\u00f3n CITIC, Universidade da Coru\u00f1a, 15071 A Coru\u00f1a, Spain","institution_ids":["https://openalex.org/I11019714"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009521856","display_name":"Jos\u00e9 Carlos Dafonte V\u00e1zquez","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jos\u00e9 Carlos Dafonte V\u00e1zquez","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000477332","display_name":"Javier Pereira","orcid":"https://orcid.org/0000-0001-9328-0723"},"institutions":[{"id":"https://openalex.org/I11019714","display_name":"Universidade da Coru\u00f1a","ror":"https://ror.org/01qckj285","country_code":"ES","type":"education","lineage":["https://openalex.org/I11019714"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Javier Pereira","raw_affiliation_strings":["Centro de investigaci\u00f3n CITIC, Universidade da Coru\u00f1a, 15071 A Coru\u00f1a, Spain"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Centro de investigaci\u00f3n CITIC, Universidade da Coru\u00f1a, 15071 A Coru\u00f1a, Spain","institution_ids":["https://openalex.org/I11019714"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5081216987","display_name":"Tiago M. Fern\u00e1ndez\u2010Caram\u00e9s","orcid":"https://orcid.org/0000-0003-2179-5917"},"institutions":[{"id":"https://openalex.org/I11019714","display_name":"Universidade da Coru\u00f1a","ror":"https://ror.org/01qckj285","country_code":"ES","type":"education","lineage":["https://openalex.org/I11019714"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Tiago M. Fern\u00e1ndez-Caram\u00e9s","raw_affiliation_strings":["Centro de investigaci\u00f3n CITIC, Universidade da Coru\u00f1a, 15071 A Coru\u00f1a, Spain","Department of Computer Engineering, Faculty of Computer Science, Universidade da Coru\u00f1a, 15071 A Coru\u00f1a, Spain"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Centro de investigaci\u00f3n CITIC, Universidade da Coru\u00f1a, 15071 A Coru\u00f1a, Spain","institution_ids":["https://openalex.org/I11019714"]},{"raw_affiliation_string":"Department of Computer Engineering, Faculty of Computer Science, Universidade da Coru\u00f1a, 15071 A Coru\u00f1a, Spain","institution_ids":["https://openalex.org/I11019714"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.3263,"has_fulltext":true,"cited_by_count":2,"citation_normalized_percentile":{"value":0.62167038,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":"14","issue":null,"first_page":"152","last_page":"147"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9962000250816345,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9947999715805054,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8307349681854248},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5873188972473145},{"id":"https://openalex.org/keywords/word-error-rate","display_name":"Word error rate","score":0.580082356929779},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.5355377793312073},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.5136777758598328},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.49894094467163086},{"id":"https://openalex.org/keywords/human-language","display_name":"Human language","score":0.44585490226745605},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.44193243980407715},{"id":"https://openalex.org/keywords/dependency","display_name":"Dependency (UML)","score":0.4317755699157715},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.4114450216293335}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8307349681854248},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5873188972473145},{"id":"https://openalex.org/C40969351","wikidata":"https://www.wikidata.org/wiki/Q3516228","display_name":"Word error rate","level":2,"score":0.580082356929779},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.5355377793312073},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.5136777758598328},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.49894094467163086},{"id":"https://openalex.org/C2993724205","wikidata":"https://www.wikidata.org/wiki/Q315","display_name":"Human language","level":2,"score":0.44585490226745605},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.44193243980407715},{"id":"https://openalex.org/C19768560","wikidata":"https://www.wikidata.org/wiki/Q320727","display_name":"Dependency (UML)","level":2,"score":0.4317755699157715},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.4114450216293335},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.29007/1ppr","is_oa":true,"landing_page_url":"https://doi.org/10.29007/1ppr","pdf_url":"https://easychair.org/publications/open/hdqh","source":{"id":"https://openalex.org/S4220650884","display_name":"Kalpa publications in computing","issn_l":"2515-1762","issn":["2515-1762"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Kalpa Publications in Computing","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.29007/1ppr","is_oa":true,"landing_page_url":"https://doi.org/10.29007/1ppr","pdf_url":"https://easychair.org/publications/open/hdqh","source":{"id":"https://openalex.org/S4220650884","display_name":"Kalpa publications in computing","issn_l":"2515-1762","issn":["2515-1762"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Kalpa Publications in Computing","raw_type":"proceedings-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.6399999856948853,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4321015971.pdf"},"referenced_works_count":7,"referenced_works":["https://openalex.org/W2134800885","https://openalex.org/W2922073769","https://openalex.org/W2954460650","https://openalex.org/W3030374183","https://openalex.org/W3036601975","https://openalex.org/W3204917342","https://openalex.org/W6760602923"],"related_works":["https://openalex.org/W4297849468","https://openalex.org/W2797876554","https://openalex.org/W2594897229","https://openalex.org/W2151348424","https://openalex.org/W4221142855","https://openalex.org/W2050138804","https://openalex.org/W2944691285","https://openalex.org/W4290708361","https://openalex.org/W2129812225","https://openalex.org/W26527944"],"abstract_inverted_index":{"In":[0],"recent":[1],"years":[2],"Machine":[3],"Learning":[4],"(ML)":[5],"strategies":[6,63],"have":[7],"proven":[8],"to":[9,12,24,48,97,111,115,138,160],"be":[10,112],"useful":[11],"automate":[13],"numerous":[14],"classification":[15],"and":[16,157],"pattern":[17],"detection":[18],"tasks":[19],"in":[20,30,87,102,127],"diverse":[21],"fields":[22,35],"thanks":[23,137],"the":[25,37,84,91,116,132,139,158,163,174,231],"increase":[26],"of":[27,33,83,94,106,141,154,169,226],"computational":[28],"power":[29],"hardware.":[31],"One":[32],"such":[34],"is":[36,90,108,202,219],"Automatic":[38],"Speech":[39],"Recog-":[40],"nition":[41],"(ASR),":[42],"which":[43,208],"can":[44,64,176],"use":[45,140],"ML":[46,62],"architectures":[47,89,182],"transcribe":[49],"human":[50,77,120],"speech":[51,224],"into":[52],"readable":[53],"text.":[54],"The":[55],"Word":[56],"Error":[57],"Rate":[58],"(WER)":[59],"obtained":[60,164],"with":[61,147,166,189,221],"become":[65],"relatively":[66,236],"low":[67,100,237],"while":[68],"providing":[69],"quick":[70],"responses,":[71],"reaching":[72],"accuracy":[73],"levels":[74],"that":[75,179,201],"approach":[76],"tran-":[78],"scription":[79],"accuracy.":[80],"However,":[81],"one":[82],"main":[85],"drawbacks":[86],"traditional":[88],"high":[92,117],"demand":[93],"transcribed":[95],"data":[96,107],"obtain":[98,177],"a":[99,123,142,170,206,217,222,235],"WER":[101,238],"training.":[103],"This":[104,191],"kind":[105],"particularly":[109],"hard":[110],"achieved":[113],"due":[114],"dependency":[118],"on":[119,150,198],"processing.":[121],"Luckily,":[122],"new":[124],"framework":[125,175],"proposed":[126],"2020":[128],"(wav2vec2),":[129],"considerably":[130],"reduces":[131],"need":[133],"for":[134,204],"audio":[135,187,213],"labelling":[136],"Convolutional":[143],"Neural":[144],"Network":[145],"(CNN)":[146],"self-supervised":[148],"training":[149],"cross-lingual":[151],"unlabelled":[152],"audios":[153,168],"multiple":[155],"languages":[156],"ability":[159],"fine-":[161],"tune":[162],"results":[165,178],"labelled":[167],"specific":[171],"language.":[172],"Thus,":[173],"outperform":[180],"previous":[181],"by":[183],"using":[184],"much":[185],"smaller":[186],"datasets":[188,214],"transcriptions.":[190],"paper":[192],"presents":[193],"an":[194],"ASR":[195],"system":[196,218],"based":[197],"wav2vec":[199],"2.0":[200],"fine-tuned":[203],"Galician,":[205],"language":[207],"currently":[209],"only":[210],"has":[211],"small":[212],"available.":[215],"Such":[216],"evaluated":[220],"spontaneous":[223],"dataset":[225],"approximately":[227],"1":[228],"hour":[229],"from":[230],"Galicia":[232],"Parliament,":[233],"showing":[234],"(18.61%).":[239]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
