{"id":"https://openalex.org/W7130414084","doi":"https://doi.org/10.1109/o-cocosda68185.2025.11385226","title":"A Gop-Based Automatic Pronunciation Scoring System for Taiwanese Hakka Using Transformer Regression Models","display_name":"A Gop-Based Automatic Pronunciation Scoring System for Taiwanese Hakka Using Transformer Regression Models","publication_year":2025,"publication_date":"2025-11-12","ids":{"openalex":"https://openalex.org/W7130414084","doi":"https://doi.org/10.1109/o-cocosda68185.2025.11385226"},"language":null,"primary_location":{"id":"doi:10.1109/o-cocosda68185.2025.11385226","is_oa":false,"landing_page_url":"https://doi.org/10.1109/o-cocosda68185.2025.11385226","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 28th Conference of the Oriental COCOSDA International Committee for the Co-ordination and Standardisation of Speech Databases and Assessment Techniques (O-COCOSDA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5112612990","display_name":"Yi\u2010Chin Huang","orcid":null},"institutions":[{"id":"https://openalex.org/I1309796872","display_name":"National Pingtung University","ror":"https://ror.org/03z698x91","country_code":"TW","type":"education","lineage":["https://openalex.org/I1309796872"]}],"countries":["TW"],"is_corresponding":true,"raw_author_name":"Yi-Chin Huang","raw_affiliation_strings":["National Pingtung University,PingTung,Taiwan"],"affiliations":[{"raw_affiliation_string":"National Pingtung University,PingTung,Taiwan","institution_ids":["https://openalex.org/I1309796872"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054690291","display_name":"Y. J. Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I1309796872","display_name":"National Pingtung University","ror":"https://ror.org/03z698x91","country_code":"TW","type":"education","lineage":["https://openalex.org/I1309796872"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Yu-Heng Chen","raw_affiliation_strings":["National Pingtung University,PingTung,Taiwan"],"affiliations":[{"raw_affiliation_string":"National Pingtung University,PingTung,Taiwan","institution_ids":["https://openalex.org/I1309796872"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111415477","display_name":"Chih-Chung Kuo","orcid":null},"institutions":[{"id":"https://openalex.org/I148366613","display_name":"National Yang Ming Chiao Tung University","ror":"https://ror.org/00se2k293","country_code":"TW","type":"education","lineage":["https://openalex.org/I148366613"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Chih-Chung Kuo","raw_affiliation_strings":["National Yang Ming Chiao Tung University,HsinChu,Taiwan"],"affiliations":[{"raw_affiliation_string":"National Yang Ming Chiao Tung University,HsinChu,Taiwan","institution_ids":["https://openalex.org/I148366613"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050297067","display_name":"Chao-Shih Huang","orcid":null},"institutions":[{"id":"https://openalex.org/I148366613","display_name":"National Yang Ming Chiao Tung University","ror":"https://ror.org/00se2k293","country_code":"TW","type":"education","lineage":["https://openalex.org/I148366613"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Chao-Shih Huang","raw_affiliation_strings":["National Yang Ming Chiao Tung University,HsinChu,Taiwan"],"affiliations":[{"raw_affiliation_string":"National Yang Ming Chiao Tung University,HsinChu,Taiwan","institution_ids":["https://openalex.org/I148366613"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5126331085","display_name":"Yuan-Fu Liao","orcid":null},"institutions":[{"id":"https://openalex.org/I148366613","display_name":"National Yang Ming Chiao Tung University","ror":"https://ror.org/00se2k293","country_code":"TW","type":"education","lineage":["https://openalex.org/I148366613"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Yuan-Fu Liao","raw_affiliation_strings":["National Yang Ming Chiao Tung University,HsinChu,Taiwan"],"affiliations":[{"raw_affiliation_string":"National Yang Ming Chiao Tung University,HsinChu,Taiwan","institution_ids":["https://openalex.org/I148366613"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5112612990"],"corresponding_institution_ids":["https://openalex.org/I1309796872"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.85135672,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.7376999855041504,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.7376999855041504,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10403","display_name":"Phonetics and Phonology Research","score":0.11890000104904175,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T13194","display_name":"ICT in Developing Communities","score":0.03819999843835831,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.6331999897956848},{"id":"https://openalex.org/keywords/wilcoxon-signed-rank-test","display_name":"Wilcoxon signed-rank test","score":0.6255999803543091},{"id":"https://openalex.org/keywords/scoring-system","display_name":"Scoring system","score":0.5867999792098999},{"id":"https://openalex.org/keywords/pronunciation","display_name":"Pronunciation","score":0.5054000020027161},{"id":"https://openalex.org/keywords/calibration","display_name":"Calibration","score":0.47679999470710754},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4009999930858612},{"id":"https://openalex.org/keywords/linear-regression","display_name":"Linear regression","score":0.3912999927997589},{"id":"https://openalex.org/keywords/mean-squared-error","display_name":"Mean squared error","score":0.385699987411499}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6341000199317932},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.6331999897956848},{"id":"https://openalex.org/C206041023","wikidata":"https://www.wikidata.org/wiki/Q1751970","display_name":"Wilcoxon signed-rank test","level":3,"score":0.6255999803543091},{"id":"https://openalex.org/C2984538763","wikidata":"https://www.wikidata.org/wiki/Q2260590","display_name":"Scoring system","level":2,"score":0.5867999792098999},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5716000199317932},{"id":"https://openalex.org/C2780844864","wikidata":"https://www.wikidata.org/wiki/Q184377","display_name":"Pronunciation","level":2,"score":0.5054000020027161},{"id":"https://openalex.org/C165838908","wikidata":"https://www.wikidata.org/wiki/Q736777","display_name":"Calibration","level":2,"score":0.47679999470710754},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.43380001187324524},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4009999930858612},{"id":"https://openalex.org/C48921125","wikidata":"https://www.wikidata.org/wiki/Q10861030","display_name":"Linear regression","level":2,"score":0.3912999927997589},{"id":"https://openalex.org/C139945424","wikidata":"https://www.wikidata.org/wiki/Q1940696","display_name":"Mean squared error","level":2,"score":0.385699987411499},{"id":"https://openalex.org/C83546350","wikidata":"https://www.wikidata.org/wiki/Q1139051","display_name":"Regression","level":2,"score":0.36250001192092896},{"id":"https://openalex.org/C163175372","wikidata":"https://www.wikidata.org/wiki/Q3339222","display_name":"Linear model","level":2,"score":0.362199991941452},{"id":"https://openalex.org/C152877465","wikidata":"https://www.wikidata.org/wiki/Q208042","display_name":"Regression analysis","level":2,"score":0.3361000120639801},{"id":"https://openalex.org/C167085575","wikidata":"https://www.wikidata.org/wiki/Q6803654","display_name":"Mean squared prediction error","level":2,"score":0.3163999915122986},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.29660001397132874},{"id":"https://openalex.org/C131109320","wikidata":"https://www.wikidata.org/wiki/Q581012","display_name":"Linear prediction","level":2,"score":0.2851000130176544},{"id":"https://openalex.org/C83282275","wikidata":"https://www.wikidata.org/wiki/Q7435350","display_name":"Scoring algorithm","level":2,"score":0.2800999879837036},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2784999907016754},{"id":"https://openalex.org/C136886441","wikidata":"https://www.wikidata.org/wiki/Q926129","display_name":"Normalization (sociology)","level":2,"score":0.2754000127315521},{"id":"https://openalex.org/C111219384","wikidata":"https://www.wikidata.org/wiki/Q6954384","display_name":"NIST","level":2,"score":0.26170000433921814},{"id":"https://openalex.org/C175291020","wikidata":"https://www.wikidata.org/wiki/Q1156822","display_name":"Offset (computer science)","level":2,"score":0.25589999556541443},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.2540000081062317}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/o-cocosda68185.2025.11385226","is_oa":false,"landing_page_url":"https://doi.org/10.1109/o-cocosda68185.2025.11385226","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 28th Conference of the Oriental COCOSDA International Committee for the Co-ordination and Standardisation of Speech Databases and Assessment Techniques (O-COCOSDA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.8440479636192322}],"awards":[{"id":"https://openalex.org/G4059018954","display_name":null,"funder_award_id":"111-2221-E-A49-190MY3,113-2221-E-153-005","funder_id":"https://openalex.org/F2461203286","funder_display_name":"National Science and Technology Council"}],"funders":[{"id":"https://openalex.org/F2461203286","display_name":"National Science and Technology Council","ror":"https://ror.org/02kv4zf79"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":16,"referenced_works":["https://openalex.org/W1999114171","https://openalex.org/W2091856355","https://openalex.org/W2139008940","https://openalex.org/W2397168380","https://openalex.org/W2398741870","https://openalex.org/W2401896499","https://openalex.org/W2509051157","https://openalex.org/W3015231007","https://openalex.org/W3096674206","https://openalex.org/W3134482008","https://openalex.org/W3196525293","https://openalex.org/W3197816268","https://openalex.org/W3197938691","https://openalex.org/W4224928163","https://openalex.org/W4392902938","https://openalex.org/W4393406219"],"related_works":[],"abstract_inverted_index":{"We":[0],"present":[1],"a":[2,11,42,67,72,77],"GOP-based":[3],"pronunciation":[4],"scoring":[5,30],"system":[6,81],"for":[7,93],"Taiwanese":[8],"Hakka":[9],"using":[10],"lightweight":[12],"Transformer":[13],"regressor":[14],"over":[15],"fused":[16],"LPP/LPR":[17],"features.":[18],"Trained":[19],"on":[20,41],"<tex":[21],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[22],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$\\sim":[23],"20":[24],"\\mathrm{k}$</tex>":[25],"expert-rated":[26],"utterances,":[27],"our":[28],"Transformer-based":[29],"model":[31,74],"attains":[32],"MSE":[33],"0.44":[34],"/":[35,38],"MAE":[36,57],"0.51":[37],"PCC":[39,62],"0.80":[40],"speaker-independent":[43],"test":[44],"set,":[45],"outperforming":[46],"linear":[47],"and":[48,60,76],"MLP":[49],"baselines.":[50],"A":[51],"classspecific":[52],"bias":[53,78],"calibration":[54],"further":[55],"reduces":[56],"to":[58,63],"0.41":[59],"raises":[61],"0.89,":[64],"confirmed":[65],"by":[66],"Wilcoxon":[68],"signed-rank":[69],"test.":[70],"With":[71],"single":[73],"pass":[75],"calibration,":[79],"the":[80],"reaches":[82],"near":[83],"teacher-level":[84],"agreement":[85],"while":[86],"keeping":[87],"runtime":[88],"minimal,":[89],"making":[90],"it":[91],"practical":[92],"CALL":[94],"in":[95],"low-resource":[96],"settings.":[97]},"counts_by_year":[],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2026-02-19T00:00:00"}
