{"id":"https://openalex.org/W4319862413","doi":"https://doi.org/10.1109/slt54892.2023.10023307","title":"Automatic Prediction of Intelligibility of Words and Phonemes Produced Orally by Japanese Learners of English","display_name":"Automatic Prediction of Intelligibility of Words and Phonemes Produced Orally by Japanese Learners of English","publication_year":2023,"publication_date":"2023-01-09","ids":{"openalex":"https://openalex.org/W4319862413","doi":"https://doi.org/10.1109/slt54892.2023.10023307"},"language":"en","primary_location":{"id":"doi:10.1109/slt54892.2023.10023307","is_oa":false,"landing_page_url":"https://doi.org/10.1109/slt54892.2023.10023307","pdf_url":null,"source":{"id":"https://openalex.org/S4363605953","display_name":"2022 IEEE Spoken Language Technology Workshop (SLT)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE Spoken Language Technology Workshop (SLT)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5059375680","display_name":"Chuanbo Zhu","orcid":"https://orcid.org/0000-0002-6441-1162"},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Chuanbo Zhu","raw_affiliation_strings":["Graduate School of Engineering, The University of Tokyo"],"affiliations":[{"raw_affiliation_string":"Graduate School of Engineering, The University of Tokyo","institution_ids":["https://openalex.org/I74801974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009308374","display_name":"Takuya Kunihara","orcid":null},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Takuya Kunihara","raw_affiliation_strings":["Graduate School of Engineering, The University of Tokyo"],"affiliations":[{"raw_affiliation_string":"Graduate School of Engineering, The University of Tokyo","institution_ids":["https://openalex.org/I74801974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010841595","display_name":"Daisuke Saito","orcid":"https://orcid.org/0000-0003-3200-579X"},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Daisuke Saito","raw_affiliation_strings":["Graduate School of Engineering, The University of Tokyo"],"affiliations":[{"raw_affiliation_string":"Graduate School of Engineering, The University of Tokyo","institution_ids":["https://openalex.org/I74801974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041213266","display_name":"Nobuaki Minematsu","orcid":"https://orcid.org/0000-0002-8778-9555"},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Nobuaki Minematsu","raw_affiliation_strings":["Graduate School of Engineering, The University of Tokyo"],"affiliations":[{"raw_affiliation_string":"Graduate School of Engineering, The University of Tokyo","institution_ids":["https://openalex.org/I74801974"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5056215234","display_name":"Noriko Nakanishi","orcid":null},"institutions":[{"id":"https://openalex.org/I27650515","display_name":"Kobe Gakuin University","ror":"https://ror.org/018v0zv10","country_code":"JP","type":"education","lineage":["https://openalex.org/I27650515"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Noriko Nakanishi","raw_affiliation_strings":["Kobe Gakuin University,Faculty of Global Communication","Faculty of Global Communication, Kobe Gakuin University"],"affiliations":[{"raw_affiliation_string":"Kobe Gakuin University,Faculty of Global Communication","institution_ids":["https://openalex.org/I27650515"]},{"raw_affiliation_string":"Faculty of Global Communication, Kobe Gakuin University","institution_ids":["https://openalex.org/I27650515"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5059375680"],"corresponding_institution_ids":["https://openalex.org/I74801974"],"apc_list":null,"apc_paid":null,"fwci":0.4514,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.52993233,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"1029","last_page":"1036"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10403","display_name":"Phonetics and Phonology Research","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/intelligibility","display_name":"Intelligibility (philosophy)","score":0.8795177936553955},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7435528039932251},{"id":"https://openalex.org/keywords/dictation","display_name":"Dictation","score":0.7078237533569336},{"id":"https://openalex.org/keywords/active-listening","display_name":"Active listening","score":0.6570793390274048},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6299042105674744},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5088996887207031},{"id":"https://openalex.org/keywords/correctness","display_name":"Correctness","score":0.4706776738166809},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.4647940993309021},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.42865562438964844},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.422462522983551},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.22670435905456543},{"id":"https://openalex.org/keywords/communication","display_name":"Communication","score":0.10726672410964966}],"concepts":[{"id":"https://openalex.org/C60048801","wikidata":"https://www.wikidata.org/wiki/Q1433889","display_name":"Intelligibility (philosophy)","level":2,"score":0.8795177936553955},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7435528039932251},{"id":"https://openalex.org/C2779077324","wikidata":"https://www.wikidata.org/wiki/Q1087138","display_name":"Dictation","level":2,"score":0.7078237533569336},{"id":"https://openalex.org/C177291462","wikidata":"https://www.wikidata.org/wiki/Q423038","display_name":"Active listening","level":2,"score":0.6570793390274048},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6299042105674744},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5088996887207031},{"id":"https://openalex.org/C55439883","wikidata":"https://www.wikidata.org/wiki/Q360812","display_name":"Correctness","level":2,"score":0.4706776738166809},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.4647940993309021},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.42865562438964844},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.422462522983551},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.22670435905456543},{"id":"https://openalex.org/C46312422","wikidata":"https://www.wikidata.org/wiki/Q11024","display_name":"Communication","level":1,"score":0.10726672410964966},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/slt54892.2023.10023307","is_oa":false,"landing_page_url":"https://doi.org/10.1109/slt54892.2023.10023307","pdf_url":null,"source":{"id":"https://openalex.org/S4363605953","display_name":"2022 IEEE Spoken Language Technology Workshop (SLT)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE Spoken Language Technology Workshop (SLT)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.800000011920929,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":24,"referenced_works":["https://openalex.org/W1528457303","https://openalex.org/W2016381774","https://openalex.org/W2141720691","https://openalex.org/W2168473804","https://openalex.org/W2294870026","https://openalex.org/W2395066838","https://openalex.org/W2407314578","https://openalex.org/W2795877574","https://openalex.org/W2886359708","https://openalex.org/W2888973864","https://openalex.org/W2896457183","https://openalex.org/W2904091155","https://openalex.org/W2939437245","https://openalex.org/W2970641574","https://openalex.org/W3082212896","https://openalex.org/W3096875076","https://openalex.org/W3171839429","https://openalex.org/W3191382312","https://openalex.org/W4210506357","https://openalex.org/W4239690503","https://openalex.org/W4296068601","https://openalex.org/W4297841614","https://openalex.org/W6631362777","https://openalex.org/W6755207826"],"related_works":["https://openalex.org/W1517743118","https://openalex.org/W2365918773","https://openalex.org/W2363881323","https://openalex.org/W4323363096","https://openalex.org/W2115497217","https://openalex.org/W1989181678","https://openalex.org/W2126233554","https://openalex.org/W1561310868","https://openalex.org/W2159515240","https://openalex.org/W1563618553"],"abstract_inverted_index":{"The":[0],"practical":[1],"goal":[2],"for":[3,43],"language":[4,112,120,200],"learning":[5],"is":[6,52,137],"smooth":[7],"communication":[8],"with":[9,78,95,110,130],"others,":[10],"and":[11,49,63,148,162],"many":[12],"teachers":[13],"have":[14,198],"a":[15,75,83,96,103,133,165],"strong":[16],"focus":[17],"on":[18,118],"measurement":[19],"of":[20,29,35,55,57,61,74,144,159,164],"not":[21,38],"accentedness":[22],"but":[23],"intelligibility,":[24],"often":[25],"regarded":[26],"as":[27,47],"correctness":[28],"actual":[30],"understanding.":[31],"However,":[32],"automatic":[33],"prediction":[34],"intelligibility":[36,79,91,116,143,160],"has":[37,178],"been":[39],"well":[40,195],"developed":[41],"especially":[42],"smaller":[44],"units":[45],"such":[46],"words":[48,147],"phonemes.":[50],"This":[51],"mainly":[53],"because":[54],"difficulty":[56],"measuring":[58],"while-listening":[59],"behaviors":[60],"listeners,":[62],"thus":[64],"it":[65],"was":[66],"difficult":[67],"to":[68,81,101,139,168],"build":[69],"an":[70],"L2":[71,151],"speech":[72],"corpus":[73,106],"sufficient":[76],"size":[77],"annotation":[80],"train":[82],"network-based":[84],"predictor.":[85],"In":[86],"this":[87,131],"paper,":[88],"we":[89],"annotate":[90],"using":[92],"oral":[93],"dictation":[94],"small":[97],"delay,":[98],"i.e.,":[99,157],"shadowing,":[100],"collect":[102],"large":[104],"enough":[105],"from":[107],"two":[108,192],"raters":[109,193],"different":[111,199],"backgrounds.":[113],"Since":[114],"perceived":[115],"depends":[117],"their":[119],"background,":[121],"inter-rater":[122],"difference":[123],"should":[124],"be":[125,169],"taken":[126],"into":[127],"account.":[128],"Therefore":[129],"corpus,":[132],"multi-rater":[134],"neural":[135],"model":[136,177,188],"built":[138],"predict":[140],"each":[141],"rater's":[142],"the":[145,191],"individual":[146],"phonemes":[149],"in":[150],"speech.":[152],"Two":[153],"tasks":[154],"are":[155],"examined,":[156],"regression":[158],"scores":[161,181],"classification":[163],"given":[166],"segment":[167],"intelligible":[170],"or":[171],"not.":[172],"Results":[173],"show":[174],"that":[175,186],"our":[176,187],"higher":[179],"F1":[180],"than":[182],"intra-rater":[183],"agreements,":[184],"indicating":[185],"can":[189],"simulate":[190],"accurately":[194],"although":[196],"they":[197],"background.":[201]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
