{"id":"https://openalex.org/W7144084644","doi":"https://doi.org/10.1016/j.wocn.2026.101495","title":"A new kid on the block: Distributional semantics predicts the word-specific tone signatures of monosyllabic words in conversational Taiwan Mandarin speech","display_name":"A new kid on the block: Distributional semantics predicts the word-specific tone signatures of monosyllabic words in conversational Taiwan Mandarin speech","publication_year":2026,"publication_date":"2026-03-31","ids":{"openalex":"https://openalex.org/W7144084644","doi":"https://doi.org/10.1016/j.wocn.2026.101495"},"language":"en","primary_location":{"id":"doi:10.1016/j.wocn.2026.101495","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.wocn.2026.101495","pdf_url":null,"source":{"id":"https://openalex.org/S42504509","display_name":"Journal of Phonetics","issn_l":"0095-4470","issn":["0095-4470","1095-8576"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Phonetics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://doi.org/10.1016/j.wocn.2026.101495","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5110220606","display_name":"Xiaoyun Jin","orcid":null},"institutions":[{"id":"https://openalex.org/I8087733","display_name":"University of T\u00fcbingen","ror":"https://ror.org/03a1kwz48","country_code":"DE","type":"education","lineage":["https://openalex.org/I8087733"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Xiaoyun Jin","raw_affiliation_strings":["Quantitative Linguistics, Eberhard Karls Universit\u00e4t T\u00fcbingen, 72074 T\u00fcbingen, Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Quantitative Linguistics, Eberhard Karls Universit\u00e4t T\u00fcbingen, 72074 T\u00fcbingen, Germany","institution_ids":["https://openalex.org/I8087733"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091677603","display_name":"Mirjam Ernestus","orcid":"https://orcid.org/0000-0002-1853-0750"},"institutions":[{"id":"https://openalex.org/I145872427","display_name":"Radboud University Nijmegen","ror":"https://ror.org/016xsfp80","country_code":"NL","type":"education","lineage":["https://openalex.org/I145872427"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Mirjam Ernestus","raw_affiliation_strings":["Center for Language Studies, Radboud University, 6525 HT Nijmegen, The Netherlands"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Center for Language Studies, Radboud University, 6525 HT Nijmegen, The Netherlands","institution_ids":["https://openalex.org/I145872427"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5131025922","display_name":"R. Harald Baayen","orcid":null},"institutions":[{"id":"https://openalex.org/I8087733","display_name":"University of T\u00fcbingen","ror":"https://ror.org/03a1kwz48","country_code":"DE","type":"education","lineage":["https://openalex.org/I8087733"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"R. Harald Baayen","raw_affiliation_strings":["Quantitative Linguistics, Eberhard Karls Universit\u00e4t T\u00fcbingen, 72074 T\u00fcbingen, Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Quantitative Linguistics, Eberhard Karls Universit\u00e4t T\u00fcbingen, 72074 T\u00fcbingen, Germany","institution_ids":["https://openalex.org/I8087733"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5110220606"],"corresponding_institution_ids":["https://openalex.org/I8087733"],"apc_list":{"value":3470,"currency":"USD","value_usd":3470},"apc_paid":{"value":3470,"currency":"USD","value_usd":3470},"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.65424281,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"116","issue":null,"first_page":"101495","last_page":"101495"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10403","display_name":"Phonetics and Phonology Research","score":0.9857000112533569,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10403","display_name":"Phonetics and Phonology Research","score":0.9857000112533569,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11640","display_name":"Linguistic Variation and Morphology","score":0.003100000089034438,"subfield":{"id":"https://openalex.org/subfields/3310","display_name":"Linguistics and Language"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10788","display_name":"Neuroscience and Music Perception","score":0.00279999990016222,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/homophone","display_name":"Homophone","score":0.7843000292778015},{"id":"https://openalex.org/keywords/mandarin-chinese","display_name":"Mandarin Chinese","score":0.6823999881744385},{"id":"https://openalex.org/keywords/realization","display_name":"Realization (probability)","score":0.618399977684021},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.5493000149726868},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.5113999843597412},{"id":"https://openalex.org/keywords/lexicon","display_name":"Lexicon","score":0.4690000116825104},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.40139999985694885},{"id":"https://openalex.org/keywords/utterance","display_name":"Utterance","score":0.40119999647140503}],"concepts":[{"id":"https://openalex.org/C160253069","wikidata":"https://www.wikidata.org/wiki/Q221079","display_name":"Homophone","level":2,"score":0.7843000292778015},{"id":"https://openalex.org/C138954614","wikidata":"https://www.wikidata.org/wiki/Q9192","display_name":"Mandarin Chinese","level":2,"score":0.6823999881744385},{"id":"https://openalex.org/C2781089630","wikidata":"https://www.wikidata.org/wiki/Q21856745","display_name":"Realization (probability)","level":2,"score":0.618399977684021},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5595999956130981},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.5493000149726868},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5450999736785889},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.5113999843597412},{"id":"https://openalex.org/C2778121359","wikidata":"https://www.wikidata.org/wiki/Q8096","display_name":"Lexicon","level":2,"score":0.4690000116825104},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.40139999985694885},{"id":"https://openalex.org/C2775852435","wikidata":"https://www.wikidata.org/wiki/Q258403","display_name":"Utterance","level":2,"score":0.40119999647140503},{"id":"https://openalex.org/C148934300","wikidata":"https://www.wikidata.org/wiki/Q40998","display_name":"Phonology","level":2,"score":0.383899986743927},{"id":"https://openalex.org/C2780583480","wikidata":"https://www.wikidata.org/wiki/Q1366327","display_name":"Tone (literature)","level":2,"score":0.3808000087738037},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.37940001487731934},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.35899999737739563},{"id":"https://openalex.org/C2776502983","wikidata":"https://www.wikidata.org/wiki/Q690182","display_name":"Contrast (vision)","level":2,"score":0.34529998898506165},{"id":"https://openalex.org/C2777895490","wikidata":"https://www.wikidata.org/wiki/Q7198848","display_name":"Pitch contour","level":2,"score":0.34389999508857727},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.3425999879837036},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.334199994802475},{"id":"https://openalex.org/C2779581591","wikidata":"https://www.wikidata.org/wiki/Q36244","display_name":"Vowel","level":2,"score":0.3172999918460846},{"id":"https://openalex.org/C165297611","wikidata":"https://www.wikidata.org/wiki/Q43249","display_name":"Morpheme","level":2,"score":0.3125999867916107},{"id":"https://openalex.org/C142853389","wikidata":"https://www.wikidata.org/wiki/Q744778","display_name":"Association (psychology)","level":2,"score":0.25870001316070557},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.2547000050544739},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2540000081062317}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1016/j.wocn.2026.101495","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.wocn.2026.101495","pdf_url":null,"source":{"id":"https://openalex.org/S42504509","display_name":"Journal of Phonetics","issn_l":"0095-4470","issn":["0095-4470","1095-8576"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Phonetics","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1016/j.wocn.2026.101495","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.wocn.2026.101495","pdf_url":null,"source":{"id":"https://openalex.org/S42504509","display_name":"Journal of Phonetics","issn_l":"0095-4470","issn":["0095-4470","1095-8576"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Phonetics","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","score":0.6347189545631409,"display_name":"Reduced inequalities"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320334678","display_name":"European Research Council","ror":"https://ror.org/0472cxd90"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":46,"referenced_works":["https://openalex.org/W1550323663","https://openalex.org/W1590424750","https://openalex.org/W1922189308","https://openalex.org/W1966208681","https://openalex.org/W1971415599","https://openalex.org/W1979633237","https://openalex.org/W1980884156","https://openalex.org/W1990294283","https://openalex.org/W1993533823","https://openalex.org/W2017354652","https://openalex.org/W2024178270","https://openalex.org/W2038784064","https://openalex.org/W2047138445","https://openalex.org/W2058518981","https://openalex.org/W2062455228","https://openalex.org/W2079833689","https://openalex.org/W2080622004","https://openalex.org/W2082472210","https://openalex.org/W2089022621","https://openalex.org/W2089760518","https://openalex.org/W2093017178","https://openalex.org/W2094008654","https://openalex.org/W2095909472","https://openalex.org/W2103919430","https://openalex.org/W2122303223","https://openalex.org/W2140188190","https://openalex.org/W2142635246","https://openalex.org/W2235769802","https://openalex.org/W2741450539","https://openalex.org/W2779408229","https://openalex.org/W2907162900","https://openalex.org/W2974832207","https://openalex.org/W2990278625","https://openalex.org/W2991634148","https://openalex.org/W3108547583","https://openalex.org/W3111163315","https://openalex.org/W3154165903","https://openalex.org/W3171824216","https://openalex.org/W3192538883","https://openalex.org/W3195494389","https://openalex.org/W4213178566","https://openalex.org/W4283463084","https://openalex.org/W4291949777","https://openalex.org/W4310742622","https://openalex.org/W4400165301","https://openalex.org/W4405397248"],"related_works":[],"abstract_inverted_index":{"\u2022":[0,11,23,32,43],"GAMs":[1],"reveal":[2],"new":[3,214],"insights":[4],"into":[5,94],"tonal":[6,14,121,140],"realization":[7,15],"in":[8,39,70],"conversational":[9,41,72],"Mandarin.":[10],"The":[12,175],"detailed":[13],"of":[16,60,65,78,97,133,139,148,181,188,225,235],"monosyllabic":[17,66],"words":[18,67],"is":[19,46,150,156,183,212],"co-determined":[20],"by":[21],"semantics.":[22],"Several":[24],"heterographic":[25,166],"homophones":[26,167],"have":[27,171],"systematically":[28],"distinct":[29],"F0":[30],"contours.":[31,174],"Phonological":[33],"tones":[34],"play":[35],"a":[36,57,89,95,136,151,160,205,213],"minor":[37],"role":[38],"spontaneous":[40,71],"speech.":[42],"Their":[44],"effect":[45,132,147],"mostly":[47],"constrained":[48],"to":[49,87,104,158,170],"pitch":[50,63,92,99,173,186],"height":[51],"except":[52],"for":[53,178],"T4.":[54],"We":[55,81,142],"present":[56,143],"corpus-based":[58],"investigation":[59],"how":[61],"the":[62,76,83,131,179,185,217,232,236],"contours":[64,100,187],"are":[68,102,128,168],"realized":[69],"Mandarin,":[73],"focusing":[74],"on":[75,216],"effects":[77],"words\u2019":[79],"meanings.":[80],"used":[82],"generalized":[84],"additive":[85],"model":[86],"decompose":[88],"given":[90],"observed":[91],"contour":[93],"set":[96],"component":[98],"that":[101,145,184,202],"tied":[103],"different":[105,172],"control":[106],"variables":[107,113],"and":[108,125,165],"semantic":[109,152],"predictors.":[110],"Even":[111],"when":[112],"such":[114],"as":[115],"word":[116,134,149,154,190],"duration,":[117],"gender,":[118],"speaker":[119],"identity,":[120],"context,":[122],"vowel":[123],"height,":[124],"utterance":[126],"position":[127],"controlled":[129],"for,":[130],"remains":[135],"strong":[137],"predictor":[138,162],"realization.":[141],"evidence":[144,177],"this":[146],"effect:":[153],"sense":[155],"shown":[157,169],"be":[159,193],"better":[161],"than":[163],"word,":[164],"strongest":[176],"importance":[180],"semantics":[182,211],"individual":[189],"tokens":[191],"can":[192],"predicted":[194],"from":[195],"their":[196],"contextualized":[197],"embeddings":[198],"with":[199],"an":[200],"accuracy":[201],"substantially":[203],"exceeds":[204],"permutation":[206],"baseline.":[207],"For":[208],"phonetics,":[209],"distributional":[210],"kid":[215],"block.":[218],"Although":[219],"our":[220],"findings":[221],"challenge":[222],"standard":[223],"theories":[224],"Mandarin":[226],"tone,":[227],"they":[228],"fit":[229],"well":[230],"within":[231],"theoretical":[233],"framework":[234],"Discriminative":[237],"Lexicon":[238],"Model.":[239]},"counts_by_year":[],"updated_date":"2026-05-05T08:41:31.759640","created_date":"2026-04-01T00:00:00"}
