{"id":"https://openalex.org/W4822889","doi":"https://doi.org/10.21437/interspeech.2010-616","title":"Automatic discriminative measurement of voice onset time","display_name":"Automatic discriminative measurement of voice onset time","publication_year":2010,"publication_date":"2010-09-26","ids":{"openalex":"https://openalex.org/W4822889","doi":"https://doi.org/10.21437/interspeech.2010-616","mag":"4822889"},"language":"en","primary_location":{"id":"doi:10.21437/interspeech.2010-616","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2010-616","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2010","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5050873228","display_name":"Morgan Sonderegger","orcid":"https://orcid.org/0000-0001-7675-2370"},"institutions":[{"id":"https://openalex.org/I40347166","display_name":"University of Chicago","ror":"https://ror.org/024mw5h28","country_code":"US","type":"education","lineage":["https://openalex.org/I40347166"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Morgan Sonderegger","raw_affiliation_strings":["University-of Chicago"],"affiliations":[{"raw_affiliation_string":"University-of Chicago","institution_ids":["https://openalex.org/I40347166"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5008847407","display_name":"Joseph Keshet","orcid":"https://orcid.org/0000-0003-2332-5783"},"institutions":[{"id":"https://openalex.org/I160992636","display_name":"Toyota Technological Institute at Chicago","ror":"https://ror.org/02sn5gb64","country_code":"US","type":"education","lineage":["https://openalex.org/I160992636"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Joseph Keshet","raw_affiliation_strings":["TOYOTA TECHNOLOGICAL INSTITUTE AT CHICAGO"],"affiliations":[{"raw_affiliation_string":"TOYOTA TECHNOLOGICAL INSTITUTE AT CHICAGO","institution_ids":["https://openalex.org/I160992636"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5050873228"],"corresponding_institution_ids":["https://openalex.org/I40347166"],"apc_list":null,"apc_paid":null,"fwci":2.2552,"has_fulltext":false,"cited_by_count":13,"citation_normalized_percentile":{"value":0.8841057,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"2242","last_page":"2245"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10403","display_name":"Phonetics and Phonology Research","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/voice-onset-time","display_name":"Voice-onset time","score":0.7981116771697998},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6033477187156677},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5924432277679443},{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.5593119263648987},{"id":"https://openalex.org/keywords/pronunciation","display_name":"Pronunciation","score":0.4571610987186432},{"id":"https://openalex.org/keywords/audiology","display_name":"Audiology","score":0.4203932285308838},{"id":"https://openalex.org/keywords/formant","display_name":"Formant","score":0.4175293743610382},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3649035692214966},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.32406532764434814},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.27237388491630554},{"id":"https://openalex.org/keywords/voice","display_name":"Voice","score":0.1889793872833252},{"id":"https://openalex.org/keywords/vowel","display_name":"Vowel","score":0.1761670708656311},{"id":"https://openalex.org/keywords/philosophy","display_name":"Philosophy","score":0.13134422898292542},{"id":"https://openalex.org/keywords/medicine","display_name":"Medicine","score":0.1269889771938324}],"concepts":[{"id":"https://openalex.org/C89051679","wikidata":"https://www.wikidata.org/wiki/Q627770","display_name":"Voice-onset time","level":3,"score":0.7981116771697998},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6033477187156677},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5924432277679443},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.5593119263648987},{"id":"https://openalex.org/C2780844864","wikidata":"https://www.wikidata.org/wiki/Q184377","display_name":"Pronunciation","level":2,"score":0.4571610987186432},{"id":"https://openalex.org/C548259974","wikidata":"https://www.wikidata.org/wiki/Q569965","display_name":"Audiology","level":1,"score":0.4203932285308838},{"id":"https://openalex.org/C158215666","wikidata":"https://www.wikidata.org/wiki/Q1414685","display_name":"Formant","level":3,"score":0.4175293743610382},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3649035692214966},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.32406532764434814},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.27237388491630554},{"id":"https://openalex.org/C552089266","wikidata":"https://www.wikidata.org/wiki/Q494510","display_name":"Voice","level":2,"score":0.1889793872833252},{"id":"https://openalex.org/C2779581591","wikidata":"https://www.wikidata.org/wiki/Q36244","display_name":"Vowel","level":2,"score":0.1761670708656311},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.13134422898292542},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.1269889771938324}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.21437/interspeech.2010-616","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2010-616","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2010","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.5699999928474426,"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":21,"referenced_works":["https://openalex.org/W91681889","https://openalex.org/W93767964","https://openalex.org/W913849490","https://openalex.org/W1581809089","https://openalex.org/W1594989485","https://openalex.org/W1761091820","https://openalex.org/W1965672907","https://openalex.org/W1968440087","https://openalex.org/W2026219038","https://openalex.org/W2042165210","https://openalex.org/W2082302649","https://openalex.org/W2099269884","https://openalex.org/W2105644991","https://openalex.org/W2109339818","https://openalex.org/W2111477235","https://openalex.org/W2111478553","https://openalex.org/W2122106934","https://openalex.org/W2145678789","https://openalex.org/W2160218441","https://openalex.org/W2169188738","https://openalex.org/W2429914308"],"related_works":["https://openalex.org/W2046217390","https://openalex.org/W4365503437","https://openalex.org/W2362995206","https://openalex.org/W2004825552","https://openalex.org/W1986672430","https://openalex.org/W1990629684","https://openalex.org/W1971436356","https://openalex.org/W1975851543","https://openalex.org/W1970534163","https://openalex.org/W2006140286"],"abstract_inverted_index":{"Crammer,":[0],"K.,":[1],"Dekel,":[2],"O.,":[3],"Keshet,":[4],"J.,":[5,70,72,98,117,215],"Shalev-Shwartz,":[6,99,118],"S.,":[7,76,100,119],"and":[8,22,54,79,103,122,142,164,175,182,200,216,236,245,257],"Singer,":[9,101,120],"Y.":[10,238,253],"(2006).":[11,82],"Online":[12],"passive-aggressivealgorithms.":[13],"The":[14],"Journal":[15],"of":[16,27,44,84,259],"Machine":[17],"Learning":[18],"Research,":[19],"7:551\u2013585.Das,":[20],"S.":[21,81],"Hansen,":[23],"J.":[24,64,144,178,226],"(2004).":[25,203,239],"Detection":[26],"Voice":[28,58,168],"Onset":[29],"Time":[30],"(VOT)":[31],"for":[32,41,89,130,153],"unvoiced":[33],"stops":[34],"(/p/,/t/,/k/)":[35],"using":[36],"the":[37,149],"TeagerEnergy":[38],"Operator":[39],"(TEO)":[40],"automatic":[42],"detection":[43],"accented":[45],"English.":[46],"In":[47,94,112,249],"Proc.":[48,95,113,250],"6th":[49],"NORSIG,":[50],"pp.":[51,115,274],"344\u2013347.Fischer,":[52],"E.":[53],"Goberman,":[55],"A.":[56],"(2010).":[57],"onset":[59,86,169,189],"time":[60,87,170,190],"in":[61,91,208,223,263,265],"Parkinson":[62],"disease.":[63],"Comm.":[65],"Disorders,":[66],"43:21\u201334.Kazemzadeh,":[67],"A.,":[68,78],"Tepperman,":[69],"Silva,":[71],"You,":[73],"H.,":[74],"Lee,":[75],"Alwan,":[77],"Narayanan,":[80],"Automaticdetection":[83],"voice":[85,188],"contrasts":[88],"use":[90],"pronunciation":[92],"assessment.":[93],"INTERSPEECH,pp.":[96],"721\u2013724.Keshet,":[97],"Y.,":[102,121],"Chazan,":[104,123],"D.":[105,124,202,218],"(2005).":[106],"Phoneme":[107],"alignment":[108],"based":[109],"on":[110],"discriminativelearning.":[111],"INTERSPEECH,":[114],"2961\u20132964.Keshet,":[116],"(2007).":[125,254],"A":[126],"large":[127],"margin":[128],"algorithm":[129],"speech-to-phonemeand":[131],"music-to-score":[132],"alignment.":[133],"IEEE":[134],"Trans.":[135],"Audio,":[136],"Speech,":[137],"Language":[138],"Process.,":[139],"15(8):2373\u20132382.Kuhl,":[140],"P.":[141],"Miller,":[143,214],"(1978).":[145],"Speech":[146],"perception":[147],"by":[148],"chinchilla:":[150],"Identi\ufb01cation":[151],"functions":[152],"synthetic":[154],"VOT":[155,258],"stimuli.J.":[156],"Acoust.":[157,227],"Soc.":[158,228],"America,":[159,229],"63(3):905\u2013917.Morris,":[160],"R.,":[161,213],"McCrea,":[162],"C.,":[163,199],"Herring,":[165],"K.":[166],"(2008b).":[167],"differences":[171,222],"between":[172],"adult":[173],"males":[174],"females:Isolated":[176],"syllables.":[177],"Phonetics,":[179],"36(2):308\u2013317.Stouten,":[180],"V.":[181],"van":[183],"Hamme,":[184],"H.":[185],"(2009).":[186],"Automatic":[187],"estimation":[191],"from":[192],"reassignment":[193],"spectra.":[194],"SpeechCommunication,":[195],"51(12):1194\u20131205.Taskar,":[196],"B.,":[197],"Guestrin,":[198],"Koller,":[201],"Max-margin":[204],"Markov":[205],"networks.":[206],"Advances":[207],"Neural":[209],"InformationProcessing":[210],"Systems,":[211],"16.Theodore,":[212],"DeSteno,":[217],"(2009b).":[219],"Individual":[220],"talker":[221],"voice-onset-time:":[224],"Contextualin\ufb02uences.":[225],"125:3974\u20133982.Tsochantaridis,":[230],"I.,":[231],"Hofmann,":[232],"T.,":[233,235],"Joachims,":[234],"Altun,":[237],"Support":[240],"vector":[241],"machine":[242],"learning":[243],"forinterdependent":[244],"structured":[246],"output":[247],"spaces.":[248],"21st":[251],"ICML.Yao,":[252],"Closure":[255],"duration":[256],"word-initial":[260],"voiceless":[261],"plosives":[262],"English":[264],"spontaneous":[266],"connectedspeech.":[267],"UC":[268],"Berkeley":[269],"Phonology":[270],"Lab":[271],"Annual":[272],"Report,":[273],"183\u2013225.":[275]},"counts_by_year":[{"year":2020,"cited_by_count":1},{"year":2017,"cited_by_count":2},{"year":2016,"cited_by_count":5},{"year":2013,"cited_by_count":2},{"year":2012,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
