{"id":"https://openalex.org/W91116557","doi":"https://doi.org/10.21437/interspeech.2006-53","title":"The vocal joystick data collection effort and vowel corpus","display_name":"The vocal joystick data collection effort and vowel corpus","publication_year":2006,"publication_date":"2006-09-17","ids":{"openalex":"https://openalex.org/W91116557","doi":"https://doi.org/10.21437/interspeech.2006-53","mag":"91116557"},"language":"en","primary_location":{"id":"doi:10.21437/interspeech.2006-53","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2006-53","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2006","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5009351378","display_name":"Kelley Kilanski","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Kelley Kilanski","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111946966","display_name":"Jonathan Malkin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jonathan Malkin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100375302","display_name":"Xiao Li","orcid":"https://orcid.org/0000-0002-7318-7879"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiao Li","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006429520","display_name":"Richard Wright","orcid":"https://orcid.org/0000-0003-1545-3689"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Richard Wright","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5113478221","display_name":"Jeff Bilmes","orcid":null},"institutions":[{"id":"https://openalex.org/I201448701","display_name":"University of Washington","ror":"https://ror.org/00cvxb145","country_code":"US","type":"education","lineage":["https://openalex.org/I201448701"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jeff A. Bilmes","raw_affiliation_strings":["University of Washington"],"affiliations":[{"raw_affiliation_string":"University of Washington","institution_ids":["https://openalex.org/I201448701"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5009351378"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":4.6521,"has_fulltext":false,"cited_by_count":14,"citation_normalized_percentile":{"value":0.94208307,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"paper 1885","last_page":"Tue2WeO.2"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9958000183105469,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9908000230789185,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/joystick","display_name":"Joystick","score":0.8143942356109619},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7567939758300781},{"id":"https://openalex.org/keywords/vowel","display_name":"Vowel","score":0.7008358240127563},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6233007311820984},{"id":"https://openalex.org/keywords/data-collection","display_name":"Data collection","score":0.585166871547699},{"id":"https://openalex.org/keywords/diphthong","display_name":"Diphthong","score":0.5550904273986816},{"id":"https://openalex.org/keywords/timit","display_name":"TIMIT","score":0.4483569264411926},{"id":"https://openalex.org/keywords/simulation","display_name":"Simulation","score":0.17851480841636658},{"id":"https://openalex.org/keywords/hidden-markov-model","display_name":"Hidden Markov model","score":0.17667967081069946}],"concepts":[{"id":"https://openalex.org/C96439379","wikidata":"https://www.wikidata.org/wiki/Q178805","display_name":"Joystick","level":2,"score":0.8143942356109619},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7567939758300781},{"id":"https://openalex.org/C2779581591","wikidata":"https://www.wikidata.org/wiki/Q36244","display_name":"Vowel","level":2,"score":0.7008358240127563},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6233007311820984},{"id":"https://openalex.org/C133462117","wikidata":"https://www.wikidata.org/wiki/Q4929239","display_name":"Data collection","level":2,"score":0.585166871547699},{"id":"https://openalex.org/C76978605","wikidata":"https://www.wikidata.org/wiki/Q102532","display_name":"Diphthong","level":3,"score":0.5550904273986816},{"id":"https://openalex.org/C2778724510","wikidata":"https://www.wikidata.org/wiki/Q7670405","display_name":"TIMIT","level":3,"score":0.4483569264411926},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.17851480841636658},{"id":"https://openalex.org/C23224414","wikidata":"https://www.wikidata.org/wiki/Q176769","display_name":"Hidden Markov model","level":2,"score":0.17667967081069946},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.21437/interspeech.2006-53","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2006-53","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2006","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.78.5823","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.78.5823","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://ssli.ee.washington.edu/people/bilmes/mypapers/VJ_ICSLP_2006_v8.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","score":0.5099999904632568,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":6,"referenced_works":["https://openalex.org/W1986597001","https://openalex.org/W2000982178","https://openalex.org/W2011236050","https://openalex.org/W2061415165","https://openalex.org/W2129813427","https://openalex.org/W2155336872"],"related_works":["https://openalex.org/W2184417239","https://openalex.org/W3156562711","https://openalex.org/W332553347","https://openalex.org/W2376341893","https://openalex.org/W2027612706","https://openalex.org/W2964322844","https://openalex.org/W2794262140","https://openalex.org/W1788546957","https://openalex.org/W2141601825","https://openalex.org/W2204818624"],"abstract_inverted_index":{"Vocal":[0,176],"Joystick":[1,177],"is":[2,148],"a":[3,21,69,75,89,99,149,202],"mechanism":[4],"that":[5,78,93],"enables":[6],"individuals":[7,221],"with":[8,65,222],"motor":[9],"impairments":[10],"to":[11,17,32,46,62,126],"make":[12],"use":[13],"of":[14,96,101,114,129,135,143,152,156,160,165,183,205],"vocal":[15],"parameters":[16,119,138,182],"control":[18,33],"objects":[19],"on":[20],"computer":[22],"screen":[23],"(buttons,":[24],"sliders,":[25],"etc.)":[26],"and":[27,122,168,186,200],"ultimately":[28],"will":[29],"be":[30],"used":[31],"electro-mechanical":[34],"instruments":[35],"(e.g.,":[36],"robotic":[37],"arms,":[38],"wireless":[39],"home":[40],"automation":[41],"devices).":[42],"In":[43],"an":[44],"effort":[45,73,116,147],"train":[47],"the":[48,53,83,97,102,112,115,127,130,136,144,166,175,181,192,206],"VJ-system,":[49],"speech":[50,55,216],"data":[51,71,107,132,145,158,193,213],"from":[52],"TIMIT":[54],"corpus":[56,92,151],"was":[57,94],"initially":[58],"used.":[59],"However,":[60],"due":[61],"problematic":[63,84],"issues":[64],"co-articulation,":[66],"we":[67],"began":[68],"large":[70],"collection":[72,108,146,194,214],"in":[74,133],"controlled":[76],"environment":[77],"would":[79,104],"not":[80],"only":[81],"address":[82],"issues,":[85],"but":[86],"also":[87],"yield":[88],"new":[90,118],"vowel":[91,150,169],"representative":[95],"utterances":[98],"user":[100],"VJ-system":[103],"use.":[105],"The":[106,141],"process":[109],"evolved":[110,196],"over":[111],"course":[113],"as":[117,123],"were":[120,139],"added":[121],"factors":[124],"relating":[125],"quality":[128],"collected":[131],"terms":[134],"specified":[137],"considered.":[140],"result":[142],"approximately":[153,161],"11":[154],"hours":[155],"recorded":[157],"comprised":[159],"23500":[162],"sound":[163],"files":[164],"monophthongs":[167],"combinations":[170],"(e.g.":[171],"diphthongs)":[172],"chosen":[173],"for":[174,220],"project":[178],"varying":[179],"along":[180],"duration,":[184],"intensity":[185],"amplitude.":[187],"This":[188],"paper":[189],"discusses":[190],"how":[191],"has":[195],"since":[197],"its":[198],"initiation":[199],"provides":[201],"brief":[203],"summary":[204],"resulting":[207],"corpus.":[208],"Index":[209],"Terms:":[210],"Speech":[211,218],"corpora,":[212],"procedures,":[215],"recognition,":[217],"HCI":[219],"impairments,":[223],"Speech/voice-based":[224],"human-computer":[225],"interfaces":[226],"1.":[227]},"counts_by_year":[{"year":2014,"cited_by_count":1},{"year":2012,"cited_by_count":1}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
