{"id":"https://openalex.org/W2396592486","doi":"https://doi.org/10.21437/interspeech.2012-589","title":"Predicting character-appropriate voices for a TTS-based storyteller system","display_name":"Predicting character-appropriate voices for a TTS-based storyteller system","publication_year":2012,"publication_date":"2012-09-09","ids":{"openalex":"https://openalex.org/W2396592486","doi":"https://doi.org/10.21437/interspeech.2012-589","mag":"2396592486"},"language":"en","primary_location":{"id":"doi:10.21437/interspeech.2012-589","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2012-589","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2012","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5012449048","display_name":"Erica Greene","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Erica Greene","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108191538","display_name":"Taniya Mishra","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Taniya Mishra","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026605560","display_name":"Patrick Haffner","orcid":"https://orcid.org/0000-0002-2319-5109"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Patrick Haffner","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5028548414","display_name":"Alistair Conkie","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Alistair Conkie","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5012449048"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.1598,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.82628529,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"2210","last_page":"2213"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11148","display_name":"Language, Metaphor, and Cognition","score":0.9918000102043152,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11148","display_name":"Language, Metaphor, and Cognition","score":0.9918000102043152,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9900000095367432,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9886999726295471,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/character","display_name":"Character (mathematics)","score":0.7566267251968384},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.592219889163971},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4465324282646179},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4014263153076172},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.33186787366867065},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.10149228572845459}],"concepts":[{"id":"https://openalex.org/C2780861071","wikidata":"https://www.wikidata.org/wiki/Q1062934","display_name":"Character (mathematics)","level":2,"score":0.7566267251968384},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.592219889163971},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4465324282646179},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4014263153076172},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.33186787366867065},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.10149228572845459},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.21437/interspeech.2012-589","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2012-589","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2012","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.306.9296","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.306.9296","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www2.research.att.com/~ttsweb/tts/papers/2012/mishra_greene_v4.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":7,"referenced_works":["https://openalex.org/W199841855","https://openalex.org/W1505422262","https://openalex.org/W1519756925","https://openalex.org/W2116705992","https://openalex.org/W2168493061","https://openalex.org/W2171121512","https://openalex.org/W2334456382"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W4251972423","https://openalex.org/W1503216044","https://openalex.org/W2393609567","https://openalex.org/W2369369044","https://openalex.org/W2354143083","https://openalex.org/W2372906645","https://openalex.org/W4319998713","https://openalex.org/W2366269494"],"abstract_inverted_index":{"Using":[0],"distinct":[1],"and":[2,23,45,101],"appropriate":[3,36,61],"synthetic":[4],"voices":[5,37,62,105],"to":[6,77,102],"voice":[7],"the":[8,31,59,79,88,104,114,132],"characters":[9,40,64],"in":[10,65,86,106,127],"a":[11,16,43,54,93,98],"children\u2019s":[12,66],"story":[13],"would":[14],"make":[15],"TTS-based":[17],"digital":[18],"storyteller":[19],"system":[20,122],"more":[21],"engaging":[22],"entertaining,":[24],"as":[25],"well":[26],"increase":[27],"listener\u2019s":[28],"comprehension":[29],"of":[30,134],"story.":[32],"However,":[33],"automatically":[34],"predicting":[35,58],"for":[38,57,63],"storybook":[39],"is":[41],"both":[42],"non-trivial":[44],"largely":[46],"unexplored":[47],"problem.":[48],"In":[49],"this":[50],"paper,":[51],"we":[52],"present":[53],"data-driven":[55],"approach":[56],"most":[60,84],"stories":[67],"based":[68],"on":[69],"salient":[70,85],"character":[71,80,95],"attributes.":[72],"We":[73,112],"use":[74],"Mechanical":[75],"Turk":[76],"identify":[78],"attributes":[81],"that":[82,92],"are":[83],"evoking":[87],"listeners":[89],"\u2019":[90],"perception":[91],"specific":[94],"should":[96],"have":[97],"particular":[99],"voice,":[100],"label":[103],"our":[107,135],"collection":[108],"with":[109,117],"attribute":[110],"tags.":[111],"model":[113],"attribute-to-voice":[115],"relationship":[116],"Naive":[118],"Bayes.":[119],"The":[120],"resulting":[121],"performs":[123],"significantly":[124],"above":[125],"chance":[126],"an":[128],"objective":[129],"evaluation,":[130],"demonstrating":[131],"viability":[133],"approach.":[136]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2016,"cited_by_count":1},{"year":2014,"cited_by_count":3},{"year":2013,"cited_by_count":1}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
