{"id":"https://openalex.org/W272162490","doi":"https://doi.org/10.21437/interspeech.2004-332","title":"Improvement in corpus-based generation of F0 contours using generation process model for emotional speech synthesis","display_name":"Improvement in corpus-based generation of F0 contours using generation process model for emotional speech synthesis","publication_year":2004,"publication_date":"2004-10-04","ids":{"openalex":"https://openalex.org/W272162490","doi":"https://doi.org/10.21437/interspeech.2004-332","mag":"272162490"},"language":"en","primary_location":{"id":"doi:10.21437/interspeech.2004-332","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2004-332","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2004","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5108197272","display_name":"Keikichi Hirose","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Keikichi Hirose","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5108197272"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.6971,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.75095016,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"1349","last_page":"1352"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9556000232696533,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.9498000144958496,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7849529981613159},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.7595273852348328},{"id":"https://openalex.org/keywords/phrase","display_name":"Phrase","score":0.6373178362846375},{"id":"https://openalex.org/keywords/speech-synthesis","display_name":"Speech synthesis","score":0.6372385025024414},{"id":"https://openalex.org/keywords/sadness","display_name":"Sadness","score":0.5665649771690369},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5256083011627197},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5195296406745911},{"id":"https://openalex.org/keywords/constraint","display_name":"Constraint (computer-aided design)","score":0.5028669238090515},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4503999948501587},{"id":"https://openalex.org/keywords/sentence","display_name":"Sentence","score":0.43636754155158997},{"id":"https://openalex.org/keywords/anger","display_name":"Anger","score":0.41859108209609985},{"id":"https://openalex.org/keywords/speech-corpus","display_name":"Speech corpus","score":0.4157668352127075},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.08399614691734314},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.08080807328224182}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7849529981613159},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.7595273852348328},{"id":"https://openalex.org/C2776224158","wikidata":"https://www.wikidata.org/wiki/Q187931","display_name":"Phrase","level":2,"score":0.6373178362846375},{"id":"https://openalex.org/C14999030","wikidata":"https://www.wikidata.org/wiki/Q16346","display_name":"Speech synthesis","level":2,"score":0.6372385025024414},{"id":"https://openalex.org/C2779812673","wikidata":"https://www.wikidata.org/wiki/Q169251","display_name":"Sadness","level":3,"score":0.5665649771690369},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5256083011627197},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5195296406745911},{"id":"https://openalex.org/C2776036281","wikidata":"https://www.wikidata.org/wiki/Q48769818","display_name":"Constraint (computer-aided design)","level":2,"score":0.5028669238090515},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4503999948501587},{"id":"https://openalex.org/C2777530160","wikidata":"https://www.wikidata.org/wiki/Q41796","display_name":"Sentence","level":2,"score":0.43636754155158997},{"id":"https://openalex.org/C2779302386","wikidata":"https://www.wikidata.org/wiki/Q79871","display_name":"Anger","level":2,"score":0.41859108209609985},{"id":"https://openalex.org/C91863865","wikidata":"https://www.wikidata.org/wiki/Q4349497","display_name":"Speech corpus","level":3,"score":0.4157668352127075},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.08399614691734314},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.08080807328224182},{"id":"https://openalex.org/C118552586","wikidata":"https://www.wikidata.org/wiki/Q7867","display_name":"Psychiatry","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.21437/interspeech.2004-332","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2004-332","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2004","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.587.7710","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.587.7710","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.gavo.t.u-tokyo.ac.jp/~mine/paper/PDF/2004/ICSLP_p1349-1352_t2004-10.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/5","score":0.5299999713897705,"display_name":"Gender equality"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":9,"referenced_works":["https://openalex.org/W14719770","https://openalex.org/W39968598","https://openalex.org/W350299107","https://openalex.org/W1978440078","https://openalex.org/W2034277951","https://openalex.org/W2071399124","https://openalex.org/W2149425161","https://openalex.org/W2298932255","https://openalex.org/W2817387358"],"related_works":["https://openalex.org/W4365519294","https://openalex.org/W3031187173","https://openalex.org/W3135436127","https://openalex.org/W2805647211","https://openalex.org/W3179181153","https://openalex.org/W2100930849","https://openalex.org/W2557139663","https://openalex.org/W2073249509","https://openalex.org/W2481378124","https://openalex.org/W1980267738"],"abstract_inverted_index":{"In":[0],"our":[1],"fully":[2],"automatic":[3],"corpus-based":[4,214],"method":[5,28,106,160,204],"of":[6,24,45,48,55,81,104,122,138,147,155,187],"generating":[7],"fundamental":[8],"frequency":[9],"(F0)":[10],"contours":[11,175],"for":[12,99,176,183,243],"emotional":[13,82,188],"speech":[14,67,76,83,89,111,178,189],"synthesis,":[15],"an":[16],"improvement":[17],"was":[18,161,190,218],"realized":[19],"related":[20],"to":[21,51,163,181],"the":[22,30,49,56,70,100,105,117,120,123,127,136,142,152,159,171,201,206,221,225,229,236],"process":[23,32],"corpus":[25,77],"preparation.":[26],"The":[27,75,95,168,195,239],"assumes":[29],"generation":[31],"model":[33,57],"and":[34,87,173,205,224,245],"predicts":[35],"its":[36],"command":[37,96,149],"parameters":[38,97],"using":[39,112,220],"binary":[40],"regression":[41],"trees":[42],"with":[43,192],"inputs":[44],"linguistic":[46],"information":[47],"sentence":[50],"be":[52,232],"synthesized.":[53],"Because":[54],"constraint,":[58],"a":[59,92,113,130,212],"certain":[60],"quality":[61],"is":[62,72,132],"still":[63],"kept":[64],"in":[65,211],"synthesized":[66,222],"even":[68],"if":[69],"prediction":[71,128,150],"done":[73],"incorrectly.":[74],"includes":[78],"three":[79],"types":[80],"(anger,":[84],"joy,":[85],"sadness)":[86],"calm":[88,184],"uttered":[90],"by":[91,116,200,235],"female":[93],"narrator.":[94],"necessary":[98],"training":[101],"(and":[102],"testing)":[103],"were":[107,179,198],"automatically":[108],"extracted":[109],"from":[110],"program":[114],"developed":[115,237],"authors.":[118],"Since":[119],"accuracy":[121,154],"extraction":[124],"largely":[125],"affects":[126],"performance,":[129],"constraint":[131],"newly":[133],"applied":[134],"on":[135],"position":[137],"phrase":[139,148,165],"commands":[140,166],"during":[141],"extraction.":[143],"Also,":[144],"since":[145],"performance":[146],"dominates":[151],"overall":[153],"generated":[156],"F0":[157],"contours,":[158],"modified":[162],"predict":[164],"first.":[167],"mismatches":[169],"between":[170],"predicted":[172,210],"target":[174],"angry":[177],"similar":[180,213],"those":[182],"speech.":[185],"Synthesis":[186],"conducted":[191,219],"text":[193],"inputs.":[194],"segmental":[196],"features":[197],"handled":[199],"HMM":[202],"synthesis":[203],"phoneme":[207],"durations":[208],"are":[209],"method.":[215,238],"Perceptual":[216],"experiment":[217],"speech,":[223],"result":[226,240],"indicated":[227],"that":[228],"anger":[230],"could":[231],"well":[233],"conveyed":[234],"came":[241],"worse":[242],"joy":[244],"sadness.":[246],"1.":[247]},"counts_by_year":[{"year":2021,"cited_by_count":1},{"year":2019,"cited_by_count":1}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
