{"id":"https://openalex.org/W2149244738","doi":"https://doi.org/10.1109/iscslp.2010.5684865","title":"Hierarchical pitch target model for Mandarin speech","display_name":"Hierarchical pitch target model for Mandarin speech","publication_year":2010,"publication_date":"2010-11-01","ids":{"openalex":"https://openalex.org/W2149244738","doi":"https://doi.org/10.1109/iscslp.2010.5684865","mag":"2149244738"},"language":"en","primary_location":{"id":"doi:10.1109/iscslp.2010.5684865","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iscslp.2010.5684865","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2010 7th International Symposium on Chinese Spoken Language Processing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100389496","display_name":"Zhiping Zhang","orcid":"https://orcid.org/0009-0008-0452-3147"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhiping Zhang","raw_affiliation_strings":["Speech and Hearing Research Center, Key Laboratory of Machine Perception (Ministry of Education), Peking University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Speech and Hearing Research Center, Key Laboratory of Machine Perception (Ministry of Education), Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100772594","display_name":"Xinhao Wang","orcid":"https://orcid.org/0000-0002-0366-7543"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xinhao Wang","raw_affiliation_strings":["Speech and Hearing Research Center, Key Laboratory of Machine Perception (Ministry of Education), Peking University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Speech and Hearing Research Center, Key Laboratory of Machine Perception (Ministry of Education), Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020291213","display_name":"Yansuo Yu","orcid":"https://orcid.org/0000-0002-2603-7755"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yansuo Yu","raw_affiliation_strings":["Speech and Hearing Research Center, Key Laboratory of Machine Perception (Ministry of Education), Peking University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Speech and Hearing Research Center, Key Laboratory of Machine Perception (Ministry of Education), Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5084685506","display_name":"Xihong Wu","orcid":"https://orcid.org/0009-0004-5236-7469"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xihong Wu","raw_affiliation_strings":["Speech and Hearing Research Center, Key Laboratory of Machine Perception (Ministry of Education), Peking University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Speech and Hearing Research Center, Key Laboratory of Machine Perception (Ministry of Education), Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5100389496"],"corresponding_institution_ids":["https://openalex.org/I20231570"],"apc_list":null,"apc_paid":null,"fwci":0.451,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.74562225,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"378","last_page":"382"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10403","display_name":"Phonetics and Phonology Research","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/intonation","display_name":"Intonation (linguistics)","score":0.8360917568206787},{"id":"https://openalex.org/keywords/mandarin-chinese","display_name":"Mandarin Chinese","score":0.7798082828521729},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.7216956615447998},{"id":"https://openalex.org/keywords/pitch-contour","display_name":"Pitch contour","score":0.7148481607437134},{"id":"https://openalex.org/keywords/syllable","display_name":"Syllable","score":0.6918463706970215},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6873382329940796},{"id":"https://openalex.org/keywords/utterance","display_name":"Utterance","score":0.5893568396568298},{"id":"https://openalex.org/keywords/speech-synthesis","display_name":"Speech synthesis","score":0.5028652548789978},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.39107954502105713},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.32448703050613403},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.1624048352241516}],"concepts":[{"id":"https://openalex.org/C2781045179","wikidata":"https://www.wikidata.org/wiki/Q5576720","display_name":"Intonation (linguistics)","level":2,"score":0.8360917568206787},{"id":"https://openalex.org/C138954614","wikidata":"https://www.wikidata.org/wiki/Q9192","display_name":"Mandarin Chinese","level":2,"score":0.7798082828521729},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.7216956615447998},{"id":"https://openalex.org/C2777895490","wikidata":"https://www.wikidata.org/wiki/Q7198848","display_name":"Pitch contour","level":2,"score":0.7148481607437134},{"id":"https://openalex.org/C109089402","wikidata":"https://www.wikidata.org/wiki/Q8188","display_name":"Syllable","level":2,"score":0.6918463706970215},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6873382329940796},{"id":"https://openalex.org/C2775852435","wikidata":"https://www.wikidata.org/wiki/Q258403","display_name":"Utterance","level":2,"score":0.5893568396568298},{"id":"https://openalex.org/C14999030","wikidata":"https://www.wikidata.org/wiki/Q16346","display_name":"Speech synthesis","level":2,"score":0.5028652548789978},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.39107954502105713},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.32448703050613403},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.1624048352241516},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iscslp.2010.5684865","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iscslp.2010.5684865","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2010 7th International Symposium on Chinese Spoken Language Processing","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.47999998927116394,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":14,"referenced_works":["https://openalex.org/W137920126","https://openalex.org/W1519124935","https://openalex.org/W1600722501","https://openalex.org/W1995118599","https://openalex.org/W1998981462","https://openalex.org/W2038276123","https://openalex.org/W2049686551","https://openalex.org/W2057007972","https://openalex.org/W2110332474","https://openalex.org/W2121399170","https://openalex.org/W2126289105","https://openalex.org/W3200634688","https://openalex.org/W4301420498","https://openalex.org/W6982117988"],"related_works":["https://openalex.org/W2222951281","https://openalex.org/W2272290179","https://openalex.org/W2068412075","https://openalex.org/W156219719","https://openalex.org/W27484908","https://openalex.org/W1966171935","https://openalex.org/W1607387412","https://openalex.org/W2005059380","https://openalex.org/W2150511655","https://openalex.org/W2142042197"],"abstract_inverted_index":{"In":[0],"this":[1],"study,":[2],"a":[3,58,110,114],"hierarchical":[4,59],"pitch":[5,36,44,55,63],"target":[6,56,64],"model":[7,31],"is":[8,38],"proposed":[9],"to":[10,47],"analyze":[11],"the":[12,34,42,48,62,75,79,82,118,125,135,139,142],"underlying":[13],"factors":[14,105],"of":[15,78,103,122,141],"tones":[16],"and":[17,53,81,99,124,134],"intonation":[18,84,97,126],"in":[19,26,50],"Mandarin":[20],"pitch,":[21],"which":[22],"can":[23,69,106],"be":[24,70,107],"applied":[25],"speech":[27,111],"synthesis":[28,136],"systems.":[29],"This":[30],"assumes":[32],"that":[33],"surface":[35],"contour":[37],"produced":[39],"by":[40,72,87,113],"approximating":[41],"sequential":[43],"targets":[45],"assigned":[46],"syllables":[49,123],"an":[51],"utterance,":[52],"each":[54,67],"possesses":[57],"structure.":[60],"Moreover,":[61],"associated":[65],"with":[66],"syllable":[68,80],"generated":[71],"adding":[73],"up":[74],"tonal":[76,120],"pattern":[77],"stepped":[83],"biases":[85],"contributed":[86],"higher":[88],"level":[89],"prosodic":[90,93,95,130],"units,":[91],"including":[92],"words,":[94],"phrases,":[96],"phrases":[98],"utterances.":[100],"The":[101],"parameters":[102],"these":[104],"learned":[108,119],"from":[109,128],"corpus":[112],"gradient":[115],"method.":[116],"Finally,":[117],"patterns":[121,127],"different":[129],"layers":[131],"are":[132],"illustrated,":[133],"experiments":[137],"show":[138],"effectiveness":[140],"presented":[143],"model.":[144]},"counts_by_year":[{"year":2022,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":1},{"year":2013,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
