{"id":"https://openalex.org/W2095563672","doi":"https://doi.org/10.1109/tasl.2008.2011538","title":"Realistic Visual Speech Synthesis Based on Hybrid Concatenation Method","display_name":"Realistic Visual Speech Synthesis Based on Hybrid Concatenation Method","publication_year":2009,"publication_date":"2009-02-13","ids":{"openalex":"https://openalex.org/W2095563672","doi":"https://doi.org/10.1109/tasl.2008.2011538","mag":"2095563672"},"language":"en","primary_location":{"id":"doi:10.1109/tasl.2008.2011538","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tasl.2008.2011538","pdf_url":null,"source":{"id":"https://openalex.org/S199497470","display_name":"IEEE Transactions on Audio Speech and Language Processing","issn_l":"1558-7916","issn":["1558-7916","1558-7924"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5112613657","display_name":"Jianhua Tao","orcid":"https://orcid.org/0000-0002-9344-6428"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jianhua Tao","raw_affiliation_strings":["Chinese Academy of Sciences, Institute of Automation, Beijing, China","Nat. Lab. of Pattern Recognition, Chinese Acad. of Sci., Beijing#TAB#"],"affiliations":[{"raw_affiliation_string":"Chinese Academy of Sciences, Institute of Automation, Beijing, China","institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I19820366"]},{"raw_affiliation_string":"Nat. Lab. of Pattern Recognition, Chinese Acad. of Sci., Beijing#TAB#","institution_ids":["https://openalex.org/I4210112150"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070110825","display_name":"Le Xin","orcid":null},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Le Xin","raw_affiliation_strings":["Chinese Academy of Sciences, Institute of Automation, Beijing, China","Nat. Lab. of Pattern Recognition, Chinese Acad. of Sci., Beijing#TAB#"],"affiliations":[{"raw_affiliation_string":"Chinese Academy of Sciences, Institute of Automation, Beijing, China","institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I19820366"]},{"raw_affiliation_string":"Nat. Lab. of Pattern Recognition, Chinese Acad. of Sci., Beijing#TAB#","institution_ids":["https://openalex.org/I4210112150"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5084271282","display_name":"Panrong Yin","orcid":null},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Panrong Yin","raw_affiliation_strings":["Chinese Academy of Sciences, Institute of Automation, Beijing, China","Nat. Lab. of Pattern Recognition, Chinese Acad. of Sci., Beijing#TAB#"],"affiliations":[{"raw_affiliation_string":"Chinese Academy of Sciences, Institute of Automation, Beijing, China","institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I19820366"]},{"raw_affiliation_string":"Nat. Lab. of Pattern Recognition, Chinese Acad. of Sci., Beijing#TAB#","institution_ids":["https://openalex.org/I4210112150"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5112613657"],"corresponding_institution_ids":["https://openalex.org/I19820366","https://openalex.org/I4210112150"],"apc_list":null,"apc_paid":null,"fwci":5.6394,"has_fulltext":false,"cited_by_count":19,"citation_normalized_percentile":{"value":0.96286024,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":"17","issue":"3","first_page":"469","last_page":"477"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9704999923706055,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/concatenation","display_name":"Concatenation (mathematics)","score":0.8783016204833984},{"id":"https://openalex.org/keywords/hidden-markov-model","display_name":"Hidden Markov model","score":0.8441319465637207},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8333125710487366},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5894982814788818},{"id":"https://openalex.org/keywords/viterbi-algorithm","display_name":"Viterbi algorithm","score":0.5404366850852966},{"id":"https://openalex.org/keywords/mixture-model","display_name":"Mixture model","score":0.5363990068435669},{"id":"https://openalex.org/keywords/speech-synthesis","display_name":"Speech synthesis","score":0.5175082683563232},{"id":"https://openalex.org/keywords/frame","display_name":"Frame (networking)","score":0.4906965494155884},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.48820358514785767},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.44279342889785767},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.0861501693725586}],"concepts":[{"id":"https://openalex.org/C87619178","wikidata":"https://www.wikidata.org/wiki/Q126002","display_name":"Concatenation (mathematics)","level":2,"score":0.8783016204833984},{"id":"https://openalex.org/C23224414","wikidata":"https://www.wikidata.org/wiki/Q176769","display_name":"Hidden Markov model","level":2,"score":0.8441319465637207},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8333125710487366},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5894982814788818},{"id":"https://openalex.org/C60582962","wikidata":"https://www.wikidata.org/wiki/Q83886","display_name":"Viterbi algorithm","level":3,"score":0.5404366850852966},{"id":"https://openalex.org/C61224824","wikidata":"https://www.wikidata.org/wiki/Q2260434","display_name":"Mixture model","level":2,"score":0.5363990068435669},{"id":"https://openalex.org/C14999030","wikidata":"https://www.wikidata.org/wiki/Q16346","display_name":"Speech synthesis","level":2,"score":0.5175082683563232},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.4906965494155884},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.48820358514785767},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.44279342889785767},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0861501693725586},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tasl.2008.2011538","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tasl.2008.2011538","pdf_url":null,"source":{"id":"https://openalex.org/S199497470","display_name":"IEEE Transactions on Audio Speech and Language Processing","issn_l":"1558-7916","issn":["1558-7916","1558-7924"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320326873","display_name":"National Laboratory of Pattern Recognition","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":47,"referenced_works":["https://openalex.org/W21323494","https://openalex.org/W33533989","https://openalex.org/W99444952","https://openalex.org/W116902681","https://openalex.org/W1547376871","https://openalex.org/W1589445648","https://openalex.org/W1826846938","https://openalex.org/W1972421820","https://openalex.org/W1980570665","https://openalex.org/W1986394836","https://openalex.org/W1988874269","https://openalex.org/W2019083158","https://openalex.org/W2047618352","https://openalex.org/W2047908040","https://openalex.org/W2070726616","https://openalex.org/W2103743127","https://openalex.org/W2105020570","https://openalex.org/W2105537028","https://openalex.org/W2108033344","https://openalex.org/W2110501904","https://openalex.org/W2111105420","https://openalex.org/W2117853077","https://openalex.org/W2133826808","https://openalex.org/W2137489111","https://openalex.org/W2142975523","https://openalex.org/W2143132120","https://openalex.org/W2147885303","https://openalex.org/W2152239535","https://openalex.org/W2153520663","https://openalex.org/W2157986450","https://openalex.org/W2160980460","https://openalex.org/W2161736993","https://openalex.org/W2170429722","https://openalex.org/W2295661697","https://openalex.org/W2765809530","https://openalex.org/W3151822565","https://openalex.org/W4240628542","https://openalex.org/W4244298416","https://openalex.org/W6600857284","https://openalex.org/W6604061577","https://openalex.org/W6604828220","https://openalex.org/W6632696956","https://openalex.org/W6675911463","https://openalex.org/W6676803799","https://openalex.org/W6681253763","https://openalex.org/W6682724930","https://openalex.org/W6745490303"],"related_works":["https://openalex.org/W1893636011","https://openalex.org/W2388979876","https://openalex.org/W2100982643","https://openalex.org/W24638226","https://openalex.org/W2615042318","https://openalex.org/W2008161911","https://openalex.org/W1479948762","https://openalex.org/W2107801270","https://openalex.org/W2744799066","https://openalex.org/W2095563672"],"abstract_inverted_index":{"This":[0],"paper":[1,122,164],"presents":[2],"a":[3,34,42,77,118,125,167],"realistic":[4],"visual":[5],"speech":[6],"synthesis":[7],"based":[8,17,179],"on":[9,18,117,180],"the":[10,29,65,93,98,103,110,114,133,140,147,153,163,189],"hybrid":[11,30],"concatenation":[12,31],"method.":[13],"Unlike":[14],"previous":[15],"methods":[16],"phoneme":[19],"level":[20,100],"unit":[21,37,94,115],"selection":[22,38,95,116],"or":[23],"hidden":[24],"Markov":[25],"model":[26,64],"(HMM),":[27],"etc.,":[28],"method":[32,39,96,129,169,190,207],"uses":[33],"frame":[35,99],"level-based":[36],"combined":[40],"with":[41,72,197,201,211],"fused":[43,57,84,104],"HMM,":[44],"and":[45,52,216],"is":[46,86,90],"able":[47],"to":[48,62,170,213],"generate":[49,171],"more":[50],"expressive":[51],"stable":[53],"facial":[54,88,173,177,195],"animations.":[55],"The":[56],"HMM":[58,79,85,105],"can":[59,192],"be":[60],"used":[61],"explicitly":[63],"loose":[66],"synchronization":[67],"of":[68,113],"tightly":[69],"coupled":[70],"streams,":[71],"much":[73],"better":[74,209],"results":[75],"than":[76],"normal":[78],"for":[80],"audiovisual":[81,203],"mapping.":[82],"After":[83],"created,":[87],"animation":[89],"generated":[91],"via":[92],"at":[97],"by":[101],"using":[102],"output":[106,193],"probabilities.":[107],"To":[108],"accelerate":[109],"computing":[111],"efficiency":[112],"large":[119],"corpus,":[120],"this":[121,151],"also":[123,165],"proposes":[124,166],"two-layer":[126],"Viterbi":[127],"search":[128],"in":[130,139,146],"which":[131],"only":[132],"subsets":[134],"that":[135,188],"have":[136],"been":[137,156],"selected":[138],"first":[141],"layer":[142],"are":[143],"further":[144],"checked":[145],"second":[148],"layer.":[149],"Using":[150],"idea,":[152],"system":[154,217],"has":[155,208],"successfully":[157],"integrated":[158],"into":[159],"real-time":[160],"applications.":[161],"Furthermore,":[162],"mapping":[168,204],"emotional":[172],"expressions":[174,178],"from":[175],"neutral":[176],"Gaussian":[181],"mixture":[182],"models":[183],"(GMMs).":[184],"Final":[185],"experiments":[186],"prove":[187],"described":[191],"synthesized":[194],"parameters":[196],"high":[198],"quality.":[199],"Compared":[200],"other":[202],"methods,":[205],"our":[206],"performance":[210],"respect":[212],"expressiveness,":[214],"stability,":[215],"running":[218],"speed.":[219]},"counts_by_year":[{"year":2022,"cited_by_count":1},{"year":2014,"cited_by_count":1},{"year":2013,"cited_by_count":1},{"year":2012,"cited_by_count":5}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
