{"id":"https://openalex.org/W2055675670","doi":"https://doi.org/10.1145/2491599.2491601","title":"Using multimodal speech production data to evaluate articulatory animation for audiovisual speech synthesis","display_name":"Using multimodal speech production data to evaluate articulatory animation for audiovisual speech synthesis","publication_year":2012,"publication_date":"2012-09-21","ids":{"openalex":"https://openalex.org/W2055675670","doi":"https://doi.org/10.1145/2491599.2491601","mag":"2055675670"},"language":"en","primary_location":{"id":"doi:10.1145/2491599.2491601","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2491599.2491601","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 3rd Symposium on Facial Analysis and Animation","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/1209.4982","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5004840801","display_name":"Ingmar Steiner","orcid":"https://orcid.org/0000-0001-6415-5915"},"institutions":[{"id":"https://openalex.org/I100930933","display_name":"University College Dublin","ror":"https://ror.org/05m7pjf47","country_code":"IE","type":"education","lineage":["https://openalex.org/I100930933"]}],"countries":["IE"],"is_corresponding":true,"raw_author_name":"Ingmar Steiner","raw_affiliation_strings":["University College Dublin","university college dublin"],"affiliations":[{"raw_affiliation_string":"University College Dublin","institution_ids":["https://openalex.org/I100930933"]},{"raw_affiliation_string":"university college dublin","institution_ids":["https://openalex.org/I100930933"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055415493","display_name":"Korin Richmond","orcid":"https://orcid.org/0000-0003-1450-8270"},"institutions":[{"id":"https://openalex.org/I98677209","display_name":"University of Edinburgh","ror":"https://ror.org/01nrxwf90","country_code":"GB","type":"education","lineage":["https://openalex.org/I98677209"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Korin Richmond","raw_affiliation_strings":["University of Edinburgh"],"affiliations":[{"raw_affiliation_string":"University of Edinburgh","institution_ids":["https://openalex.org/I98677209"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5044130608","display_name":"Slim Ouni","orcid":"https://orcid.org/0000-0001-5286-7368"},"institutions":[{"id":"https://openalex.org/I4210121838","display_name":"Laboratoire Lorrain de Recherche en Informatique et ses Applications","ror":"https://ror.org/02vnf0c38","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I1326498283","https://openalex.org/I277688954","https://openalex.org/I4210107720","https://openalex.org/I4210121838","https://openalex.org/I4210159245","https://openalex.org/I90183372"]},{"id":"https://openalex.org/I90183372","display_name":"Universit\u00e9 de Lorraine","ror":"https://ror.org/04vfs2w97","country_code":"FR","type":"education","lineage":["https://openalex.org/I90183372"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Slim Ouni","raw_affiliation_strings":["Universit\u00e9 de Lorraine, LORIA, UMR"],"affiliations":[{"raw_affiliation_string":"Universit\u00e9 de Lorraine, LORIA, UMR","institution_ids":["https://openalex.org/I90183372","https://openalex.org/I4210121838"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5004840801"],"corresponding_institution_ids":["https://openalex.org/I100930933"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.13690063,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"1"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10403","display_name":"Phonetics and Phonology Research","score":0.9901999831199646,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.9800000190734863,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/viseme","display_name":"Viseme","score":0.8399275541305542},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8036313056945801},{"id":"https://openalex.org/keywords/animation","display_name":"Animation","score":0.7991970777511597},{"id":"https://openalex.org/keywords/articulation","display_name":"Articulation (sociology)","score":0.7535732984542847},{"id":"https://openalex.org/keywords/morphing","display_name":"Morphing","score":0.6870481371879578},{"id":"https://openalex.org/keywords/computer-facial-animation","display_name":"Computer facial animation","score":0.6750932931900024},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6684069633483887},{"id":"https://openalex.org/keywords/computer-animation","display_name":"Computer animation","score":0.5575538277626038},{"id":"https://openalex.org/keywords/speech-synthesis","display_name":"Speech synthesis","score":0.49588117003440857},{"id":"https://openalex.org/keywords/speech-production","display_name":"Speech production","score":0.48689404129981995},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.4542522728443146},{"id":"https://openalex.org/keywords/production","display_name":"Production (economics)","score":0.41180163621902466},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.29537081718444824},{"id":"https://openalex.org/keywords/speech-technology","display_name":"Speech technology","score":0.22614476084709167},{"id":"https://openalex.org/keywords/computer-graphics","display_name":"Computer graphics (images)","score":0.13303667306900024}],"concepts":[{"id":"https://openalex.org/C33767174","wikidata":"https://www.wikidata.org/wiki/Q371190","display_name":"Viseme","level":4,"score":0.8399275541305542},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8036313056945801},{"id":"https://openalex.org/C502989409","wikidata":"https://www.wikidata.org/wiki/Q11425","display_name":"Animation","level":2,"score":0.7991970777511597},{"id":"https://openalex.org/C2779337067","wikidata":"https://www.wikidata.org/wiki/Q4800961","display_name":"Articulation (sociology)","level":3,"score":0.7535732984542847},{"id":"https://openalex.org/C50637493","wikidata":"https://www.wikidata.org/wiki/Q1136781","display_name":"Morphing","level":2,"score":0.6870481371879578},{"id":"https://openalex.org/C138591656","wikidata":"https://www.wikidata.org/wiki/Q5157538","display_name":"Computer facial animation","level":4,"score":0.6750932931900024},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6684069633483887},{"id":"https://openalex.org/C69369342","wikidata":"https://www.wikidata.org/wiki/Q1401416","display_name":"Computer animation","level":3,"score":0.5575538277626038},{"id":"https://openalex.org/C14999030","wikidata":"https://www.wikidata.org/wiki/Q16346","display_name":"Speech synthesis","level":2,"score":0.49588117003440857},{"id":"https://openalex.org/C43617652","wikidata":"https://www.wikidata.org/wiki/Q7575399","display_name":"Speech production","level":2,"score":0.48689404129981995},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.4542522728443146},{"id":"https://openalex.org/C2778348673","wikidata":"https://www.wikidata.org/wiki/Q739302","display_name":"Production (economics)","level":2,"score":0.41180163621902466},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.29537081718444824},{"id":"https://openalex.org/C504749915","wikidata":"https://www.wikidata.org/wiki/Q9010971","display_name":"Speech technology","level":3,"score":0.22614476084709167},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.13303667306900024},{"id":"https://openalex.org/C139719470","wikidata":"https://www.wikidata.org/wiki/Q39680","display_name":"Macroeconomics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1145/2491599.2491601","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2491599.2491601","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 3rd Symposium on Facial Analysis and Animation","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:1209.4982","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1209.4982","pdf_url":"https://arxiv.org/pdf/1209.4982","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"pmh:oai:HAL:hal-00734464v1","is_oa":false,"landing_page_url":"https://inria.hal.science/hal-00734464","pdf_url":null,"source":{"id":"https://openalex.org/S4406922461","display_name":"SPIRE - Sciences Po Institutional REpository","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"3rd International Symposium on Facial Analysis and Animation - FAA 2012, Sep 2012, Vienna, Austria","raw_type":"Conference papers"},{"id":"pmh:oai:pure.ed.ac.uk:publications/2c6e0e49-4ee6-4eba-b25a-f39be6e9f890","is_oa":false,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4306400321","display_name":"Edinburgh Research Explorer (University of Edinburgh)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I98677209","host_organization_name":"University of Edinburgh","host_organization_lineage":["https://openalex.org/I98677209"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":""}],"best_oa_location":{"id":"pmh:oai:arXiv.org:1209.4982","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1209.4982","pdf_url":"https://arxiv.org/pdf/1209.4982","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.6299999952316284,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":5,"referenced_works":["https://openalex.org/W2065086021","https://openalex.org/W2184487591","https://openalex.org/W2231075402","https://openalex.org/W2405733111","https://openalex.org/W3002898516"],"related_works":["https://openalex.org/W2401811665","https://openalex.org/W1974357398","https://openalex.org/W2295574089","https://openalex.org/W2053099149","https://openalex.org/W2350195158","https://openalex.org/W1971408785","https://openalex.org/W1559261064","https://openalex.org/W1792455311","https://openalex.org/W2087756952","https://openalex.org/W3133492806"],"abstract_inverted_index":{"The":[0],"importance":[1],"of":[2,26,33,46,60,73],"modeling":[3],"speech":[4,10,65],"articulation":[5],"for":[6,76],"high-quality":[7],"audiovisual":[8],"(AV)":[9],"synthesis":[11],"is":[12],"widely":[13],"acknowledged.":[14],"Nevertheless,":[15],"while":[16],"state-of-the-art,":[17],"data-driven":[18],"approaches":[19],"to":[20,55],"facial":[21,61],"animation":[22,32,75],"can":[23],"make":[24],"use":[25,45],"sophisticated":[27],"motion":[28],"capture":[29],"techniques,":[30],"the":[31,34,38,56,71],"intraoral":[35],"articulators":[36],"(viz.":[37],"tongue,":[39],"jaw,":[40],"and":[41],"velum)":[42],"typically":[43],"makes":[44],"simple":[47],"rules":[48],"or":[49],"viseme":[50],"morphing,":[51],"in":[52],"stark":[53],"contrast":[54],"otherwise":[57],"high":[58],"quality":[59,72],"modeling.":[62],"Using":[63],"appropriate":[64],"production":[66],"data":[67],"could":[68],"significantly":[69],"improve":[70],"articulatory":[74],"AV":[77],"synthesis.":[78]},"counts_by_year":[{"year":2016,"cited_by_count":1}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
