{"id":"https://openalex.org/W4399317045","doi":"https://doi.org/10.1145/3641233.3664312","title":"Audio2Rig: Artist-oriented deep learning tool for facial and lip sync animation","display_name":"Audio2Rig: Artist-oriented deep learning tool for facial and lip sync animation","publication_year":2024,"publication_date":"2024-07-18","ids":{"openalex":"https://openalex.org/W4399317045","doi":"https://doi.org/10.1145/3641233.3664312"},"language":"en","primary_location":{"id":"doi:10.1145/3641233.3664312","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3641233.3664312","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM SIGGRAPH 2024 Talks","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2405.20412","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5068986229","display_name":"Bastien Arcelin","orcid":"https://orcid.org/0000-0002-3553-792X"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Bastien Arcelin","raw_affiliation_strings":["Golaem, France","Golaem Rennes, France"],"raw_orcid":"https://orcid.org/0000-0002-3553-792X","affiliations":[{"raw_affiliation_string":"Golaem, France","institution_ids":[]},{"raw_affiliation_string":"Golaem Rennes, France","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5022836069","display_name":"Nicolas Chaverou","orcid":"https://orcid.org/0009-0003-8659-0880"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nicolas Chaverou","raw_affiliation_strings":["Golaem, Nw Caledonia"],"raw_orcid":"https://orcid.org/0009-0003-8659-0880","affiliations":[{"raw_affiliation_string":"Golaem, Nw Caledonia","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5068986229"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.2381,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.47781982,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"2"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.9703999757766724,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.9703999757766724,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/sync","display_name":"sync","score":0.8298523426055908},{"id":"https://openalex.org/keywords/animation","display_name":"Animation","score":0.6973366737365723},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6961249709129333},{"id":"https://openalex.org/keywords/computer-facial-animation","display_name":"Computer facial animation","score":0.6850355267524719},{"id":"https://openalex.org/keywords/computer-graphics","display_name":"Computer graphics (images)","score":0.4704272747039795},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.44612210988998413},{"id":"https://openalex.org/keywords/computer-animation","display_name":"Computer animation","score":0.3919413089752197},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3533521592617035},{"id":"https://openalex.org/keywords/multimedia","display_name":"Multimedia","score":0.33199605345726013}],"concepts":[{"id":"https://openalex.org/C3913047","wikidata":"https://www.wikidata.org/wiki/Q1956265","display_name":"sync","level":3,"score":0.8298523426055908},{"id":"https://openalex.org/C502989409","wikidata":"https://www.wikidata.org/wiki/Q11425","display_name":"Animation","level":2,"score":0.6973366737365723},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6961249709129333},{"id":"https://openalex.org/C138591656","wikidata":"https://www.wikidata.org/wiki/Q5157538","display_name":"Computer facial animation","level":4,"score":0.6850355267524719},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.4704272747039795},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.44612210988998413},{"id":"https://openalex.org/C69369342","wikidata":"https://www.wikidata.org/wiki/Q1401416","display_name":"Computer animation","level":3,"score":0.3919413089752197},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3533521592617035},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.33199605345726013},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3641233.3664312","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3641233.3664312","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM SIGGRAPH 2024 Talks","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2405.20412","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2405.20412","pdf_url":"https://arxiv.org/pdf/2405.20412","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2405.20412","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2405.20412","pdf_url":"https://arxiv.org/pdf/2405.20412","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"score":0.6100000143051147,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4399317045.pdf","grobid_xml":"https://content.openalex.org/works/W4399317045.grobid-xml"},"referenced_works_count":2,"referenced_works":["https://openalex.org/W2739192055","https://openalex.org/W4385623693"],"related_works":["https://openalex.org/W1544039745","https://openalex.org/W2121378366","https://openalex.org/W2999276620","https://openalex.org/W2532377291","https://openalex.org/W1976926596","https://openalex.org/W2989004599","https://openalex.org/W2535923857","https://openalex.org/W3094080214","https://openalex.org/W2156310872","https://openalex.org/W2356609371"],"abstract_inverted_index":{"Creating":[0],"realistic":[1],"or":[2,159,175],"stylized":[3,96],"facial":[4,69],"and":[5,18,26,45,70,91,95,169,179,211,219],"lip":[6,71],"sync":[7,21,72],"animation":[8,74,120,195],"is":[9,127,212],"a":[10,54,65],"tedious":[11],"task.":[12],"It":[13],"requires":[14],"lot":[15],"of":[16,48,64,102,140,151],"time":[17,41],"skills":[19],"to":[20,31,38,67,173],"the":[22,28,32,43,49,100,103,108,116,119,152,156,177,185,199,204,208],"lips":[23,158],"with":[24],"audio":[25,77],"convey":[27],"right":[29],"emotion":[30],"character\u2019s":[33],"face.":[34],"To":[35],"allow":[36],"animators":[37,163],"spend":[39],"more":[40],"on":[42,115,129,184,207],"artistic":[44],"creative":[46],"part":[47],"animation,":[50],"we":[51],"present":[52],"Audio2Rig:":[53],"new":[55],"deep":[56],"learning":[57],"based":[58,128],"tool":[59],"leveraging":[60],"previously":[61],"animated":[62],"sequences":[63],"show,":[66],"generate":[68],"rig":[73,87,117],"from":[75,84,221],"an":[76,137],"file.":[78],"Based":[79],"in":[80,107],"Maya,":[81],"it":[82,112,215],"learns":[83],"any":[85,89],"production":[86],"without":[88],"adjustment":[90],"generates":[92,113],"high":[93,181],"quality":[94],"animations":[97],"which":[98,134],"mimic":[99],"style":[101],"show.":[104],"Audio2Rig":[105],"fits":[106],"animator":[109],"workflow:":[110],"since":[111],"keys":[114],"controllers,":[118],"can":[121,135,145,164],"be":[122,146],"easily":[123],"retaken.":[124],"The":[125],"method":[126,189],"3":[130],"neural":[131],"network":[132],"modules":[133],"learn":[136],"arbitrary":[138],"number":[139],"controllers.":[141],"Hence,":[142],"different":[143,167],"configurations":[144],"created":[147],"for":[148],"specific":[149],"parts":[150],"face":[153],"(such":[154],"as":[155,203],"tongue,":[157],"eyes).":[160],"With":[161],"Audio2Rig,":[162],"also":[165],"pick":[166],"emotions":[168],"adjust":[170],"their":[171],"intensities":[172],"experiment":[174],"customize":[176],"output,":[178],"have":[180],"level":[182],"controls":[183],"keyframes":[186],"setting.":[187],"Our":[188],"shows":[190],"excellent":[191],"results,":[192],"generating":[193],"fine":[194],"details":[196],"while":[197],"respecting":[198],"show":[200],"style.":[201],"Finally,":[202],"training":[205],"relies":[206],"studio":[209],"data":[210,217],"done":[213],"internally,":[214],"ensures":[216],"privacy":[218],"prevents":[220],"copyright":[222],"infringement.":[223]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2024-06-04T00:00:00"}
