{"id":"https://openalex.org/W3081492798","doi":"https://doi.org/10.1145/3394171.3413532","title":"A Lip Sync Expert Is All You Need for Speech to Lip Generation In the Wild","display_name":"A Lip Sync Expert Is All You Need for Speech to Lip Generation In the Wild","publication_year":2020,"publication_date":"2020-10-12","ids":{"openalex":"https://openalex.org/W3081492798","doi":"https://doi.org/10.1145/3394171.3413532","mag":"3081492798"},"language":"en","primary_location":{"id":"doi:10.1145/3394171.3413532","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3394171.3413532","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 28th ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2008.10010","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5031415279","display_name":"K R Prajwal","orcid":null},"institutions":[{"id":"https://openalex.org/I64189192","display_name":"International Institute of Information Technology, Hyderabad","ror":"https://ror.org/05f11g639","country_code":"IN","type":"education","lineage":["https://openalex.org/I64189192"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"K R Prajwal","raw_affiliation_strings":["International Institute of Information Technology, Hyderabad, Hyderabad, India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"International Institute of Information Technology, Hyderabad, Hyderabad, India","institution_ids":["https://openalex.org/I64189192"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007660270","display_name":"Rudrabha Mukhopadhyay","orcid":"https://orcid.org/0009-0000-6628-7065"},"institutions":[{"id":"https://openalex.org/I64189192","display_name":"International Institute of Information Technology, Hyderabad","ror":"https://ror.org/05f11g639","country_code":"IN","type":"education","lineage":["https://openalex.org/I64189192"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Rudrabha Mukhopadhyay","raw_affiliation_strings":["International Institute of Information Technology, Hyderabad, Hyderabad, India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"International Institute of Information Technology, Hyderabad, Hyderabad, India","institution_ids":["https://openalex.org/I64189192"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007109424","display_name":"Vinay P. Namboodiri","orcid":"https://orcid.org/0000-0001-5262-9722"},"institutions":[{"id":"https://openalex.org/I51601045","display_name":"University of Bath","ror":"https://ror.org/002h8g185","country_code":"GB","type":"education","lineage":["https://openalex.org/I51601045"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Vinay P. Namboodiri","raw_affiliation_strings":["University of Bath, Bath, United Kingdom"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Bath, Bath, United Kingdom","institution_ids":["https://openalex.org/I51601045"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5053112307","display_name":"C. V. Jawahar","orcid":"https://orcid.org/0000-0001-6767-7057"},"institutions":[{"id":"https://openalex.org/I64189192","display_name":"International Institute of Information Technology, Hyderabad","ror":"https://ror.org/05f11g639","country_code":"IN","type":"education","lineage":["https://openalex.org/I64189192"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"C.V. Jawahar","raw_affiliation_strings":["International Institute of Information Technology, Hyderabad, Hyderabad, India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"International Institute of Information Technology, Hyderabad, Hyderabad, India","institution_ids":["https://openalex.org/I64189192"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5031415279"],"corresponding_institution_ids":["https://openalex.org/I64189192"],"apc_list":null,"apc_paid":null,"fwci":45.1596,"has_fulltext":true,"cited_by_count":796,"citation_normalized_percentile":{"value":0.9991516,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"484","last_page":"492"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.9786999821662903,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13289","display_name":"Infant Health and Development","score":0.9039999842643738,"subfield":{"id":"https://openalex.org/subfields/3611","display_name":"Pharmacy"},"field":{"id":"https://openalex.org/fields/36","display_name":"Health Professions"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/sync","display_name":"sync","score":0.8140698671340942},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5946795344352722},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5630682706832886},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.16823655366897583}],"concepts":[{"id":"https://openalex.org/C3913047","wikidata":"https://www.wikidata.org/wiki/Q1956265","display_name":"sync","level":3,"score":0.8140698671340942},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5946795344352722},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5630682706832886},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.16823655366897583},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1145/3394171.3413532","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3394171.3413532","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 28th ACM International Conference on Multimedia","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2008.10010","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2008.10010","pdf_url":"https://arxiv.org/pdf/2008.10010","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"pmh:oai:purehost.bath.ac.uk:openaire/1de8a9c1-df3d-48e6-8062-061ade1d0e9d","is_oa":true,"landing_page_url":"https://researchportal.bath.ac.uk/en/publications/1de8a9c1-df3d-48e6-8062-061ade1d0e9d","pdf_url":"https://purehost.bath.ac.uk/ws/files/211225619/Wav2Lip_ACMMM_20_camera_ready_2_.pdf","source":{"id":"https://openalex.org/S4377196294","display_name":"Pure (University of Bath)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I51601045","host_organization_name":"University of Bath","host_organization_lineage":["https://openalex.org/I51601045"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Prajwal, K R, Mukhopadhyay, R, Namboodiri, V & Jawahar, C V 2020, A Lip Sync Expert Is All You Need for Speech to Lip Generation In the Wild. in 28th ACM International Conference on Multimedia (ACM MM). Association for Computing Machinery, Seattle, USA, pp. 484\u2013492. https://doi.org/10.1145/3394171.3413532","raw_type":"contributionToPeriodical"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2008.10010","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2008.10010","pdf_url":"https://arxiv.org/pdf/2008.10010","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"score":0.6899999976158142,"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":32,"referenced_works":["https://openalex.org/W2015143272","https://openalex.org/W2029199293","https://openalex.org/W2133665775","https://openalex.org/W2146502635","https://openalex.org/W2194775991","https://openalex.org/W2502312327","https://openalex.org/W2594690981","https://openalex.org/W2604379605","https://openalex.org/W2613087992","https://openalex.org/W2738406145","https://openalex.org/W2782422271","https://openalex.org/W2883082281","https://openalex.org/W2890952074","https://openalex.org/W2891205112","https://openalex.org/W2914217321","https://openalex.org/W2944294033","https://openalex.org/W2960274051","https://openalex.org/W2963081548","https://openalex.org/W2963290645","https://openalex.org/W2964171275","https://openalex.org/W2969174745","https://openalex.org/W2970868842","https://openalex.org/W2979894294","https://openalex.org/W2995238198","https://openalex.org/W3035446294","https://openalex.org/W3036381647","https://openalex.org/W3038930935","https://openalex.org/W3097792222","https://openalex.org/W3105763085","https://openalex.org/W4240153047","https://openalex.org/W4298205916","https://openalex.org/W4394665544"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W4392306433","https://openalex.org/W2524993630","https://openalex.org/W2063547430","https://openalex.org/W2607244263","https://openalex.org/W2234430299","https://openalex.org/W1831690014","https://openalex.org/W1561022130"],"abstract_inverted_index":{"In":[0],"this":[1,82],"work,":[2],"we":[3,95],"investigate":[4],"the":[5,42,51,68,73,120,124,146,157],"problem":[6],"of":[7,13,37,54,67,123,149],"lip-syncing":[8],"a":[9,19,32,90,141],"talking":[10,60],"face":[11,61],"video":[12,69,143],"an":[14],"arbitrary":[15,55],"identity":[16],"to":[17,48,81,103],"match":[18],"target":[20],"speech":[21],"segment.":[22],"Current":[23],"works":[24],"excel":[25],"at":[26],"producing":[27],"accurate":[28],"lip":[29,52,106],"movements":[30,53],"on":[31,114,163],"static":[33],"image":[34],"or":[35],"videos":[36,125],"specific":[38],"people":[39],"seen":[40],"during":[41],"training":[43],"phase.":[44],"However,":[45],"they":[46],"fail":[47],"accurately":[49,104],"morph":[50],"identities":[56],"in":[57,64,108],"dynamic,":[58],"unconstrained":[59,109],"videos,":[62],"resulting":[63],"significant":[65],"parts":[66],"being":[70],"out-of-sync":[71],"with":[72],"new":[74],"audio.":[75],"We":[76,139],"identify":[77],"key":[78],"reasons":[79],"pertaining":[80],"and":[83,101,153,160],"hence":[84],"resolve":[85],"them":[86],"by":[87,127],"learning":[88],"from":[89],"powerful":[91],"lip-sync":[92,121],"discriminator.":[93],"Next,":[94],"propose":[96],"new,":[97],"rigorous":[98],"evaluation":[99,161],"benchmarks":[100,117,162],"metrics":[102],"measure":[105],"synchronization":[107],"videos.":[110,138],"Extensive":[111],"quantitative":[112],"evaluations":[113],"our":[115,128,150,164],"challenging":[116],"show":[118],"that":[119],"accuracy":[122],"generated":[126],"Wav2Lip":[129,151],"model":[130],"is":[131],"almost":[132],"as":[133,135],"good":[134],"real":[136],"synced":[137],"provide":[140],"demo":[142],"clearly":[144],"showing":[145],"substantial":[147],"impact":[148],"model,":[152],"also":[154],"publicly":[155],"release":[156],"code,":[158],"models,":[159],"website.":[165]},"counts_by_year":[{"year":2026,"cited_by_count":71},{"year":2025,"cited_by_count":222},{"year":2024,"cited_by_count":206},{"year":2023,"cited_by_count":162},{"year":2022,"cited_by_count":75},{"year":2021,"cited_by_count":56},{"year":2020,"cited_by_count":4}],"updated_date":"2026-06-04T09:04:59.091469","created_date":"2020-11-23T00:00:00"}
