{"id":"https://openalex.org/W4224920309","doi":"https://doi.org/10.1109/icassp43922.2022.9747663","title":"TalkingFlow: Talking Facial Landmark Generation with Multi-Scale Normalizing Flow Network","display_name":"TalkingFlow: Talking Facial Landmark Generation with Multi-Scale Normalizing Flow Network","publication_year":2022,"publication_date":"2022-04-27","ids":{"openalex":"https://openalex.org/W4224920309","doi":"https://doi.org/10.1109/icassp43922.2022.9747663"},"language":"en","primary_location":{"id":"doi:10.1109/icassp43922.2022.9747663","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp43922.2022.9747663","pdf_url":null,"source":{"id":"https://openalex.org/S4363607702","display_name":"ICASSP 2022 - 2022 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2022 - 2022 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100745999","display_name":"Sen Liang","orcid":"https://orcid.org/0000-0001-5511-2614"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]},{"id":"https://openalex.org/I4210123185","display_name":"Zhejiang Lab","ror":"https://ror.org/02m2h7991","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210123185"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Sen Liang","raw_affiliation_strings":["Zhejiang University,State Key Lab of CAD&#x0026;CG","Zhejiang Lab"],"affiliations":[{"raw_affiliation_string":"Zhejiang University,State Key Lab of CAD&#x0026;CG","institution_ids":["https://openalex.org/I76130692"]},{"raw_affiliation_string":"Zhejiang Lab","institution_ids":["https://openalex.org/I4210123185"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050539684","display_name":"Zhize Zhou","orcid":"https://orcid.org/0000-0001-9576-1686"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhize Zhou","raw_affiliation_strings":["Zhejiang University,State Key Lab of CAD&#x0026;CG"],"affiliations":[{"raw_affiliation_string":"Zhejiang University,State Key Lab of CAD&#x0026;CG","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017923507","display_name":"Rong Li","orcid":"https://orcid.org/0000-0001-5894-1434"},"institutions":[{"id":"https://openalex.org/I4210123185","display_name":"Zhejiang Lab","ror":"https://ror.org/02m2h7991","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210123185"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Rong Li","raw_affiliation_strings":["Zhejiang Lab"],"affiliations":[{"raw_affiliation_string":"Zhejiang Lab","institution_ids":["https://openalex.org/I4210123185"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101904821","display_name":"Juyong Zhang","orcid":"https://orcid.org/0000-0002-1805-1426"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Juyong Zhang","raw_affiliation_strings":["University of Science and Technology of China"],"affiliations":[{"raw_affiliation_string":"University of Science and Technology of China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5059021869","display_name":"Hujun Bao","orcid":"https://orcid.org/0000-0002-2662-0334"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]},{"id":"https://openalex.org/I4210123185","display_name":"Zhejiang Lab","ror":"https://ror.org/02m2h7991","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210123185"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hujun Bao","raw_affiliation_strings":["Zhejiang University,State Key Lab of CAD&#x0026;CG","Zhejiang Lab"],"affiliations":[{"raw_affiliation_string":"Zhejiang University,State Key Lab of CAD&#x0026;CG","institution_ids":["https://openalex.org/I76130692"]},{"raw_affiliation_string":"Zhejiang Lab","institution_ids":["https://openalex.org/I4210123185"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5100745999"],"corresponding_institution_ids":["https://openalex.org/I4210123185","https://openalex.org/I76130692"],"apc_list":null,"apc_paid":null,"fwci":0.1798,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.47996578,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"4628","last_page":"4632"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.9973000288009644,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/landmark","display_name":"Landmark","score":0.8452073335647583},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8019567131996155},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5336604118347168},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5175334811210632},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.49440455436706543},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.44868505001068115},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.44621849060058594},{"id":"https://openalex.org/keywords/face","display_name":"Face (sociological concept)","score":0.4157651960849762},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.413382351398468},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3760348856449127},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.15536129474639893}],"concepts":[{"id":"https://openalex.org/C2780297707","wikidata":"https://www.wikidata.org/wiki/Q4895393","display_name":"Landmark","level":2,"score":0.8452073335647583},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8019567131996155},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5336604118347168},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5175334811210632},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.49440455436706543},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.44868505001068115},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.44621849060058594},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.4157651960849762},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.413382351398468},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3760348856449127},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.15536129474639893},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C36289849","wikidata":"https://www.wikidata.org/wiki/Q34749","display_name":"Social science","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp43922.2022.9747663","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp43922.2022.9747663","pdf_url":null,"source":{"id":"https://openalex.org/S4363607702","display_name":"ICASSP 2022 - 2022 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2022 - 2022 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":31,"referenced_works":["https://openalex.org/W1959608418","https://openalex.org/W2015143272","https://openalex.org/W2423557781","https://openalex.org/W2604379605","https://openalex.org/W2738406145","https://openalex.org/W2795230330","https://openalex.org/W2918222882","https://openalex.org/W2944294033","https://openalex.org/W2945629925","https://openalex.org/W2963300588","https://openalex.org/W3019952993","https://openalex.org/W3047371217","https://openalex.org/W3096831136","https://openalex.org/W3107666850","https://openalex.org/W3107914916","https://openalex.org/W3109114891","https://openalex.org/W3160318142","https://openalex.org/W3174763799","https://openalex.org/W4200174933","https://openalex.org/W4288558691","https://openalex.org/W4289761690","https://openalex.org/W4295312788","https://openalex.org/W4297798428","https://openalex.org/W6640963894","https://openalex.org/W6714644935","https://openalex.org/W6735927292","https://openalex.org/W6752910514","https://openalex.org/W6759845760","https://openalex.org/W6759977823","https://openalex.org/W6766978945","https://openalex.org/W6795283348"],"related_works":["https://openalex.org/W2056853153","https://openalex.org/W2057559274","https://openalex.org/W2005087563","https://openalex.org/W2378111931","https://openalex.org/W4243161226","https://openalex.org/W2010533810","https://openalex.org/W2950647290","https://openalex.org/W2356918560","https://openalex.org/W1968481813","https://openalex.org/W2392886708"],"abstract_inverted_index":{"Deterministic":[0],"models":[1,35],"dominate":[2],"the":[3,28],"field":[4],"of":[5],"talking":[6,62],"facial":[7,19,63,107],"land-mark":[8],"generation":[9],"by":[10,74],"directly":[11],"mapping":[12],"speech":[13,69,93,110],"signals":[14],"to":[15,27,39,59,79,91],"a":[16,53,75,85],"certain":[17],"lip-sync":[18],"landmark":[20,64,108],"sequence,":[21],"which":[22],"often":[23],"suffer":[24],"from":[25,68,109],"regression":[26],"mean":[29],"face.":[30],"In":[31,48],"contrast,":[32],"probability":[33],"generative":[34],"are":[36],"more":[37],"beneficial":[38],"handle":[40],"complex":[41],"data":[42],"space":[43],"and":[44,84,105],"generate":[45,60,103],"diverse":[46,104],"samples.":[47],"this":[49],"work,":[50],"we":[51],"pro-pose":[52],"flow-based":[54],"probabilistic":[55],"network":[56],"named":[57],"TalkingFlow":[58],"natural":[61,106],"with":[65],"head":[66],"movements":[67],"data.":[70,94,111],"It":[71],"is":[72],"implemented":[73],"weighted":[76],"multi-scale":[77],"architecture":[78],"improve":[80],"model":[81],"representation":[82],"capability":[83],"conditional":[86],"Temporal":[87],"Convolutional":[88],"Network":[89],"module":[90],"fuse":[92],"Extensive":[95],"experiments":[96],"results":[97],"show":[98],"that":[99],"it":[100],"can":[101],"effectively":[102],"All":[112],"code":[113],"will":[114],"be":[115],"made":[116],"publicly":[117],"available":[118],"online.":[119]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
