{"id":"https://openalex.org/W7152692234","doi":"https://doi.org/10.48550/arxiv.2604.07273","title":"GenLCA: 3D Diffusion for Full-Body Avatars from In-the-Wild Videos","display_name":"GenLCA: 3D Diffusion for Full-Body Avatars from In-the-Wild Videos","publication_year":2026,"publication_date":"2026-04-08","ids":{"openalex":"https://openalex.org/W7152692234","doi":"https://doi.org/10.48550/arxiv.2604.07273"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.07273","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.07273","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.07273","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5133249928","display_name":"Yiqian Wu","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Wu, Yiqian","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133284195","display_name":"Rawal Khirodkar","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Khirodkar, Rawal","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072400499","display_name":"Egor Zakharov","orcid":"https://orcid.org/0000-0002-9880-9531"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zakharov, Egor","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085847990","display_name":"Timur Bagautdinov","orcid":"https://orcid.org/0000-0001-6541-8086"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bagautdinov, Timur","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133281676","display_name":"Lei Xiao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiao, Lei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113802241","display_name":"Zhaoen Su","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Su, Zhaoen","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133280524","display_name":"Shunsuke Saito","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Saito, Shunsuke","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133305644","display_name":"Xiaogang Jin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jin, Xiaogang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5133274997","display_name":"Junxuan Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Junxuan","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5133249928"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.7942000031471252,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.7942000031471252,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.048900000751018524,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.035100001841783524,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.5695000290870667},{"id":"https://openalex.org/keywords/avatar","display_name":"Avatar","score":0.5030999779701233},{"id":"https://openalex.org/keywords/generalizability-theory","display_name":"Generalizability theory","score":0.4318999946117401},{"id":"https://openalex.org/keywords/frame","display_name":"Frame (networking)","score":0.4296000003814697},{"id":"https://openalex.org/keywords/security-token","display_name":"Security token","score":0.4296000003814697},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.423799991607666},{"id":"https://openalex.org/keywords/transparency","display_name":"Transparency (behavior)","score":0.322299987077713},{"id":"https://openalex.org/keywords/image-editing","display_name":"Image editing","score":0.3215999901294708},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.31540000438690186}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.848800003528595},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6021999716758728},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5997999906539917},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.5695000290870667},{"id":"https://openalex.org/C2777365542","wikidata":"https://www.wikidata.org/wiki/Q83090","display_name":"Avatar","level":2,"score":0.5030999779701233},{"id":"https://openalex.org/C27158222","wikidata":"https://www.wikidata.org/wiki/Q5532422","display_name":"Generalizability theory","level":2,"score":0.4318999946117401},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.4296000003814697},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.4296000003814697},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.423799991607666},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.3598000109195709},{"id":"https://openalex.org/C2780233690","wikidata":"https://www.wikidata.org/wiki/Q535347","display_name":"Transparency (behavior)","level":2,"score":0.322299987077713},{"id":"https://openalex.org/C2776674983","wikidata":"https://www.wikidata.org/wiki/Q545981","display_name":"Image editing","level":3,"score":0.3215999901294708},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.31540000438690186},{"id":"https://openalex.org/C83248878","wikidata":"https://www.wikidata.org/wiki/Q344000","display_name":"Active appearance model","level":3,"score":0.3122999966144562},{"id":"https://openalex.org/C61265191","wikidata":"https://www.wikidata.org/wiki/Q767770","display_name":"Scale-invariant feature transform","level":3,"score":0.29429998993873596},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.29330000281333923},{"id":"https://openalex.org/C2780695315","wikidata":"https://www.wikidata.org/wiki/Q3799040","display_name":"Unobservable","level":2,"score":0.2912999987602234},{"id":"https://openalex.org/C69357855","wikidata":"https://www.wikidata.org/wiki/Q163214","display_name":"Diffusion","level":2,"score":0.2856000065803528},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.2825999855995178},{"id":"https://openalex.org/C3019007443","wikidata":"https://www.wikidata.org/wiki/Q568742","display_name":"3d model","level":2,"score":0.2777000069618225},{"id":"https://openalex.org/C2777897806","wikidata":"https://www.wikidata.org/wiki/Q568742","display_name":"3D modeling","level":2,"score":0.27630001306533813},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.2637999951839447},{"id":"https://openalex.org/C78201319","wikidata":"https://www.wikidata.org/wiki/Q685727","display_name":"Grayscale","level":3,"score":0.26019999384880066},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.25850000977516174},{"id":"https://openalex.org/C153715457","wikidata":"https://www.wikidata.org/wiki/Q254183","display_name":"Augmented reality","level":2,"score":0.2572999894618988},{"id":"https://openalex.org/C2780310081","wikidata":"https://www.wikidata.org/wiki/Q1154312","display_name":"Video editing","level":2,"score":0.25519999861717224},{"id":"https://openalex.org/C29081049","wikidata":"https://www.wikidata.org/wiki/Q1364242","display_name":"Image stitching","level":2,"score":0.251800000667572},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2502000033855438}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.07273","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.07273","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.07273","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.07273","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"We":[0,151,194],"present":[1],"GenLCA,":[2],"a":[3,38,44,84,131,154,188,213],"diffusion-based":[4],"generative":[5],"model":[6,48,89,157,190],"for":[7],"generating":[8],"and":[9,16,31,72,144,166,203,206],"editing":[10,207],"photorealistic":[11],"full-body":[12,32,45],"avatars":[13,21],"from":[14,49],"text":[15],"image":[17],"inputs.":[18],"The":[19,34,216],"generated":[20],"are":[22],"faithful":[23],"to":[24,58,60,68,186],"the":[25,55,69,80,123,159,164,170,179,196],"inputs,":[26],"while":[27],"supporting":[28],"high-fidelity":[29,204],"facial":[30],"animations.":[33],"core":[35],"idea":[36],"is":[37,219],"novel":[39,132],"paradigm":[40],"that":[41,137],"enables":[42,178],"training":[43,56,135],"3D":[46,93,102,124],"diffusion":[47,134,156,189],"partially":[50],"observable":[51],"2D":[52],"data,":[53],"allowing":[54],"dataset":[57,81],"scale":[59,78],"millions":[61],"of":[62,74,112,181,198],"real-world":[63,106,183],"videos.":[64],"This":[65],"scalability":[66],"contributes":[67],"superior":[70],"photorealism":[71,165],"generalizability":[73],"GenLCA.":[75],"Specifically,":[76],"we":[77,129],"up":[79],"by":[82,169,212],"repurposing":[83],"pretrained":[85,171],"feed-forward":[86],"avatar":[87,172],"reconstruction":[88,173],"as":[90],"an":[91],"animatable":[92],"tokenizer,":[94],"which":[95],"encodes":[96],"unstructured":[97],"video":[98,184],"frames":[99],"into":[100],"structured":[101],"tokens.":[103,125],"However,":[104],"most":[105],"videos":[107],"only":[108,147],"provide":[109],"partial":[110],"observations":[111],"body":[113],"parts,":[114],"resulting":[115],"in":[116,122,192],"excessive":[117],"blurring":[118],"or":[119],"transparency":[120],"artifacts":[121],"To":[126],"address":[127],"this,":[128],"propose":[130],"visibility-aware":[133],"strategy":[136],"replaces":[138],"invalid":[139],"regions":[140],"with":[141],"learnable":[142],"tokens":[143],"computes":[145],"losses":[146],"over":[148],"valid":[149],"regions.":[150],"then":[152],"train":[153,187],"flow-based":[155],"on":[158],"token":[160],"dataset,":[161],"inherently":[162],"maintaining":[163],"animatability":[167],"provided":[168],"model.":[174],"Our":[175],"approach":[176],"effectively":[177],"use":[180],"large-scale":[182],"data":[185],"natively":[191],"3D.":[193],"demonstrate":[195],"efficacy":[197],"our":[199],"method":[200],"through":[201],"diverse":[202],"generation":[205],"results,":[208],"outperforming":[209],"existing":[210],"solutions":[211],"large":[214],"margin.":[215],"project":[217],"page":[218],"available":[220],"at":[221],"https://onethousandwu.com/GenLCA-Page.":[222]},"counts_by_year":[],"updated_date":"2026-04-10T06:07:51.998497","created_date":"2026-04-10T00:00:00"}
