{"id":"https://openalex.org/W7109971032","doi":"https://doi.org/10.1145/3757377.3763842","title":"Uni3C: Unifying Precisely 3D-Enhanced Camera and Human Motion Controls for Video Generation","display_name":"Uni3C: Unifying Precisely 3D-Enhanced Camera and Human Motion Controls for Video Generation","publication_year":2025,"publication_date":"2025-12-08","ids":{"openalex":"https://openalex.org/W7109971032","doi":"https://doi.org/10.1145/3757377.3763842"},"language":null,"primary_location":{"id":"doi:10.1145/3757377.3763842","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3757377.3763842","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the SIGGRAPH Asia 2025 Conference Papers","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Chenjie Cao","orcid":"https://orcid.org/0000-0003-3916-2843"},"institutions":[{"id":"https://openalex.org/I45928872","display_name":"Alibaba Group (China)","ror":"https://ror.org/00k642b80","country_code":"CN","type":"company","lineage":["https://openalex.org/I45928872"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Chenjie Cao","raw_affiliation_strings":["Alibaba Group, Hangzhou, China and Fudan University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Alibaba Group, Hangzhou, China and Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I45928872"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Jingkai Zhou","orcid":"https://orcid.org/0000-0003-4629-0659"},"institutions":[{"id":"https://openalex.org/I45928872","display_name":"Alibaba Group (China)","ror":"https://ror.org/00k642b80","country_code":"CN","type":"company","lineage":["https://openalex.org/I45928872"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jingkai Zhou","raw_affiliation_strings":["Alibaba Group, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Alibaba Group, Hangzhou, China","institution_ids":["https://openalex.org/I45928872"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Shikai Li","orcid":"https://orcid.org/0000-0002-9674-2556"},"institutions":[{"id":"https://openalex.org/I45928872","display_name":"Alibaba Group (China)","ror":"https://ror.org/00k642b80","country_code":"CN","type":"company","lineage":["https://openalex.org/I45928872"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shikai Li","raw_affiliation_strings":["Alibaba Group, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Alibaba Group, Hangzhou, China","institution_ids":["https://openalex.org/I45928872"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Jingyun Liang","orcid":"https://orcid.org/0000-0001-9841-8584"},"institutions":[{"id":"https://openalex.org/I45928872","display_name":"Alibaba Group (China)","ror":"https://ror.org/00k642b80","country_code":"CN","type":"company","lineage":["https://openalex.org/I45928872"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jingyun Liang","raw_affiliation_strings":["Alibaba Group, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Alibaba Group, Beijing, China","institution_ids":["https://openalex.org/I45928872"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Chaohui Yu","orcid":"https://orcid.org/0000-0002-7852-4491"},"institutions":[{"id":"https://openalex.org/I45928872","display_name":"Alibaba Group (China)","ror":"https://ror.org/00k642b80","country_code":"CN","type":"company","lineage":["https://openalex.org/I45928872"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chaohui Yu","raw_affiliation_strings":["Alibaba Group, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Alibaba Group, Beijing, China","institution_ids":["https://openalex.org/I45928872"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Fan Wang","orcid":"https://orcid.org/0000-0001-7320-1119"},"institutions":[{"id":"https://openalex.org/I4210095624","display_name":"Alibaba Group (United States)","ror":"https://ror.org/00rn0m335","country_code":"US","type":"company","lineage":["https://openalex.org/I4210095624","https://openalex.org/I45928872"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Fan Wang","raw_affiliation_strings":["Alibaba Group, California, USA"],"affiliations":[{"raw_affiliation_string":"Alibaba Group, California, USA","institution_ids":["https://openalex.org/I4210095624"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Xiangyang Xue","orcid":"https://orcid.org/0000-0002-4897-9209"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiangyang Xue","raw_affiliation_strings":["Fudan University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"last","author":{"id":null,"display_name":"Yanwei Fu","orcid":"https://orcid.org/0000-0002-6595-6893"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yanwei Fu","raw_affiliation_strings":["Fudan University, Shanghai, China and Shanghai Innovation Institute, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Fudan University, Shanghai, China and Shanghai Innovation Institute, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":8,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I45928872"],"apc_list":null,"apc_paid":null,"fwci":1.2656,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.85701993,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"12"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.6891000270843506,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.6891000270843506,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.14959999918937683,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.05869999900460243,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.536899983882904},{"id":"https://openalex.org/keywords/camera-auto-calibration","display_name":"Camera auto-calibration","score":0.4677000045776367},{"id":"https://openalex.org/keywords/video-tracking","display_name":"Video tracking","score":0.42010000348091125},{"id":"https://openalex.org/keywords/motion","display_name":"Motion (physics)","score":0.41260001063346863},{"id":"https://openalex.org/keywords/point-cloud","display_name":"Point cloud","score":0.3930000066757202},{"id":"https://openalex.org/keywords/camera-resectioning","display_name":"Camera resectioning","score":0.3774999976158142},{"id":"https://openalex.org/keywords/motion-compensation","display_name":"Motion compensation","score":0.36660000681877136},{"id":"https://openalex.org/keywords/motion-estimation","display_name":"Motion estimation","score":0.3634999990463257},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.3603000044822693}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7932000160217285},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7663999795913696},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.7613999843597412},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.536899983882904},{"id":"https://openalex.org/C94816000","wikidata":"https://www.wikidata.org/wiki/Q5026006","display_name":"Camera auto-calibration","level":3,"score":0.4677000045776367},{"id":"https://openalex.org/C202474056","wikidata":"https://www.wikidata.org/wiki/Q1931635","display_name":"Video tracking","level":3,"score":0.42010000348091125},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.41260001063346863},{"id":"https://openalex.org/C131979681","wikidata":"https://www.wikidata.org/wiki/Q1899648","display_name":"Point cloud","level":2,"score":0.3930000066757202},{"id":"https://openalex.org/C110898773","wikidata":"https://www.wikidata.org/wiki/Q2933935","display_name":"Camera resectioning","level":2,"score":0.3774999976158142},{"id":"https://openalex.org/C128840427","wikidata":"https://www.wikidata.org/wiki/Q1302174","display_name":"Motion compensation","level":2,"score":0.36660000681877136},{"id":"https://openalex.org/C10161872","wikidata":"https://www.wikidata.org/wiki/Q557891","display_name":"Motion estimation","level":2,"score":0.3634999990463257},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.3603000044822693},{"id":"https://openalex.org/C48007421","wikidata":"https://www.wikidata.org/wiki/Q676252","display_name":"Motion capture","level":3,"score":0.3555000126361847},{"id":"https://openalex.org/C2778852477","wikidata":"https://www.wikidata.org/wiki/Q313614","display_name":"Video camera","level":2,"score":0.3384999930858612},{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.3212999999523163},{"id":"https://openalex.org/C2986578859","wikidata":"https://www.wikidata.org/wiki/Q657632","display_name":"Human motion","level":3,"score":0.3077999949455261},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.3077000081539154},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.30230000615119934},{"id":"https://openalex.org/C146159030","wikidata":"https://www.wikidata.org/wiki/Q7625099","display_name":"Structure from motion","level":3,"score":0.2939999997615814},{"id":"https://openalex.org/C95020103","wikidata":"https://www.wikidata.org/wiki/Q1813492","display_name":"Match moving","level":3,"score":0.2924000024795532},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.2847999930381775},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.28290000557899475},{"id":"https://openalex.org/C48209547","wikidata":"https://www.wikidata.org/wiki/Q1331104","display_name":"Controllability","level":2,"score":0.2827000021934509},{"id":"https://openalex.org/C65909025","wikidata":"https://www.wikidata.org/wiki/Q1945033","display_name":"Monocular","level":2,"score":0.2689000070095062},{"id":"https://openalex.org/C145565327","wikidata":"https://www.wikidata.org/wiki/Q852514","display_name":"Motion control","level":3,"score":0.2660999894142151},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.26440000534057617},{"id":"https://openalex.org/C27402916","wikidata":"https://www.wikidata.org/wiki/Q31009","display_name":"Image stabilization","level":3,"score":0.26409998536109924},{"id":"https://openalex.org/C124774092","wikidata":"https://www.wikidata.org/wiki/Q6917782","display_name":"Motion field","level":3,"score":0.2538999915122986}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3757377.3763842","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3757377.3763842","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the SIGGRAPH Asia 2025 Conference Papers","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":38,"referenced_works":["https://openalex.org/W2128019145","https://openalex.org/W2474702929","https://openalex.org/W2519683295","https://openalex.org/W2738551266","https://openalex.org/W2963557767","https://openalex.org/W2978956737","https://openalex.org/W3111114371","https://openalex.org/W3132270109","https://openalex.org/W3176252609","https://openalex.org/W3196466825","https://openalex.org/W3215769467","https://openalex.org/W4312369807","https://openalex.org/W4312635677","https://openalex.org/W4312639824","https://openalex.org/W4312933868","https://openalex.org/W4386071865","https://openalex.org/W4388284323","https://openalex.org/W4390872297","https://openalex.org/W4390873054","https://openalex.org/W4391622623","https://openalex.org/W4399563538","https://openalex.org/W4400573519","https://openalex.org/W4402704510","https://openalex.org/W4402704593","https://openalex.org/W4402704622","https://openalex.org/W4402727037","https://openalex.org/W4402754033","https://openalex.org/W4402754111","https://openalex.org/W4402775760","https://openalex.org/W4403624672","https://openalex.org/W4413144558","https://openalex.org/W4413145386","https://openalex.org/W4413145609","https://openalex.org/W4413146013","https://openalex.org/W4413146238","https://openalex.org/W4413146758","https://openalex.org/W4413147655","https://openalex.org/W4413513763"],"related_works":[],"abstract_inverted_index":{"Camera":[0],"and":[1,45,93,165,175,205,219],"human":[2,46,135,176,206,220],"motion":[3,47,136,190,207],"controls":[4],"have":[5],"been":[6],"extensively":[7],"studied":[8],"for":[9,26,39,154,173,191],"video":[10,49,67,98,195],"generation,":[11],"but":[12],"existing":[13],"approaches":[14],"typically":[15],"address":[16],"them":[17],"separately,":[18],"suffering":[19],"from":[20,76],"limited":[21],"data":[22],"with":[23,64],"high-quality":[24],"annotations":[25],"both":[27,43,161,202],"aspects.":[28],"To":[29],"overcome":[30],"this,":[31],"we":[32,57,146,210],"present":[33],"Uni3C,":[34],"a":[35,59,65,148],"unified":[36],"3D-enhanced":[37],"framework":[38],"precise":[40],"control":[41,61,133,171],"of":[42,90,97,108,122,194,226],"camera":[44,82,132,174,189,203,217],"in":[48,127,187,201],"generation.":[50,196],"Uni3C":[51,123,197],"includes":[52],"two":[53],"key":[54],"contributions.":[55],"First,":[56],"propose":[58,147],"plug-and-play":[60],"module":[62],"trained":[63,126],"frozen":[66,114],"generative":[68],"backbone,":[69],"PCDController,":[70],"which":[71],"utilizes":[72],"unprojected":[73],"point":[74,91,163],"clouds":[75,92,164],"monocular":[77],"depth":[78],"to":[79,124,168,222],"achieve":[80],"accurate":[81],"control.":[83],"By":[84],"leveraging":[85],"the":[86,94,110,139,155,170,224],"strong":[87,185],"3D":[88,151],"priors":[89],"powerful":[95],"capacities":[96],"foundational":[99],"models,":[100],"PCDController":[101,183],"shows":[102],"impressive":[103],"generalization,":[104],"performing":[105],"well":[106],"regardless":[107],"whether":[109],"inference":[111,156],"backbone":[112],"is":[113],"or":[115,134],"fine-tuned.":[116],"This":[117],"flexibility":[118],"enables":[119],"different":[120],"modules":[121],"be":[125],"specific":[128],"domains,":[129],"i.e.,":[130],"either":[131],"control,":[137],"reducing":[138],"dependency":[140],"on":[141],"jointly":[142,149],"annotated":[143],"data.":[144],"Second,":[145],"aligned":[150],"world":[152],"guidance":[153],"phase":[157],"that":[158,182],"seamlessly":[159],"integrates":[160],"scenic":[162],"SMPL-X":[166],"characters":[167],"unify":[169],"signals":[172],"motion,":[177],"respectively.":[178],"Extensive":[179],"experiments":[180],"confirm":[181],"enjoys":[184],"robustness":[186],"driving":[188],"fine-tuned":[192],"backbones":[193],"substantially":[198],"outperforms":[199],"competitors":[200],"controllability":[204],"quality.":[208],"Additionally,":[209],"collect":[211],"tailored":[212],"validation":[213],"sets":[214],"featuring":[215],"challenging":[216],"movements":[218],"actions":[221],"validate":[223],"effectiveness":[225],"our":[227],"method.":[228],"Codes":[229],"are":[230],"released":[231],"at":[232],"https://github.com/alibaba-damo-academy/Uni3C.":[233]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-12-10T02:45:41.426853","created_date":"2025-12-08T00:00:00"}
