{"id":"https://openalex.org/W7148793960","doi":"https://doi.org/10.48550/arxiv.2604.01666","title":"DynaVid: Learning to Generate Highly Dynamic Videos using Synthetic Motion Data","display_name":"DynaVid: Learning to Generate Highly Dynamic Videos using Synthetic Motion Data","publication_year":2026,"publication_date":"2026-04-02","ids":{"openalex":"https://openalex.org/W7148793960","doi":"https://doi.org/10.48550/arxiv.2604.01666"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.01666","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.01666","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.01666","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5060056889","display_name":"Wonjoon Jin","orcid":"https://orcid.org/0000-0001-6883-3920"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jin, Wonjoon","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132903557","display_name":"Jiyun Won","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Won, Jiyun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132905699","display_name":"Janghyeok Han","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Han, Janghyeok","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132886080","display_name":"Qi Dai","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dai, Qi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132831348","display_name":"Chong Luo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Luo, Chong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031628798","display_name":"Seung-Hwan Baek","orcid":"https://orcid.org/0000-0002-8635-4277"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Baek, Seung-Hwan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5132852256","display_name":"Sunghyun Cho","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cho, Sunghyun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.5422000288963318,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.5422000288963318,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.23270000517368317,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.09399999678134918,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/motion","display_name":"Motion (physics)","score":0.6437000036239624},{"id":"https://openalex.org/keywords/optical-flow","display_name":"Optical flow","score":0.6312000155448914},{"id":"https://openalex.org/keywords/motion-interpolation","display_name":"Motion interpolation","score":0.598800003528595},{"id":"https://openalex.org/keywords/generator","display_name":"Generator (circuit theory)","score":0.5662000179290771},{"id":"https://openalex.org/keywords/synthetic-data","display_name":"Synthetic data","score":0.5336999893188477},{"id":"https://openalex.org/keywords/motion-capture","display_name":"Motion capture","score":0.5223000049591064},{"id":"https://openalex.org/keywords/motion-estimation","display_name":"Motion estimation","score":0.4625000059604645},{"id":"https://openalex.org/keywords/quarter-pixel-motion","display_name":"Quarter-pixel motion","score":0.454800009727478}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7324000000953674},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7109000086784363},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.7019000053405762},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.6437000036239624},{"id":"https://openalex.org/C155542232","wikidata":"https://www.wikidata.org/wiki/Q736111","display_name":"Optical flow","level":3,"score":0.6312000155448914},{"id":"https://openalex.org/C72560505","wikidata":"https://www.wikidata.org/wiki/Q204510","display_name":"Motion interpolation","level":5,"score":0.598800003528595},{"id":"https://openalex.org/C2780992000","wikidata":"https://www.wikidata.org/wiki/Q17016113","display_name":"Generator (circuit theory)","level":3,"score":0.5662000179290771},{"id":"https://openalex.org/C160920958","wikidata":"https://www.wikidata.org/wiki/Q7662746","display_name":"Synthetic data","level":2,"score":0.5336999893188477},{"id":"https://openalex.org/C48007421","wikidata":"https://www.wikidata.org/wiki/Q676252","display_name":"Motion capture","level":3,"score":0.5223000049591064},{"id":"https://openalex.org/C10161872","wikidata":"https://www.wikidata.org/wiki/Q557891","display_name":"Motion estimation","level":2,"score":0.4625000059604645},{"id":"https://openalex.org/C174493125","wikidata":"https://www.wikidata.org/wiki/Q1073461","display_name":"Quarter-pixel motion","level":3,"score":0.454800009727478},{"id":"https://openalex.org/C48209547","wikidata":"https://www.wikidata.org/wiki/Q1331104","display_name":"Controllability","level":2,"score":0.4180999994277954},{"id":"https://openalex.org/C128840427","wikidata":"https://www.wikidata.org/wiki/Q1302174","display_name":"Motion compensation","level":2,"score":0.4052000045776367},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.38420000672340393},{"id":"https://openalex.org/C124774092","wikidata":"https://www.wikidata.org/wiki/Q6917782","display_name":"Motion field","level":3,"score":0.37560001015663147},{"id":"https://openalex.org/C95020103","wikidata":"https://www.wikidata.org/wiki/Q1813492","display_name":"Match moving","level":3,"score":0.36309999227523804},{"id":"https://openalex.org/C77660652","wikidata":"https://www.wikidata.org/wiki/Q150971","display_name":"Computer graphics","level":2,"score":0.32760000228881836},{"id":"https://openalex.org/C146159030","wikidata":"https://www.wikidata.org/wiki/Q7625099","display_name":"Structure from motion","level":3,"score":0.3043000102043152},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.30000001192092896},{"id":"https://openalex.org/C145565327","wikidata":"https://www.wikidata.org/wiki/Q852514","display_name":"Motion control","level":3,"score":0.274399995803833},{"id":"https://openalex.org/C2780575108","wikidata":"https://www.wikidata.org/wiki/Q7316652","display_name":"Retargeting","level":2,"score":0.2685000002384186},{"id":"https://openalex.org/C21442007","wikidata":"https://www.wikidata.org/wiki/Q1027879","display_name":"Graphics","level":2,"score":0.25999999046325684}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.01666","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.01666","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.01666","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.01666","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Despite":[0],"recent":[1],"progress,":[2],"video":[3,43,139,142],"diffusion":[4],"models":[5,110],"still":[6],"struggle":[7],"to":[8,85,154],"synthesize":[9],"realistic":[10],"videos":[11,93],"involving":[12],"highly":[13],"dynamic":[14,156,203],"motions":[15],"or":[16],"requiring":[17],"fine-grained":[18],"motion":[19,49,73,76,102,130,157,179,184,204,208],"controllability.":[20],"A":[21],"central":[22],"limitation":[23],"lies":[24],"in":[25,31,51,202],"the":[26,113,152,198],"scarcity":[27],"of":[28,116],"such":[29],"examples":[30],"commonly":[32],"used":[33],"training":[34],"datasets.":[35],"To":[36],"address":[37],"this,":[38],"we":[39],"introduce":[40],"DynaVid,":[41],"a":[42,125,129,137],"synthesis":[44],"framework":[45,172],"that":[46,82,146,195],"leverages":[47],"synthetic":[48,72,117,160],"data":[50,161],"training,":[52],"which":[53],"is":[54,104],"represented":[55],"as":[56],"optical":[57,98],"flow":[58,99],"and":[59,78,103,135,181,200,206],"rendered":[60,92,97],"using":[61],"computer":[62],"graphics":[63],"pipelines.":[64],"This":[65,148],"approach":[66],"offers":[67,74],"two":[68,174],"key":[69],"advantages.":[70],"First,":[71],"diverse":[75],"patterns":[77,158],"precise":[79],"control":[80],"signals":[81],"are":[83,189],"difficult":[84],"obtain":[86],"from":[87,106,111,159,166],"real":[88],"data.":[89],"Second,":[90],"unlike":[91],"with":[94],"artificial":[95],"appearances,":[96],"encodes":[100],"only":[101],"decoupled":[105,149],"appearance,":[107],"thereby":[108],"preventing":[109],"reproducing":[112],"unnatural":[114],"look":[115],"videos.":[118,168],"Building":[119],"on":[120,145,173],"this":[121],"idea,":[122],"DynaVid":[123,196],"adopts":[124],"two-stage":[126],"generation":[127,180,205],"framework:":[128],"generator":[131,140],"first":[132],"synthesizes":[133],"motion,":[134],"then":[136],"motion-guided":[138],"produces":[141],"frames":[143],"conditioned":[144],"motion.":[147],"formulation":[150],"enables":[151],"model":[153],"learn":[155],"while":[162],"preserving":[163],"visual":[164],"realism":[165,199],"real-world":[167],"We":[169],"validate":[170],"our":[171],"challenging":[175],"scenarios,":[176],"vigorous":[177],"human":[178],"extreme":[182],"camera":[183,207],"control,":[185],"where":[186],"existing":[187],"datasets":[188],"particularly":[190],"limited.":[191],"Extensive":[192],"experiments":[193],"demonstrate":[194],"improves":[197],"controllability":[201],"control.":[209]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-04T00:00:00"}
