{"id":"https://openalex.org/W7152375409","doi":"https://doi.org/10.48550/arxiv.2604.06339","title":"Evolution of Video Generative Foundations","display_name":"Evolution of Video Generative Foundations","publication_year":2026,"publication_date":"2026-04-07","ids":{"openalex":"https://openalex.org/W7152375409","doi":"https://doi.org/10.48550/arxiv.2604.06339"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.06339","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.06339","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.06339","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5133271377","display_name":"Teng Hu","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Hu, Teng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133296695","display_name":"Jiangning Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Jiangning","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133306188","display_name":"Hongrui Huang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huang, Hongrui","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133264336","display_name":"Ran Yi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yi, Ran","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133303938","display_name":"Zihan Su","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Su, Zihan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102655264","display_name":"Jieyu Weng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Weng, Jieyu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133271749","display_name":"Zhucun Xue","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xue, Zhucun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5093580225","display_name":"Lizhuang MA","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ma, Lizhuang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133277748","display_name":"Ming-Hsuan Yang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Ming-Hsuan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5133311125","display_name":"Dacheng Tao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tao, Dacheng","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":10,"corresponding_author_ids":["https://openalex.org/A5133271377"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.8432000279426575,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.8432000279426575,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.026799999177455902,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.012199999764561653,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.5996999740600586},{"id":"https://openalex.org/keywords/bridging","display_name":"Bridging (networking)","score":0.5967000126838684},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.4345000088214874},{"id":"https://openalex.org/keywords/adversarial-system","display_name":"Adversarial system","score":0.39010000228881836},{"id":"https://openalex.org/keywords/perspective","display_name":"Perspective (graphical)","score":0.3822000026702881},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.37130001187324524},{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.30250000953674316}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7286999821662903},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.5996999740600586},{"id":"https://openalex.org/C174348530","wikidata":"https://www.wikidata.org/wiki/Q188635","display_name":"Bridging (networking)","level":2,"score":0.5967000126838684},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.5037999749183655},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.4345000088214874},{"id":"https://openalex.org/C37736160","wikidata":"https://www.wikidata.org/wiki/Q1801315","display_name":"Adversarial system","level":2,"score":0.39010000228881836},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.3822000026702881},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.37130001187324524},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.35199999809265137},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.3149000108242035},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.31119999289512634},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.30250000953674316},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.29910001158714294},{"id":"https://openalex.org/C207267971","wikidata":"https://www.wikidata.org/wiki/Q120208","display_name":"Emerging technologies","level":2,"score":0.29649999737739563},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.27730000019073486},{"id":"https://openalex.org/C138673069","wikidata":"https://www.wikidata.org/wiki/Q322229","display_name":"Tracing","level":2,"score":0.275299996137619},{"id":"https://openalex.org/C205711294","wikidata":"https://www.wikidata.org/wiki/Q176953","display_name":"Rendering (computer graphics)","level":2,"score":0.2639000117778778},{"id":"https://openalex.org/C72634772","wikidata":"https://www.wikidata.org/wiki/Q386824","display_name":"Data integration","level":2,"score":0.2513999938964844}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.06339","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.06339","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.06339","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.06339","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.5209521055221558}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"The":[0],"rapid":[1],"advancement":[2],"of":[3,106,120,123,150,171],"Artificial":[4],"Intelligence":[5],"Generated":[6],"Content":[7],"(AIGC)":[8],"has":[9],"revolutionized":[10],"video":[11,68,89,124,166,196],"generation,":[12,167],"enabling":[13],"systems":[14],"ranging":[15],"from":[16,130],"proprietary":[17],"pioneers":[18],"like":[19,31],"OpenAI's":[20],"Sora,":[21],"Google's":[22],"Veo3,":[23],"and":[24,33,39,61,81,104,137,142,156,184,198,211],"Bytedance's":[25],"Seedance":[26],"to":[27,35,133,139,175,191,225],"powerful":[28],"open-source":[29],"contenders":[30],"Wan":[32],"HunyuanVideo":[34],"synthesize":[36],"temporally":[37],"coherent":[38],"semantically":[40],"rich":[41],"videos.":[42],"These":[43],"advancements":[44],"pave":[45],"the":[46,96,121,151,169,226],"way":[47],"for":[48],"building":[49],"\"world":[50],"models\"":[51],"that":[52],"simulate":[53],"real-world":[54],"dynamics,":[55],"with":[56],"applications":[57],"spanning":[58],"entertainment,":[59,210],"education,":[60,205],"virtual":[62],"reality.":[63],"However,":[64],"existing":[65],"reviews":[66],"on":[67,72,95],"generation":[69,125,197],"often":[70],"focus":[71],"narrow":[73],"technical":[74],"fields,":[75],"e.g.,":[76],"Generative":[77],"Adversarial":[78],"Networks":[79],"(GAN)":[80],"diffusion":[82,135],"models,":[83,136,214],"or":[84],"specific":[85],"tasks":[86],"(e.":[87],"g.,":[88],"editing),":[90],"lacking":[91],"a":[92,117],"comprehensive":[93],"perspective":[94],"field's":[97],"evolution,":[98],"especially":[99],"regarding":[100],"Auto-Regressive":[101],"(AR)":[102],"models":[103],"integration":[105,170],"multimodal":[107,143,165],"information.":[108],"To":[109],"address":[110],"these":[111],"gaps,":[112],"this":[113,187,216],"survey":[114,188],"firstly":[115],"provides":[116],"systematic":[118],"review":[119],"development":[122],"technology,":[126],"tracing":[127],"its":[128,199],"evolution":[129],"early":[131],"GANs":[132],"dominant":[134],"further":[138],"emerging":[140,162],"AR-based":[141],"techniques.":[144],"We":[145],"conduct":[146],"an":[147],"in-depth":[148],"analysis":[149],"foundational":[152],"principles,":[153],"key":[154],"advancements,":[155],"comparative":[157],"strengths/limitations.":[158],"Then,":[159],"we":[160],"explore":[161],"trends":[163],"in":[164,195,215],"emphasizing":[168],"diverse":[172],"data":[173],"types":[174],"enhance":[176],"contextual":[177],"awareness.":[178],"Finally,":[179],"by":[180],"bridging":[181],"historical":[182],"developments":[183],"contemporary":[185],"innovations,":[186],"offers":[189],"insights":[190],"guide":[192],"future":[193],"research":[194],"applications,":[200],"including":[201],"virtual/augmented":[202],"reality,":[203],"personalized":[204],"autonomous":[206],"driving":[207],"simulations,":[208],"digital":[209],"advanced":[212],"world":[213],"rapidly":[217],"evolving":[218],"field.":[219],"For":[220],"more":[221],"details,":[222],"please":[223],"refer":[224],"project":[227],"at":[228],"https://github.com/sjtuplayer/Awesome-Video-Foundations.":[229]},"counts_by_year":[],"updated_date":"2026-04-10T06:07:51.998497","created_date":"2026-04-10T00:00:00"}
