{"id":"https://openalex.org/W7134836873","doi":"https://doi.org/10.48550/arxiv.2603.08403","title":"SPIRAL: A Closed-Loop Framework for Self-Improving Action World Models via Reflective Planning Agents","display_name":"SPIRAL: A Closed-Loop Framework for Self-Improving Action World Models via Reflective Planning Agents","publication_year":2026,"publication_date":"2026-03-09","ids":{"openalex":"https://openalex.org/W7134836873","doi":"https://doi.org/10.48550/arxiv.2603.08403"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.08403","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.08403","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.08403","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5128643554","display_name":"Yu Yang","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Yang, Yu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128663857","display_name":"Yue Liao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liao, Yue","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074067442","display_name":"Jianbiao Mei","orcid":"https://orcid.org/0000-0003-3849-2736"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mei, Jianbiao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128650044","display_name":"Baisen Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Baisen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101138291","display_name":"Xuemeng Yang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Xuemeng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056126166","display_name":"Licheng Wen","orcid":"https://orcid.org/0000-0003-2707-3165"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wen, Licheng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128675836","display_name":"Jiangning Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Jiangning","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128649765","display_name":"Xiangtai Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Xiangtai","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101979344","display_name":"Hanlin Chen","orcid":"https://orcid.org/0000-0001-6508-7715"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Hanlin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123005194","display_name":"Botian Shi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shi, Botian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128642076","display_name":"Yong Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Yong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128641753","display_name":"Shuicheng Yan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yan, Shuicheng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5128662855","display_name":"Gim Hee Lee","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lee, Gim Hee","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":13,"corresponding_author_ids":["https://openalex.org/A5128643554"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11574","display_name":"Artificial Intelligence in Games","score":0.2329999953508377,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11574","display_name":"Artificial Intelligence in Games","score":0.2329999953508377,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.1745000034570694,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.1573999971151352,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.5609999895095825},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.5479999780654907},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.38109999895095825},{"id":"https://openalex.org/keywords/automated-planning-and-scheduling","display_name":"Automated planning and scheduling","score":0.3407999873161316},{"id":"https://openalex.org/keywords/iterative-learning-control","display_name":"Iterative learning control","score":0.32690000534057617},{"id":"https://openalex.org/keywords/mainstream","display_name":"Mainstream","score":0.3231000006198883}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7487999796867371},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.5609999895095825},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.5479999780654907},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.44190001487731934},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.38109999895095825},{"id":"https://openalex.org/C114073186","wikidata":"https://www.wikidata.org/wiki/Q2631895","display_name":"Automated planning and scheduling","level":2,"score":0.3407999873161316},{"id":"https://openalex.org/C117619785","wikidata":"https://www.wikidata.org/wiki/Q6094414","display_name":"Iterative learning control","level":3,"score":0.32690000534057617},{"id":"https://openalex.org/C2777617010","wikidata":"https://www.wikidata.org/wiki/Q18957","display_name":"Mainstream","level":2,"score":0.3231000006198883},{"id":"https://openalex.org/C90312973","wikidata":"https://www.wikidata.org/wiki/Q7449052","display_name":"Semantic data model","level":2,"score":0.3057999908924103},{"id":"https://openalex.org/C159694833","wikidata":"https://www.wikidata.org/wiki/Q2321565","display_name":"Iterative method","level":2,"score":0.3003999888896942},{"id":"https://openalex.org/C2779982483","wikidata":"https://www.wikidata.org/wiki/Q6094420","display_name":"Iterative refinement","level":2,"score":0.2969000041484833},{"id":"https://openalex.org/C143587482","wikidata":"https://www.wikidata.org/wiki/Q1543216","display_name":"Iterative and incremental development","level":2,"score":0.29249998927116394},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.2915000021457672},{"id":"https://openalex.org/C174128100","wikidata":"https://www.wikidata.org/wiki/Q846907","display_name":"Spiral (railway)","level":2,"score":0.2741999924182892}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.08403","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.08403","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.08403","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.08403","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Sustainable cities and communities","score":0.6558626294136047,"id":"https://metadata.un.org/sdg/11"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"We":[0,102],"introduce":[1,104],"SPIRAL,":[2],"a":[3,49,73],"self-improving":[4],"planning":[5,61],"and":[6,42,62,78,96,107,111,123],"iterative":[7,80],"reflective":[8],"action":[9,37],"world":[10],"modeling":[11],"closed-loop":[12,50,86],"framework":[13],"that":[14],"enables":[15],"controllable":[16],"long-horizon":[17,83],"video":[18,27,125],"generation":[19,28,54,126],"conditioned":[20],"on":[21,121],"high-level":[22],"semantic":[23,40,94],"actions.":[24],"Existing":[25],"one-shot":[26],"models":[29],"operate":[30],"in":[31,35],"open-loop,":[32],"often":[33],"resulting":[34],"incomplete":[36],"execution,":[38],"weak":[39],"grounding,":[41],"temporal":[43,97],"drift.":[44],"SPIRAL":[45],"formulates":[46],"ActWM":[47],"as":[48],"think-act-reflect":[51],"process,":[52],"where":[53],"proceeds":[55],"step":[56,58],"by":[57],"under":[59],"explicit":[60],"feedback.":[63],"A":[64],"PlanAgent":[65],"decomposes":[66],"abstract":[67],"actions":[68],"into":[69],"object-centric":[70],"sub-actions,":[71],"while":[72],"CriticAgent":[74],"evaluates":[75],"intermediate":[76],"results":[77],"guides":[79],"refinement":[81],"with":[82],"memory.":[84],"This":[85],"design":[87],"naturally":[88],"supports":[89],"RL":[90],"evolving":[91],"optimization,":[92],"improving":[93],"alignment":[95],"consistency":[98],"over":[99],"extended":[100],"horizons.":[101],"further":[103],"the":[105],"ActWM-Dataset":[106],"ActWM-Bench":[108,122],"for":[109],"training":[110],"evaluation.":[112],"Experiments":[113],"across":[114],"multiple":[115],"TI2V":[116],"backbones":[117],"demonstrate":[118],"consistent":[119],"gains":[120],"mainstream":[124],"benchmarks,":[127],"validating":[128],"SPIRAL's":[129],"effectiveness.":[130]},"counts_by_year":[],"updated_date":"2026-05-05T08:41:31.759640","created_date":"2026-03-11T00:00:00"}
