{"id":"https://openalex.org/W7158046705","doi":"https://doi.org/10.48550/arxiv.2604.25318","title":"Cutscene Agent: An LLM Agent Framework for Automated 3D Cutscene Generation","display_name":"Cutscene Agent: An LLM Agent Framework for Automated 3D Cutscene Generation","publication_year":2026,"publication_date":"2026-04-28","ids":{"openalex":"https://openalex.org/W7158046705","doi":"https://doi.org/10.48550/arxiv.2604.25318"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.25318","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.25318","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.25318","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101238929","display_name":"Lanshan He","orcid":"https://orcid.org/0009-0009-6093-8803"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"He, Lanshan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5120307672","display_name":"Haozhou Pang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pang, Haozhou","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134858108","display_name":"Qi Gan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gan, Qi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134830460","display_name":"Xin Shen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shen, Xin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134861448","display_name":"Ziwei Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Ziwei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134832084","display_name":"Yibo Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Yibo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134830970","display_name":"Gang Fang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fang, Gang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134862724","display_name":"Bo Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Bo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134827858","display_name":"Kai Sheng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sheng, Kai","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134850961","display_name":"Shengfeng Zeng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zeng, Shengfeng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100617571","display_name":"Chaofan Li","orcid":"https://orcid.org/0000-0002-3041-3004"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Chaofan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134823255","display_name":"Zhen Hui","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hui, Zhen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134831980","display_name":"Keer Zhou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Keer","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134827890","display_name":"Lan Zhou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Lan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5134827282","display_name":"Shujun Dai","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dai, Shujun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":15,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.4535999894142151,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.4535999894142151,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11574","display_name":"Artificial Intelligence in Games","score":0.21789999306201935,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.06499999761581421,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.6121000051498413},{"id":"https://openalex.org/keywords/orchestration","display_name":"Orchestration","score":0.5128999948501587},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.5044999718666077},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.4481000006198883},{"id":"https://openalex.org/keywords/multi-agent-system","display_name":"Multi-agent system","score":0.4174000024795532},{"id":"https://openalex.org/keywords/dimension","display_name":"Dimension (graph theory)","score":0.4081999957561493},{"id":"https://openalex.org/keywords/interdependence","display_name":"Interdependence","score":0.4074000120162964},{"id":"https://openalex.org/keywords/protocol","display_name":"Protocol (science)","score":0.4004000127315521},{"id":"https://openalex.org/keywords/dashboard","display_name":"Dashboard","score":0.35929998755455017},{"id":"https://openalex.org/keywords/service","display_name":"Service (business)","score":0.34950000047683716}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.748199999332428},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.6121000051498413},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.5139999985694885},{"id":"https://openalex.org/C199168358","wikidata":"https://www.wikidata.org/wiki/Q3367000","display_name":"Orchestration","level":3,"score":0.5128999948501587},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.5044999718666077},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.4481000006198883},{"id":"https://openalex.org/C41550386","wikidata":"https://www.wikidata.org/wiki/Q529909","display_name":"Multi-agent system","level":2,"score":0.4174000024795532},{"id":"https://openalex.org/C33676613","wikidata":"https://www.wikidata.org/wiki/Q13415176","display_name":"Dimension (graph theory)","level":2,"score":0.4081999957561493},{"id":"https://openalex.org/C185874996","wikidata":"https://www.wikidata.org/wiki/Q269699","display_name":"Interdependence","level":2,"score":0.4074000120162964},{"id":"https://openalex.org/C2780385302","wikidata":"https://www.wikidata.org/wiki/Q367158","display_name":"Protocol (science)","level":3,"score":0.4004000127315521},{"id":"https://openalex.org/C33499554","wikidata":"https://www.wikidata.org/wiki/Q1417134","display_name":"Dashboard","level":2,"score":0.35929998755455017},{"id":"https://openalex.org/C2780378061","wikidata":"https://www.wikidata.org/wiki/Q25351891","display_name":"Service (business)","level":2,"score":0.34950000047683716},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.34790000319480896},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.3400999903678894},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.3379000127315521},{"id":"https://openalex.org/C2780992000","wikidata":"https://www.wikidata.org/wiki/Q17016113","display_name":"Generator (circuit theory)","level":3,"score":0.3269999921321869},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.319599986076355},{"id":"https://openalex.org/C199033989","wikidata":"https://www.wikidata.org/wiki/Q1318295","display_name":"Narrative","level":2,"score":0.3118000030517578},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.311599999666214},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.30809998512268066},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.30709999799728394},{"id":"https://openalex.org/C2986528223","wikidata":"https://www.wikidata.org/wiki/Q193564","display_name":"Game engine","level":2,"score":0.3041999936103821},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.2987000048160553},{"id":"https://openalex.org/C22467394","wikidata":"https://www.wikidata.org/wiki/Q849359","display_name":"Multidisciplinary approach","level":2,"score":0.2939000129699707},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.2915000021457672},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.2890999913215637},{"id":"https://openalex.org/C2780554381","wikidata":"https://www.wikidata.org/wiki/Q2063340","display_name":"Sensemaking","level":2,"score":0.27250000834465027},{"id":"https://openalex.org/C153715457","wikidata":"https://www.wikidata.org/wiki/Q254183","display_name":"Augmented reality","level":2,"score":0.27230000495910645},{"id":"https://openalex.org/C204323151","wikidata":"https://www.wikidata.org/wiki/Q905424","display_name":"Range (aeronautics)","level":2,"score":0.2711000144481659},{"id":"https://openalex.org/C3018412434","wikidata":"https://www.wikidata.org/wiki/Q7889","display_name":"Video game","level":2,"score":0.25679999589920044},{"id":"https://openalex.org/C2775945657","wikidata":"https://www.wikidata.org/wiki/Q381442","display_name":"Structuring","level":2,"score":0.25619998574256897},{"id":"https://openalex.org/C2775941552","wikidata":"https://www.wikidata.org/wiki/Q25212305","display_name":"Isolation (microbiology)","level":2,"score":0.2554999887943268},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.25029999017715454}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.25318","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.25318","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.25318","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.25318","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Cutscenes":[0],"are":[1],"carefully":[2],"choreographed":[3],"cinematic":[4,123],"sequences":[5],"embedded":[6],"in":[7],"video":[8],"games":[9],"and":[10,23,42,100,138,151,204],"interactive":[11],"media,":[12],"serving":[13],"as":[14],"the":[15,88,101],"primary":[16],"vehicle":[17],"for":[18,73,135,148,157],"narrative":[19],"delivery,":[20],"character":[21,38],"development,":[22],"emotional":[24],"engagement.":[25],"Producing":[26],"cutscenes":[27],"is":[28],"inherently":[29],"complex:":[30],"it":[31],"demands":[32],"seamless":[33],"coordination":[34],"across":[35,208],"screenwriting,":[36],"cinematography,":[37,137],"animation,":[39,136],"voice":[40],"acting,":[41],"technical":[43],"direction,":[44],"often":[45],"requiring":[46],"days":[47],"to":[48,56],"weeks":[49],"of":[50,59,120,176,178,200],"collaborative":[51],"effort":[52],"from":[53],"multidisciplinary":[54],"teams":[55],"produce":[57],"minutes":[58],"polished":[60],"content.":[61],"In":[62],"this":[63,209],"work,":[64],"we":[65],"present":[66],"Cutscene":[67,84],"Agent,":[68],"an":[69],"LLM":[70,98],"agent":[71,131],"framework":[72,79],"automated":[74],"end-to-end":[75],"cutscene":[76,158,170],"generation.":[77,159],"The":[78],"makes":[80],"three":[81],"contributions:":[82],"(1)~a":[83],"Toolkit":[85],"built":[86],"on":[87,202],"Model":[89],"Context":[90],"Protocol":[91],"(MCP)":[92],"that":[93,164,190],"establishes":[94],"\\emph{bidirectional}":[95],"integration":[96],"between":[97],"agents":[99,105],"game":[102],"engine":[103,109],"--":[104,186],"not":[106,194],"only":[107],"invoke":[108],"operations":[110],"but":[111],"continuously":[112],"observe":[113],"real-time":[114],"scene":[115],"state,":[116],"enabling":[117],"closed-loop":[118],"generation":[119,171],"editable":[121],"engine-native":[122],"assets;":[124],"(2)~a":[125],"multi-agent":[126],"system":[127],"where":[128],"a":[129,143,153,187,198],"director":[130],"orchestrates":[132],"specialist":[133],"subagents":[134],"sound":[139],"design,":[140],"augmented":[141],"by":[142],"visual":[144],"reasoning":[145],"feedback":[146],"loop":[147],"perception-driven":[149],"refinement;":[150],"(3)~CutsceneBench,":[152],"hierarchical":[154],"evaluation":[155],"benchmark":[156],"Unlike":[160],"typical":[161],"tool-use":[162],"benchmarks":[163,192],"evaluate":[165,197],"short,":[166],"isolated":[167],"function":[168],"calls,":[169],"requires":[172],"long-horizon,":[173],"multi-step":[174],"orchestration":[175],"dozens":[177],"interdependent":[179],"tool":[180],"invocations":[181],"with":[182],"strict":[183],"ordering":[184],"constraints":[185],"capability":[188],"dimension":[189],"existing":[191],"do":[193],"cover.":[195],"We":[196],"range":[199],"LLMs":[201],"CutsceneBench":[203],"analyze":[205],"their":[206],"performance":[207],"challenging":[210],"task.":[211]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-30T00:00:00"}
