{"id":"https://openalex.org/W7138195537","doi":"https://doi.org/10.48550/arxiv.2603.15583","title":"Grounding World Simulation Models in a Real-World Metropolis","display_name":"Grounding World Simulation Models in a Real-World Metropolis","publication_year":2026,"publication_date":"2026-03-16","ids":{"openalex":"https://openalex.org/W7138195537","doi":"https://doi.org/10.48550/arxiv.2603.15583"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.15583","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.15583","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.15583","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5129660664","display_name":"Junyoung Seo","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Seo, Junyoung","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019261810","display_name":"H. R. Choi","orcid":"https://orcid.org/0009-0006-4819-6040"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Choi, Hyunwook","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129665405","display_name":"Minkyung Kwon","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kwon, Minkyung","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129653755","display_name":"Jinhyeok Choi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Choi, Jinhyeok","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102637406","display_name":"Siyoon Jin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jin, Siyoon","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129667830","display_name":"Gayoung Lee","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lee, Gayoung","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129729673","display_name":"Junho Kim","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kim, Junho","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129648998","display_name":"JoungBin Lee","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lee, JoungBin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102375302","display_name":"Geonmo Gu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gu, Geonmo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129647929","display_name":"Dongyoon Han","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Han, Dongyoon","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129673130","display_name":"Sangdoo Yun","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yun, Sangdoo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129643639","display_name":"Seungryong Kim","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kim, Seungryong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5129680957","display_name":"Jin-Hwa Kim","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kim, Jin-Hwa","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":13,"corresponding_author_ids":["https://openalex.org/A5129660664"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.6132000088691711,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.6132000088691711,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.10369999706745148,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.04659999907016754,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/interpolation","display_name":"Interpolation (computer graphics)","score":0.4645000100135803},{"id":"https://openalex.org/keywords/trajectory","display_name":"Trajectory","score":0.4447000026702881},{"id":"https://openalex.org/keywords/autoregressive-model","display_name":"Autoregressive model","score":0.4066999852657318},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.4059999883174896},{"id":"https://openalex.org/keywords/real-world-data","display_name":"Real world data","score":0.39579999446868896},{"id":"https://openalex.org/keywords/data-modeling","display_name":"Data modeling","score":0.3693999946117401}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7229999899864197},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5266000032424927},{"id":"https://openalex.org/C137800194","wikidata":"https://www.wikidata.org/wiki/Q11713455","display_name":"Interpolation (computer graphics)","level":3,"score":0.4645000100135803},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.4447000026702881},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4221000075340271},{"id":"https://openalex.org/C159877910","wikidata":"https://www.wikidata.org/wiki/Q2202883","display_name":"Autoregressive model","level":2,"score":0.4066999852657318},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.4059999883174896},{"id":"https://openalex.org/C3020493868","wikidata":"https://www.wikidata.org/wiki/Q55631277","display_name":"Real world data","level":2,"score":0.39579999446868896},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.3693999946117401},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.36079999804496765},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3296999931335449},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.32440000772476196},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.31540000438690186},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.3046000003814697},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.263700008392334}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.15583","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.15583","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.15583","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.15583","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.8212578892707825,"display_name":"Sustainable cities and communities","id":"https://metadata.un.org/sdg/11"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"What":[0],"if":[1],"a":[2,13,38,97,106,122,136,140],"world":[3,20,40,149],"simulation":[4],"model":[5,41],"could":[6],"render":[7],"not":[8],"an":[9],"imagined":[10],"environment":[11],"but":[12],"city":[14,46],"that":[15,110],"actually":[16],"exists?":[17],"Prior":[18],"generative":[19],"models":[21,150],"synthesize":[22],"visually":[23],"plausible":[24],"yet":[25],"artificial":[26],"environments":[27,175],"by":[28,130],"imagining":[29],"all":[30],"content.":[31],"We":[32,90,119,143],"present":[33],"Seoul":[34],"World":[35],"Model":[36],"(SWM),":[37],"city-scale":[39],"grounded":[42,171],"in":[43,163,172],"the":[44,74],"real":[45],"of":[47,180],"Seoul.":[48],"SWM":[49,145,159],"anchors":[50],"autoregressive":[51],"video":[52,148],"generation":[53,129],"through":[54,94],"retrieval-augmented":[55],"conditioning":[56],"on":[57],"nearby":[58],"street-view":[59,117],"images.":[60,118],"However,":[61],"this":[62],"design":[63],"introduces":[64],"several":[65],"challenges,":[66],"including":[67],"temporal":[68],"misalignment":[69],"between":[70],"retrieved":[71,137],"references":[72],"and":[73,81,105,156,187],"dynamic":[75],"target":[76],"scene,":[77],"limited":[78],"trajectory":[79],"diversity":[80],"data":[82],"sparsity":[83],"from":[84,115],"vehicle-mounted":[85],"captures":[86],"at":[87,139],"sparse":[88,116],"intervals.":[89],"address":[91],"these":[92],"challenges":[93],"cross-temporal":[95],"pairing,":[96],"large-scale":[98],"synthetic":[99],"dataset":[100],"enabling":[101],"diverse":[102,184],"camera":[103,185],"trajectories,":[104],"view":[107],"interpolation":[108],"pipeline":[109],"synthesizes":[111],"coherent":[112],"training":[113],"videos":[114,170],"further":[120],"introduce":[121],"Virtual":[123],"Lookahead":[124],"Sink":[125],"to":[126,135],"stabilize":[127],"long-horizon":[128,169],"continuously":[131],"re-grounding":[132],"each":[133],"chunk":[134],"image":[138],"future":[141],"location.":[142],"evaluate":[144],"against":[146],"recent":[147],"across":[151],"three":[152],"cities:":[153],"Seoul,":[154],"Busan,":[155],"Ann":[157],"Arbor.":[158],"outperforms":[160],"existing":[161],"methods":[162],"generating":[164],"spatially":[165],"faithful,":[166],"temporally":[167],"consistent,":[168],"actual":[173],"urban":[174],"over":[176],"trajectories":[177],"reaching":[178],"hundreds":[179],"meters,":[181],"while":[182],"supporting":[183],"movements":[186],"text-prompted":[188],"scenario":[189],"variations.":[190]},"counts_by_year":[],"updated_date":"2026-03-18T06:31:55.123368","created_date":"2026-03-18T00:00:00"}
