{"id":"https://openalex.org/W4413917947","doi":"https://doi.org/10.1109/icra55743.2025.11127463","title":"DreamDrive: Generative 4D Scene Modeling from Street View Images","display_name":"DreamDrive: Generative 4D Scene Modeling from Street View Images","publication_year":2025,"publication_date":"2025-05-19","ids":{"openalex":"https://openalex.org/W4413917947","doi":"https://doi.org/10.1109/icra55743.2025.11127463"},"language":"en","primary_location":{"id":"doi:10.1109/icra55743.2025.11127463","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra55743.2025.11127463","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5087884932","display_name":"Jiageng Mao","orcid":"https://orcid.org/0000-0003-2571-8767"},"institutions":[{"id":"https://openalex.org/I1304085615","display_name":"Nvidia (United Kingdom)","ror":"https://ror.org/02kr42612","country_code":"GB","type":"company","lineage":["https://openalex.org/I1304085615","https://openalex.org/I4210127875"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Jiageng Mao","raw_affiliation_strings":["NVIDIA Research"],"affiliations":[{"raw_affiliation_string":"NVIDIA Research","institution_ids":["https://openalex.org/I1304085615"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114686206","display_name":"Boyi Li","orcid":"https://orcid.org/0000-0002-6752-3223"},"institutions":[{"id":"https://openalex.org/I1304085615","display_name":"Nvidia (United Kingdom)","ror":"https://ror.org/02kr42612","country_code":"GB","type":"company","lineage":["https://openalex.org/I1304085615","https://openalex.org/I4210127875"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Boyi Li","raw_affiliation_strings":["NVIDIA Research"],"affiliations":[{"raw_affiliation_string":"NVIDIA Research","institution_ids":["https://openalex.org/I1304085615"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091869385","display_name":"Boris Ivanovic","orcid":"https://orcid.org/0000-0002-8698-202X"},"institutions":[{"id":"https://openalex.org/I1304085615","display_name":"Nvidia (United Kingdom)","ror":"https://ror.org/02kr42612","country_code":"GB","type":"company","lineage":["https://openalex.org/I1304085615","https://openalex.org/I4210127875"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Boris Ivanovic","raw_affiliation_strings":["NVIDIA Research"],"affiliations":[{"raw_affiliation_string":"NVIDIA Research","institution_ids":["https://openalex.org/I1304085615"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100366786","display_name":"Yuxiao Chen","orcid":"https://orcid.org/0000-0001-5276-7156"},"institutions":[{"id":"https://openalex.org/I1304085615","display_name":"Nvidia (United Kingdom)","ror":"https://ror.org/02kr42612","country_code":"GB","type":"company","lineage":["https://openalex.org/I1304085615","https://openalex.org/I4210127875"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Yuxiao Chen","raw_affiliation_strings":["NVIDIA Research"],"affiliations":[{"raw_affiliation_string":"NVIDIA Research","institution_ids":["https://openalex.org/I1304085615"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101905406","display_name":"Yan Wang","orcid":"https://orcid.org/0000-0002-0322-8479"},"institutions":[{"id":"https://openalex.org/I1304085615","display_name":"Nvidia (United Kingdom)","ror":"https://ror.org/02kr42612","country_code":"GB","type":"company","lineage":["https://openalex.org/I1304085615","https://openalex.org/I4210127875"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Yan Wang","raw_affiliation_strings":["NVIDIA Research"],"affiliations":[{"raw_affiliation_string":"NVIDIA Research","institution_ids":["https://openalex.org/I1304085615"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069174793","display_name":"Yurong You","orcid":"https://orcid.org/0000-0002-6898-9463"},"institutions":[{"id":"https://openalex.org/I1304085615","display_name":"Nvidia (United Kingdom)","ror":"https://ror.org/02kr42612","country_code":"GB","type":"company","lineage":["https://openalex.org/I1304085615","https://openalex.org/I4210127875"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Yurong You","raw_affiliation_strings":["NVIDIA Research"],"affiliations":[{"raw_affiliation_string":"NVIDIA Research","institution_ids":["https://openalex.org/I1304085615"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005843046","display_name":"Chaowei Xiao","orcid":"https://orcid.org/0000-0002-7043-4926"},"institutions":[{"id":"https://openalex.org/I1304085615","display_name":"Nvidia (United Kingdom)","ror":"https://ror.org/02kr42612","country_code":"GB","type":"company","lineage":["https://openalex.org/I1304085615","https://openalex.org/I4210127875"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Chaowei Xiao","raw_affiliation_strings":["NVIDIA Research"],"affiliations":[{"raw_affiliation_string":"NVIDIA Research","institution_ids":["https://openalex.org/I1304085615"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028834865","display_name":"Danfei Xu","orcid":"https://orcid.org/0000-0002-8744-3861"},"institutions":[{"id":"https://openalex.org/I1304085615","display_name":"Nvidia (United Kingdom)","ror":"https://ror.org/02kr42612","country_code":"GB","type":"company","lineage":["https://openalex.org/I1304085615","https://openalex.org/I4210127875"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Danfei Xu","raw_affiliation_strings":["NVIDIA Research"],"affiliations":[{"raw_affiliation_string":"NVIDIA Research","institution_ids":["https://openalex.org/I1304085615"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050003000","display_name":"Marco Pavone","orcid":"https://orcid.org/0000-0002-0206-4337"},"institutions":[{"id":"https://openalex.org/I1304085615","display_name":"Nvidia (United Kingdom)","ror":"https://ror.org/02kr42612","country_code":"GB","type":"company","lineage":["https://openalex.org/I1304085615","https://openalex.org/I4210127875"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Marco Pavone","raw_affiliation_strings":["NVIDIA Research"],"affiliations":[{"raw_affiliation_string":"NVIDIA Research","institution_ids":["https://openalex.org/I1304085615"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100371992","display_name":"Yue Wang","orcid":"https://orcid.org/0000-0002-0981-935X"},"institutions":[{"id":"https://openalex.org/I1304085615","display_name":"Nvidia (United Kingdom)","ror":"https://ror.org/02kr42612","country_code":"GB","type":"company","lineage":["https://openalex.org/I1304085615","https://openalex.org/I4210127875"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Yue Wang","raw_affiliation_strings":["NVIDIA Research"],"affiliations":[{"raw_affiliation_string":"NVIDIA Research","institution_ids":["https://openalex.org/I1304085615"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":10,"corresponding_author_ids":["https://openalex.org/A5087884932"],"corresponding_institution_ids":["https://openalex.org/I1304085615"],"apc_list":null,"apc_paid":null,"fwci":0.9029,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.77362522,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"367","last_page":"374"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11164","display_name":"Remote Sensing and LiDAR Applications","score":0.9941999912261963,"subfield":{"id":"https://openalex.org/subfields/2305","display_name":"Environmental Engineering"},"field":{"id":"https://openalex.org/fields/23","display_name":"Environmental Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11164","display_name":"Remote Sensing and LiDAR Applications","score":0.9941999912261963,"subfield":{"id":"https://openalex.org/subfields/2305","display_name":"Environmental Engineering"},"field":{"id":"https://openalex.org/fields/23","display_name":"Environmental Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12698","display_name":"3D Modeling in Geospatial Applications","score":0.9939000010490417,"subfield":{"id":"https://openalex.org/subfields/2215","display_name":"Building and Construction"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11211","display_name":"3D Surveying and Cultural Heritage","score":0.9769999980926514,"subfield":{"id":"https://openalex.org/subfields/1907","display_name":"Geology"},"field":{"id":"https://openalex.org/fields/19","display_name":"Earth and Planetary Sciences"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7133147716522217},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.6430501937866211},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.574389636516571},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5366697907447815},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.47894173860549927},{"id":"https://openalex.org/keywords/computer-graphics","display_name":"Computer graphics (images)","score":0.37332969903945923}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7133147716522217},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.6430501937866211},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.574389636516571},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5366697907447815},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.47894173860549927},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.37332969903945923}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icra55743.2025.11127463","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra55743.2025.11127463","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":38,"referenced_works":["https://openalex.org/W134642456","https://openalex.org/W2471962767","https://openalex.org/W2562637781","https://openalex.org/W2968008415","https://openalex.org/W3035172746","https://openalex.org/W3035574168","https://openalex.org/W3153220274","https://openalex.org/W3174177541","https://openalex.org/W3183092879","https://openalex.org/W4200150166","https://openalex.org/W4312396550","https://openalex.org/W4312580801","https://openalex.org/W4312641958","https://openalex.org/W4312933868","https://openalex.org/W4385318467","https://openalex.org/W4386076007","https://openalex.org/W4386076371","https://openalex.org/W4386076400","https://openalex.org/W4386076483","https://openalex.org/W4390872423","https://openalex.org/W4390873331","https://openalex.org/W4391516317","https://openalex.org/W4392016505","https://openalex.org/W4402713101","https://openalex.org/W4402716105","https://openalex.org/W4402716256","https://openalex.org/W4402727067","https://openalex.org/W4402727269","https://openalex.org/W4402754077","https://openalex.org/W4402754225","https://openalex.org/W4402778069","https://openalex.org/W4402816534","https://openalex.org/W4402951629","https://openalex.org/W4402952317","https://openalex.org/W4404601281","https://openalex.org/W4404722496","https://openalex.org/W4408955770","https://openalex.org/W4413558925"],"related_works":["https://openalex.org/W2772917594","https://openalex.org/W2036807459","https://openalex.org/W2058170566","https://openalex.org/W2755342338","https://openalex.org/W2166024367","https://openalex.org/W3116076068","https://openalex.org/W2229312674","https://openalex.org/W2951359407","https://openalex.org/W2079911747","https://openalex.org/W1969923398"],"abstract_inverted_index":{"Synthesizing":[0],"photo-realistic":[1],"visual":[2,74,124],"observations":[3],"from":[4,25,164,175],"an":[5],"ego":[6],"vehicle's":[7],"driving":[8,26,31,50,61,100,104,140,146,166,185,196,202],"trajectory":[9],"is":[10],"a":[11,64,82,121,133,139,216],"critical":[12],"step":[13],"towards":[14],"scalable":[15],"training":[16],"of":[17,92,115,123,153,201],"self-driving":[18],"models.":[19],"Reconstruction-based":[20],"methods":[21],"create":[22],"3D":[23,73,107,208],"scenes":[24,101,163],"logs":[27],"and":[28,94,102,126,183,193,207,212,219,222],"synthesize":[29,59,97,120,198],"geometry-consistent":[30],"videos":[32,62,105,147,203],"through":[33],"neural":[34,169],"rendering,":[35],"but":[36,68],"their":[37,44],"dependence":[38],"on":[39,181],"costly":[40],"object":[41],"annotations":[42],"limits":[43],"ability":[45],"to":[46,48,96,119,130,159],"generalize":[47],"in-the-wild":[49,165,184],"scenarios.":[51],"On":[52],"the":[53,90,112,176],"other":[54],"hand,":[55],"generative":[56,113,154],"models":[57,118],"can":[58,190],"action-conditioned":[60],"in":[63,215],"more":[65],"generalizable":[66,98,194],"way":[67],"often":[69],"struggle":[70],"with":[71,106,132,204],"maintaining":[72],"consistency.":[75,108],"In":[76],"this":[77],"paper,":[78],"we":[79,110,142],"present":[80],"DreamDrive,":[81],"4D":[83,99,131,162,177,195],"spatial-temporal":[84],"scene":[85],"generation":[86,93,174],"approach":[87],"that":[88,188],"combines":[89],"merits":[91],"reconstruction,":[95],"dynamic":[103,213],"Specifically,":[109],"leverage":[111],"power":[114],"video":[116,173],"diffusion":[117],"sequence":[122],"references":[125],"further":[127],"elevate":[128],"them":[129],"novel":[134,199],"hybrid":[135],"Gaussian":[136,149],"representation.":[137],"Given":[138],"trajectory,":[141],"then":[143],"render":[144],"3D-consistent":[145,172],"via":[148],"splatting.":[150],"The":[151],"use":[152],"priors":[155],"allows":[156],"our":[157],"method":[158],"produce":[160],"high-quality":[161],"data,":[167],"while":[168],"rendering":[170],"ensures":[171],"scenes.":[178],"Extensive":[179],"experiments":[180],"nuScenes":[182],"data":[186],"demonstrate":[187],"DreamDrive":[189],"generate":[191],"controllable":[192],"scenes,":[197],"views":[200],"high":[205],"fidelity":[206],"consistency,":[209],"decompose":[210],"static":[211],"elements":[214],"self-supervised":[217],"manner,":[218],"enhance":[220],"perception":[221],"planning":[223],"tasks":[224],"for":[225],"autonomous":[226],"driving.":[227]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-10T00:00:00"}
