{"id":"https://openalex.org/W7148404073","doi":"https://doi.org/10.48550/arxiv.2604.01129","title":"ReinDriveGen: Reinforcement Post-Training for Out-of-Distribution Driving Scene Generation","display_name":"ReinDriveGen: Reinforcement Post-Training for Out-of-Distribution Driving Scene Generation","publication_year":2026,"publication_date":"2026-04-01","ids":{"openalex":"https://openalex.org/W7148404073","doi":"https://doi.org/10.48550/arxiv.2604.01129"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.01129","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.01129","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.01129","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5132797780","display_name":"Hao Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Zhang, Hao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064754069","display_name":"Lue Fan","orcid":"https://orcid.org/0000-0002-2349-0538"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fan, Lue","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023250570","display_name":"Weikang Bian","orcid":"https://orcid.org/0000-0001-9986-3348"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bian, Weikang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132810852","display_name":"Zehuan Wu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Zehuan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132814030","display_name":"Lewei Lu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lu, Lewei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132810469","display_name":"Zhaoxiang Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Zhaoxiang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5132790436","display_name":"Hongsheng Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Hongsheng","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5132797780"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.5037999749183655,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.5037999749183655,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.10350000113248825,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.08990000188350677,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pairwise-comparison","display_name":"Pairwise comparison","score":0.5645999908447266},{"id":"https://openalex.org/keywords/controllability","display_name":"Controllability","score":0.5616999864578247},{"id":"https://openalex.org/keywords/point-cloud","display_name":"Point cloud","score":0.4763000011444092},{"id":"https://openalex.org/keywords/trajectory","display_name":"Trajectory","score":0.45719999074935913},{"id":"https://openalex.org/keywords/point","display_name":"Point (geometry)","score":0.41269999742507935},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.35519999265670776},{"id":"https://openalex.org/keywords/spinning","display_name":"Spinning","score":0.34220001101493835},{"id":"https://openalex.org/keywords/advanced-driver-assistance-systems","display_name":"Advanced driver assistance systems","score":0.3336000144481659}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7419999837875366},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6168000102043152},{"id":"https://openalex.org/C184898388","wikidata":"https://www.wikidata.org/wiki/Q1435712","display_name":"Pairwise comparison","level":2,"score":0.5645999908447266},{"id":"https://openalex.org/C48209547","wikidata":"https://www.wikidata.org/wiki/Q1331104","display_name":"Controllability","level":2,"score":0.5616999864578247},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5597000122070312},{"id":"https://openalex.org/C131979681","wikidata":"https://www.wikidata.org/wiki/Q1899648","display_name":"Point cloud","level":2,"score":0.4763000011444092},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.45719999074935913},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.41269999742507935},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.35519999265670776},{"id":"https://openalex.org/C154815118","wikidata":"https://www.wikidata.org/wiki/Q453762","display_name":"Spinning","level":2,"score":0.34220001101493835},{"id":"https://openalex.org/C87833898","wikidata":"https://www.wikidata.org/wiki/Q1060280","display_name":"Advanced driver assistance systems","level":2,"score":0.3336000144481659},{"id":"https://openalex.org/C74050887","wikidata":"https://www.wikidata.org/wiki/Q848368","display_name":"Rotation (mathematics)","level":2,"score":0.3197999894618988},{"id":"https://openalex.org/C81074085","wikidata":"https://www.wikidata.org/wiki/Q366872","display_name":"Motion planning","level":3,"score":0.3156000077724457},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.30730000138282776},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.290800005197525},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.28929999470710754},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.2825999855995178},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.2711000144481659},{"id":"https://openalex.org/C173801870","wikidata":"https://www.wikidata.org/wiki/Q201413","display_name":"Heuristic","level":2,"score":0.267300009727478},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.2612999975681305}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.01129","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.01129","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.01129","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.01129","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"We":[0],"present":[1],"ReinDriveGen,":[2],"a":[3,46,57,80,107,112],"framework":[4],"that":[5,78,129],"enables":[6],"full":[7,63],"controllability":[8],"over":[9],"dynamic":[10,47],"driving":[11,87,136],"scenes,":[12],"allowing":[13],"users":[14],"to":[15,20,61,84],"freely":[16],"edit":[17],"actor":[18],"trajectories":[19],"simulate":[21],"safety-critical":[22],"corner":[23],"cases":[24],"such":[25,90],"as":[26],"front-vehicle":[27],"collisions,":[28],"drifting":[29],"cars,":[30],"vehicles":[31],"spinning":[32],"out":[33],"of":[34],"control,":[35],"pedestrians":[36],"jaywalking,":[37],"and":[38,69,111,138],"cyclists":[39],"cutting":[40],"across":[41],"lanes.":[42],"Our":[43],"approach":[44],"constructs":[45],"3D":[48],"point":[49],"cloud":[50],"scene":[51,73],"from":[52,66],"multi-frame":[53],"LiDAR":[54],"data,":[55],"introduces":[56],"vehicle":[58],"completion":[59],"module":[60],"reconstruct":[62],"360\u00b0":[64],"geometry":[65],"partial":[67],"observations,":[68],"renders":[70],"the":[71,96],"edited":[72,91,135],"into":[74],"2D":[75],"condition":[76],"images":[77],"guide":[79],"video":[81],"diffusion":[82],"model":[83,110],"synthesize":[85],"realistic":[86],"videos.":[88],"Since":[89],"scenarios":[92,137],"inevitably":[93],"fall":[94],"outside":[95],"training":[97],"distribution,":[98],"we":[99],"further":[100],"propose":[101],"an":[102],"RL-based":[103],"post-training":[104],"strategy":[105],"with":[106],"pairwise":[108,113],"preference":[109],"reward":[114],"mechanism,":[115],"enabling":[116],"robust":[117],"quality":[118],"improvement":[119],"under":[120],"out-of-distribution":[121],"conditions":[122],"without":[123],"ground-truth":[124],"supervision.":[125],"Extensive":[126],"experiments":[127],"demonstrate":[128],"ReinDriveGen":[130],"outperforms":[131],"existing":[132],"approaches":[133],"on":[134,142],"achieves":[139],"state-of-the-art":[140],"results":[141],"novel":[143],"ego":[144],"viewpoint":[145],"synthesis.":[146]},"counts_by_year":[],"updated_date":"2026-04-03T16:44:17.987007","created_date":"2026-04-03T00:00:00"}
