{"id":"https://openalex.org/W7155159077","doi":"https://doi.org/10.48550/arxiv.2604.19257","title":"Unposed-to-3D: Learning Simulation-Ready Vehicles from Real-World Images","display_name":"Unposed-to-3D: Learning Simulation-Ready Vehicles from Real-World Images","publication_year":2026,"publication_date":"2026-04-21","ids":{"openalex":"https://openalex.org/W7155159077","doi":"https://doi.org/10.48550/arxiv.2604.19257"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.19257","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.19257","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.19257","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5134281198","display_name":"Hongyuan Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Hongyuan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045750357","display_name":"Bochao Zou","orcid":"https://orcid.org/0000-0002-2126-8159"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zou, Bochao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134243829","display_name":"Qiankun Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Qiankun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134352696","display_name":"Haochen Yu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yu, Haochen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102137095","display_name":"Qi Mei","orcid":"https://orcid.org/0009-0007-4697-1418"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mei, Qi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134319256","display_name":"Jianfei Jiang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jiang, Jianfei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134321360","display_name":"Chen Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Chen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134238178","display_name":"Cheng Bi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bi, Cheng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134244855","display_name":"Zhao Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Zhao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134293003","display_name":"Xueyang Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Xueyang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5120696887","display_name":"Yifei Zhan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhan, Yifei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134236277","display_name":"Jiansheng Chen","orcid":"https://orcid.org/0000-0002-2040-7938"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Jiansheng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5006236325","display_name":"Huimin Ma","orcid":"https://orcid.org/0000-0001-5383-5667"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ma, Huimin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.3677999973297119,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.3677999973297119,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.18559999763965607,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.14399999380111694,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/rendering","display_name":"Rendering (computer graphics)","score":0.646399974822998},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.45890000462532043},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.40950000286102295},{"id":"https://openalex.org/keywords/view-synthesis","display_name":"View synthesis","score":0.3824000060558319},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.3709000051021576},{"id":"https://openalex.org/keywords/monocular","display_name":"Monocular","score":0.3553999960422516},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.35359999537467957},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.3481000065803528},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.3370000123977661}],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6990000009536743},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6973000168800354},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6940000057220459},{"id":"https://openalex.org/C205711294","wikidata":"https://www.wikidata.org/wiki/Q176953","display_name":"Rendering (computer graphics)","level":2,"score":0.646399974822998},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.45890000462532043},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.40950000286102295},{"id":"https://openalex.org/C2776449333","wikidata":"https://www.wikidata.org/wiki/Q7928781","display_name":"View synthesis","level":3,"score":0.3824000060558319},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.3813000023365021},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.3709000051021576},{"id":"https://openalex.org/C65909025","wikidata":"https://www.wikidata.org/wiki/Q1945033","display_name":"Monocular","level":2,"score":0.3553999960422516},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.35359999537467957},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.3481000065803528},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.3370000123977661},{"id":"https://openalex.org/C109950114","wikidata":"https://www.wikidata.org/wiki/Q4464732","display_name":"3D reconstruction","level":2,"score":0.32910001277923584},{"id":"https://openalex.org/C87833898","wikidata":"https://www.wikidata.org/wiki/Q1060280","display_name":"Advanced driver assistance systems","level":2,"score":0.32260000705718994},{"id":"https://openalex.org/C108882727","wikidata":"https://www.wikidata.org/wiki/Q2991685","display_name":"Solid modeling","level":2,"score":0.32120001316070557},{"id":"https://openalex.org/C194969405","wikidata":"https://www.wikidata.org/wiki/Q170519","display_name":"Virtual reality","level":2,"score":0.3206999897956848},{"id":"https://openalex.org/C23903533","wikidata":"https://www.wikidata.org/wiki/Q17122739","display_name":"Reprojection error","level":3,"score":0.31200000643730164},{"id":"https://openalex.org/C2776863239","wikidata":"https://www.wikidata.org/wiki/Q7936601","display_name":"Visual hull","level":3,"score":0.3116999864578247},{"id":"https://openalex.org/C2778597888","wikidata":"https://www.wikidata.org/wiki/Q172169","display_name":"3D city models","level":3,"score":0.30880001187324524},{"id":"https://openalex.org/C202615002","wikidata":"https://www.wikidata.org/wiki/Q783507","display_name":"Differentiable function","level":2,"score":0.2816999852657318},{"id":"https://openalex.org/C110898773","wikidata":"https://www.wikidata.org/wiki/Q2933935","display_name":"Camera resectioning","level":2,"score":0.27639999985694885},{"id":"https://openalex.org/C3019007443","wikidata":"https://www.wikidata.org/wiki/Q568742","display_name":"3d model","level":2,"score":0.27390000224113464},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.2702000141143799},{"id":"https://openalex.org/C181672929","wikidata":"https://www.wikidata.org/wiki/Q4115141","display_name":"Digital mapping","level":2,"score":0.26669999957084656},{"id":"https://openalex.org/C2987571089","wikidata":"https://www.wikidata.org/wiki/Q738160","display_name":"Multi camera","level":2,"score":0.2590999901294708},{"id":"https://openalex.org/C77660652","wikidata":"https://www.wikidata.org/wiki/Q150971","display_name":"Computer graphics","level":2,"score":0.25769999623298645}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.19257","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.19257","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.19257","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.19257","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Creating":[0],"realistic":[1],"and":[2,12,42,108,163,180,191,211],"simulation-ready":[3],"3D":[4,18,68,142,193],"assets":[5,206],"is":[6,126],"crucial":[7],"for":[8,129,207],"autonomous":[9],"driving":[10,53,72,175,208],"research":[11],"virtual":[13],"environment":[14],"construction.":[15],"However,":[16],"existing":[17],"vehicle":[19,194],"generation":[20],"methods":[21],"are":[22],"often":[23,38],"trained":[24],"on":[25],"synthetic":[26],"data":[27],"with":[28,96,177],"significant":[29],"domain":[30],"gaps":[31],"from":[32,70,120,145,196],"real-world":[33,71,160,197],"distributions.":[34],"The":[35,123],"generated":[36,170],"models":[37,195],"exhibit":[39],"arbitrary":[40],"poses":[41],"undefined":[43],"scales,":[44],"resulting":[45],"in":[46],"poor":[47],"visual":[48],"consistency":[49],"when":[50],"integrated":[51],"into":[52],"scenes.":[54],"In":[55,83,100],"this":[56],"paper,":[57],"we":[58,87,104,152],"present":[59],"Unposed-to-3D,":[60],"a":[61,110,155,164,200],"novel":[62],"framework":[63],"that":[64,114,167,185],"learns":[65],"to":[66,132,140,158,172],"reconstruct":[67],"vehicles":[69,171],"images":[73,95],"using":[74,93],"image-only":[75],"supervision.":[76],"Our":[77],"approach":[78],"consists":[79],"of":[80],"two":[81],"stages.":[82],"the":[84,101,117,138,169,173],"first":[85],"stage,":[86,103],"train":[88],"an":[89],"image-to-3D":[90],"reconstruction":[91],"network":[92],"posed":[94],"known":[97],"camera":[98,106,111,118],"parameters.":[99],"second":[102],"remove":[105],"supervision":[107],"use":[109],"prediction":[112],"head":[113],"directly":[115],"estimates":[116],"parameters":[119],"unposed":[121,146],"images.":[122,147],"predicted":[124],"pose":[125],"then":[127],"used":[128],"differentiable":[130],"rendering":[131],"provide":[133],"self-supervised":[134],"photometric":[135],"feedback,":[136],"enabling":[137],"model":[139],"learn":[141],"geometry":[143],"purely":[144],"To":[148],"ensure":[149],"simulation":[150,210],"readiness,":[151],"further":[153],"introduce":[154],"scale-aware":[156],"module":[157,166],"predict":[159],"size":[161],"information,":[162],"harmonization":[165],"adapts":[168],"target":[174],"scene":[176,209],"consistent":[178],"lighting":[179],"appearance.":[181],"Extensive":[182],"experiments":[183],"demonstrate":[184],"Unposed-to-3D":[186],"effectively":[187],"reconstructs":[188],"realistic,":[189],"pose-consistent,":[190],"harmonized":[192],"images,":[198],"providing":[199],"scalable":[201],"path":[202],"toward":[203],"creating":[204],"high-quality":[205],"digital":[212],"twin":[213],"environments.":[214]},"counts_by_year":[],"updated_date":"2026-07-01T06:00:48.157686","created_date":"2026-04-23T00:00:00"}
