{"id":"https://openalex.org/W7131375111","doi":"https://doi.org/10.48550/arxiv.2602.19766","title":"One2Scene: Geometric Consistent Explorable 3D Scene Generation from a Single Image","display_name":"One2Scene: Geometric Consistent Explorable 3D Scene Generation from a Single Image","publication_year":2026,"publication_date":"2026-02-23","ids":{"openalex":"https://openalex.org/W7131375111","doi":"https://doi.org/10.48550/arxiv.2602.19766"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2602.19766","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.19766","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2602.19766","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5126825268","display_name":"Pengfei Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Wang, Pengfei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004719638","display_name":"Chen Li-yi","orcid":"https://orcid.org/0000-0001-6600-5064"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Liyi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126805333","display_name":"Zhiyuan Ma","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ma, Zhiyuan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126799308","display_name":"Yanjun Guo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Guo, Yanjun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126818092","display_name":"Guowen Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Guowen","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5126811730","display_name":"Lei Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Lei","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5126825268"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9574999809265137,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9574999809265137,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.013700000010430813,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.010499999858438969,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/panorama","display_name":"Panorama","score":0.8945000171661377},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.597599983215332},{"id":"https://openalex.org/keywords/prior-probability","display_name":"Prior probability","score":0.5353000164031982},{"id":"https://openalex.org/keywords/generator","display_name":"Generator (circuit theory)","score":0.5133000016212463},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.43959999084472656},{"id":"https://openalex.org/keywords/gaussian","display_name":"Gaussian","score":0.3804999887943268},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.37610000371932983},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.33730000257492065}],"concepts":[{"id":"https://openalex.org/C2780580889","wikidata":"https://www.wikidata.org/wiki/Q41363","display_name":"Panorama","level":2,"score":0.8945000171661377},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7534999847412109},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.7477999925613403},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7125999927520752},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.597599983215332},{"id":"https://openalex.org/C177769412","wikidata":"https://www.wikidata.org/wiki/Q278090","display_name":"Prior probability","level":3,"score":0.5353000164031982},{"id":"https://openalex.org/C2780992000","wikidata":"https://www.wikidata.org/wiki/Q17016113","display_name":"Generator (circuit theory)","level":3,"score":0.5133000016212463},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.43959999084472656},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.3804999887943268},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.37610000371932983},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.33730000257492065},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.33090001344680786},{"id":"https://openalex.org/C108882727","wikidata":"https://www.wikidata.org/wiki/Q2991685","display_name":"Solid modeling","level":2,"score":0.32850000262260437},{"id":"https://openalex.org/C2987632653","wikidata":"https://www.wikidata.org/wiki/Q7611220","display_name":"Stereo image","level":3,"score":0.3190000057220459},{"id":"https://openalex.org/C109950114","wikidata":"https://www.wikidata.org/wiki/Q4464732","display_name":"3D reconstruction","level":2,"score":0.30160000920295715},{"id":"https://openalex.org/C141379421","wikidata":"https://www.wikidata.org/wiki/Q6094427","display_name":"Iterative reconstruction","level":2,"score":0.29159998893737793},{"id":"https://openalex.org/C139002025","wikidata":"https://www.wikidata.org/wiki/Q3001212","display_name":"Lift (data mining)","level":2,"score":0.2809999883174896},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.27720001339912415},{"id":"https://openalex.org/C136520226","wikidata":"https://www.wikidata.org/wiki/Q302814","display_name":"Geometric data analysis","level":2,"score":0.2709999978542328},{"id":"https://openalex.org/C166704113","wikidata":"https://www.wikidata.org/wiki/Q861092","display_name":"Image registration","level":3,"score":0.2648000121116638},{"id":"https://openalex.org/C32990609","wikidata":"https://www.wikidata.org/wiki/Q306542","display_name":"Transformation geometry","level":2,"score":0.2614000141620636},{"id":"https://openalex.org/C104065381","wikidata":"https://www.wikidata.org/wiki/Q1002535","display_name":"Geometric modeling","level":2,"score":0.25040000677108765}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2602.19766","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.19766","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2602.19766","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.19766","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Generating":[0],"explorable":[1,58,217],"3D":[2,14,87,218],"scenes":[3],"from":[4,36,71,134],"a":[5,9,64,72,91,103,161,165,183],"single":[6,73,104],"image":[7,75,105],"is":[8,143],"highly":[10],"challenging":[11],"problem":[12,50],"in":[13,209],"vision.":[15],"Existing":[16],"methods":[17,208],"struggle":[18],"to":[19,55,67,128,145,169,186],"support":[20],"free":[21],"exploration,":[22],"often":[23],"producing":[24],"severe":[25],"geometric":[26,88,131],"distortions":[27],"and":[28,116,152,172,216],"noisy":[29],"artifacts":[30],"when":[31],"the":[32,37,100,118,157],"viewpoint":[33],"moves":[34],"far":[35],"original":[38],"perspective.":[39],"We":[40,61],"introduce":[41],"\\textbf{One2Scene},":[42],"an":[43,85,150],"effective":[44],"framework":[45],"that":[46,203],"decomposes":[47],"this":[48],"ill-posed":[49],"into":[51,84,111],"three":[52],"tractable":[53],"sub-tasks":[54],"enable":[56],"immersive":[57,197],"scene":[59,198,219],"generation.":[60,220],"first":[62],"use":[63],"panorama":[65,101,210],"generator":[66,168],"produce":[68,170],"anchor":[69,114],"views":[70,115,175],"input":[74],"as":[76,102,121,160],"initialization.":[77],"Then,":[78],"we":[79,108],"lift":[80],"these":[81],"2D":[82],"anchors":[83],"explicit":[86],"scaffold":[89,158,185],"via":[90],"generalizable,":[92],"feed-forward":[93,213],"Gaussian":[94],"Splatting":[95],"network.":[96],"Instead":[97],"of":[98],"treating":[99],"for":[106,164],"reconstruction,":[107,188,215],"project":[109],"it":[110],"multiple":[112],"sparse":[113],"reformulate":[117],"reconstruction":[119],"task":[120],"multi-view":[122,136],"stereo":[123],"matching,":[124],"which":[125],"allows":[126],"us":[127],"leverage":[129],"robust":[130],"priors":[132],"learned":[133],"large-scale":[135],"datasets.":[137],"A":[138],"bidirectional":[139],"feature":[140],"fusion":[141],"module":[142],"used":[144],"enforce":[146],"cross-view":[147],"consistency,":[148],"yielding":[149],"efficient":[151],"geometrically":[153,173],"reliable":[154],"scaffold.":[155],"Finally,":[156],"serves":[159],"strong":[162],"prior":[163],"novel":[166],"view":[167],"photorealistic":[171],"accurate":[174],"at":[176],"arbitrary":[177],"cameras.":[178],"By":[179],"explicitly":[180],"conditioning":[181],"on":[182],"3D-consistent":[184],"perform":[187],"One2Scene":[189,204],"works":[190],"stably":[191],"under":[192],"large":[193],"camera":[194],"motions,":[195],"supporting":[196],"exploration.":[199],"Extensive":[200],"experiments":[201],"show":[202],"substantially":[205],"outperforms":[206],"state-of-the-art":[207],"depth":[211],"estimation,":[212],"360\u00b0":[214],"Project":[221],"page:":[222],"https://one2scene5406.github.io/":[223]},"counts_by_year":[],"updated_date":"2026-03-03T06:13:14.889584","created_date":"2026-02-26T00:00:00"}
