{"id":"https://openalex.org/W7140175890","doi":"https://doi.org/10.48550/arxiv.2603.22275","title":"Repurposing Geometric Foundation Models for Multi-view Diffusion","display_name":"Repurposing Geometric Foundation Models for Multi-view Diffusion","publication_year":2026,"publication_date":"2026-03-23","ids":{"openalex":"https://openalex.org/W7140175890","doi":"https://doi.org/10.48550/arxiv.2603.22275"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.22275","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.22275","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.22275","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Jang, Wooseok","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Jang, Wooseok","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Jeon, Seonghu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jeon, Seonghu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Han, Jisang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Han, Jisang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Choi, Jinhyeok","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Choi, Jinhyeok","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Kwon, Minkyung","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kwon, Minkyung","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Kim, Seungryong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kim, Seungryong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Xie, Saining","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xie, Saining","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Liu, Sainan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Sainan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.7853000164031982,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.7853000164031982,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.08699999749660492,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10481","display_name":"Computer Graphics and Visualization Techniques","score":0.05260000005364418,"subfield":{"id":"https://openalex.org/subfields/1704","display_name":"Computer Graphics and Computer-Aided Design"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.5008999705314636},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.4726000130176544},{"id":"https://openalex.org/keywords/repurposing","display_name":"Repurposing","score":0.45080000162124634},{"id":"https://openalex.org/keywords/space","display_name":"Space (punctuation)","score":0.44269999861717224},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.4293999969959259},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.42809998989105225},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.423799991607666}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5784000158309937},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5044999718666077},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.5008999705314636},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.4726000130176544},{"id":"https://openalex.org/C519536355","wikidata":"https://www.wikidata.org/wiki/Q21021151","display_name":"Repurposing","level":2,"score":0.45080000162124634},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.44269999861717224},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.4293999969959259},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.42809998989105225},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.423799991607666},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.37779998779296875},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.32120001316070557},{"id":"https://openalex.org/C83665646","wikidata":"https://www.wikidata.org/wiki/Q42139305","display_name":"Feature vector","level":2,"score":0.3190000057220459},{"id":"https://openalex.org/C101814296","wikidata":"https://www.wikidata.org/wiki/Q5439685","display_name":"Feature model","level":3,"score":0.29420000314712524},{"id":"https://openalex.org/C33676613","wikidata":"https://www.wikidata.org/wiki/Q13415176","display_name":"Dimension (graph theory)","level":2,"score":0.28049999475479126},{"id":"https://openalex.org/C65965080","wikidata":"https://www.wikidata.org/wiki/Q1806885","display_name":"Latent variable model","level":3,"score":0.257099986076355},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.25540000200271606},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2551000118255615},{"id":"https://openalex.org/C104065381","wikidata":"https://www.wikidata.org/wiki/Q1002535","display_name":"Geometric modeling","level":2,"score":0.2531999945640564},{"id":"https://openalex.org/C69357855","wikidata":"https://www.wikidata.org/wiki/Q163214","display_name":"Diffusion","level":2,"score":0.2508000135421753}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.22275","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.22275","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.22275","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.22275","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"While":[0],"recent":[1],"advances":[2],"in":[3,11,40],"generative":[4,152],"latent":[5,16,44,70,96,129],"spaces":[6],"have":[7],"driven":[8],"substantial":[9],"progress":[10],"single-image":[12],"generation,":[13],"the":[14,59,69,127],"optimal":[15],"space":[17,63,71,97],"for":[18,72,98],"novel":[19],"view":[20],"synthesis":[21],"(NVS)":[22],"remains":[23,133],"largely":[24],"unexplored.":[25],"In":[26,46],"particular,":[27],"NVS":[28],"requires":[29],"geometrically":[30,60],"consistent":[31,61],"generation":[32],"across":[33],"viewpoints,":[34],"but":[35,86],"existing":[36],"approaches":[37],"typically":[38],"operate":[39],"a":[41,55,94],"view-independent":[42],"VAE":[43,107,128],"space.":[45,130],"this":[47],"paper,":[48],"we":[49],"propose":[50],"Geometric":[51],"Latent":[52],"Diffusion":[53],"(GLD),":[54],"framework":[56],"that":[57,77,103,138],"repurposes":[58],"feature":[62],"of":[64],"geometric":[65,91],"foundation":[66],"models":[67],"as":[68],"multi-view":[73],"diffusion.":[74],"We":[75],"show":[76],"these":[78],"features":[79],"not":[80],"only":[81],"support":[82],"high-fidelity":[83],"RGB":[84],"reconstruction":[85],"also":[87],"encode":[88],"strong":[89],"cross-view":[90],"correspondences,":[92],"providing":[93],"well-suited":[95],"NVS.":[99],"Our":[100],"experiments":[101],"demonstrate":[102],"GLD":[104,132],"outperforms":[105],"both":[106],"and":[108,114],"RAE":[109],"on":[110],"2D":[111],"image":[112],"quality":[113],"3D":[115],"consistency":[116],"metrics,":[117],"while":[118],"accelerating":[119],"training":[120,144],"by":[121],"more":[122],"than":[123],"4.4x":[124],"compared":[125],"to":[126],"Notably,":[131],"competitive":[134],"with":[135],"state-of-the-art":[136],"methods":[137],"leverage":[139],"large-scale":[140],"text-to-image":[141],"pretraining,":[142],"despite":[143],"its":[145],"diffusion":[146],"model":[147],"from":[148],"scratch":[149],"without":[150],"such":[151],"pretraining.":[153]},"counts_by_year":[],"updated_date":"2026-04-25T08:17:42.794288","created_date":"2026-03-25T00:00:00"}
