{"id":"https://openalex.org/W7118684197","doi":"https://doi.org/10.48550/arxiv.2601.00368","title":"Mask-Conditioned Voxel Diffusion for Joint Geometry and Color Inpainting","display_name":"Mask-Conditioned Voxel Diffusion for Joint Geometry and Color Inpainting","publication_year":2026,"publication_date":"2026-01-01","ids":{"openalex":"https://openalex.org/W7118684197","doi":"https://doi.org/10.48550/arxiv.2601.00368"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2601.00368","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.00368","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2601.00368","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5114539415","display_name":"Aarya Sumuk","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Sumuk, Aarya","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5114539415"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.5482000112533569,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.5482000112533569,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10481","display_name":"Computer Graphics and Visualization Techniques","score":0.2198999971151352,"subfield":{"id":"https://openalex.org/subfields/1704","display_name":"Computer Graphics and Computer-Aided Design"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.06689999997615814,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/inpainting","display_name":"Inpainting","score":0.8255000114440918},{"id":"https://openalex.org/keywords/rgb-color-model","display_name":"RGB color model","score":0.6955000162124634},{"id":"https://openalex.org/keywords/voxel","display_name":"Voxel","score":0.6341000199317932},{"id":"https://openalex.org/keywords/joint","display_name":"Joint (building)","score":0.6011999845504761},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.5259000062942505},{"id":"https://openalex.org/keywords/complex-geometry","display_name":"Complex geometry","score":0.4447000026702881},{"id":"https://openalex.org/keywords/color-difference","display_name":"Color difference","score":0.4043999910354614},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.3840999901294708},{"id":"https://openalex.org/keywords/color-image","display_name":"Color image","score":0.37389999628067017}],"concepts":[{"id":"https://openalex.org/C11727466","wikidata":"https://www.wikidata.org/wiki/Q1628157","display_name":"Inpainting","level":3,"score":0.8255000114440918},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7527999877929688},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.7294999957084656},{"id":"https://openalex.org/C82990744","wikidata":"https://www.wikidata.org/wiki/Q166194","display_name":"RGB color model","level":2,"score":0.6955000162124634},{"id":"https://openalex.org/C54170458","wikidata":"https://www.wikidata.org/wiki/Q663554","display_name":"Voxel","level":2,"score":0.6341000199317932},{"id":"https://openalex.org/C18555067","wikidata":"https://www.wikidata.org/wiki/Q8375051","display_name":"Joint (building)","level":2,"score":0.6011999845504761},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5386000275611877},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.5259000062942505},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.4666000008583069},{"id":"https://openalex.org/C158843486","wikidata":"https://www.wikidata.org/wiki/Q2137810","display_name":"Complex geometry","level":2,"score":0.4447000026702881},{"id":"https://openalex.org/C186991048","wikidata":"https://www.wikidata.org/wiki/Q1184883","display_name":"Color difference","level":3,"score":0.4043999910354614},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.3840999901294708},{"id":"https://openalex.org/C142616399","wikidata":"https://www.wikidata.org/wiki/Q5148604","display_name":"Color image","level":4,"score":0.37389999628067017},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.365200012922287},{"id":"https://openalex.org/C69357855","wikidata":"https://www.wikidata.org/wiki/Q163214","display_name":"Diffusion","level":2,"score":0.35429999232292175},{"id":"https://openalex.org/C109950114","wikidata":"https://www.wikidata.org/wiki/Q4464732","display_name":"3D reconstruction","level":2,"score":0.32409998774528503},{"id":"https://openalex.org/C187888035","wikidata":"https://www.wikidata.org/wiki/Q2563885","display_name":"Color constancy","level":3,"score":0.2962999939918518},{"id":"https://openalex.org/C141379421","wikidata":"https://www.wikidata.org/wiki/Q6094427","display_name":"Iterative reconstruction","level":2,"score":0.2937999963760376},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.29019999504089355},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.28940001130104065},{"id":"https://openalex.org/C2961294","wikidata":"https://www.wikidata.org/wiki/Q166863","display_name":"Color space","level":3,"score":0.27230000495910645},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.26829999685287476},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.2653999924659729},{"id":"https://openalex.org/C153008295","wikidata":"https://www.wikidata.org/wiki/Q6535093","display_name":"Level set (data structures)","level":2,"score":0.25999999046325684},{"id":"https://openalex.org/C159784718","wikidata":"https://www.wikidata.org/wiki/Q182571","display_name":"Color balance","level":5,"score":0.2583000063896179},{"id":"https://openalex.org/C12043971","wikidata":"https://www.wikidata.org/wiki/Q2636542","display_name":"Color histogram","level":5,"score":0.25760000944137573},{"id":"https://openalex.org/C108882727","wikidata":"https://www.wikidata.org/wiki/Q2991685","display_name":"Solid modeling","level":2,"score":0.2554999887943268},{"id":"https://openalex.org/C36262787","wikidata":"https://www.wikidata.org/wiki/Q2294018","display_name":"Color model","level":4,"score":0.2554999887943268}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2601.00368","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.00368","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2601.00368","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.00368","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Sustainable cities and communities","score":0.8315178155899048,"id":"https://metadata.un.org/sdg/11"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"We":[0,105],"present":[1],"a":[2,36,48,57,64,91,110,142,155],"lightweight":[3],"two-stage":[4],"framework":[5],"for":[6,163],"joint":[7,164],"geometry":[8,76,135,166],"and":[9,51,77,88,102,123,136,167],"color":[10,78,89,100,124,139,168],"inpainting":[11,70],"of":[12,21,113],"damaged":[13],"3D":[14,66,165],"objects,":[15],"motivated":[16],"by":[17],"the":[18,33,61,107,147],"digital":[19],"restoration":[20],"cultural":[22],"heritage":[23],"artifacts.":[24],"The":[25,83],"pipeline":[26],"separates":[27],"damage":[28,41,119],"localization":[29],"from":[30,47],"reconstruction.":[31],"In":[32,60],"first":[34],"stage,":[35,63],"2D":[37],"convolutional":[38],"network":[39],"predicts":[40,86],"masks":[42],"on":[43,72,109],"RGB":[44],"slices":[45],"extracted":[46],"voxelized":[49],"object,":[50],"these":[52],"predictions":[53],"are":[54],"aggregated":[55],"into":[56],"volumetric":[58,160],"mask.":[59],"second":[62],"diffusion-based":[65],"U-Net":[67],"performs":[68],"mask-conditioned":[69],"directly":[71],"voxel":[73],"grids,":[74],"reconstructing":[75],"while":[79],"preserving":[80],"observed":[81],"regions.":[82],"model":[84],"jointly":[85],"occupancy":[87,96],"using":[90,120],"composite":[92],"objective":[93],"that":[94,150],"combines":[95],"reconstruction":[97,101],"with":[98,116],"masked":[99],"perceptual":[103],"regularization.":[104],"evaluate":[106],"approach":[108],"curated":[111],"set":[112],"textured":[114],"artifacts":[115],"synthetically":[117],"generated":[118],"standard":[121],"geometric":[122],"metrics.":[125],"Compared":[126],"to":[127,158],"symmetry-based":[128],"baselines,":[129],"our":[130],"method":[131],"produces":[132],"more":[133,137],"complete":[134],"coherent":[138],"reconstructions":[140],"at":[141],"fixed":[143],"32^3":[144],"resolution.":[145],"Overall,":[146],"results":[148],"indicate":[149],"explicit":[151],"mask":[152],"conditioning":[153],"is":[154],"practical":[156],"way":[157],"guide":[159],"diffusion":[161],"models":[162],"inpainting.":[169]},"counts_by_year":[],"updated_date":"2026-01-08T20:10:11.968330","created_date":"2026-01-08T00:00:00"}
