{"id":"https://openalex.org/W7155204287","doi":"https://doi.org/10.48550/arxiv.2604.19624","title":"GRAFT: Geometric Refinement and Fitting Transformer for Human Scene Reconstruction","display_name":"GRAFT: Geometric Refinement and Fitting Transformer for Human Scene Reconstruction","publication_year":2026,"publication_date":"2026-04-21","ids":{"openalex":"https://openalex.org/W7155204287","doi":"https://doi.org/10.48550/arxiv.2604.19624"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.19624","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.19624","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.19624","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5134297673","display_name":"Pradyumna YM","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"YM, Pradyumna","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134353613","display_name":"Yuxuan Xue","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xue, Yuxuan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100454838","display_name":"Yue Chen","orcid":"https://orcid.org/0000-0003-4088-7649"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Yue","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063262037","display_name":"Nikita Kister","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kister, Nikita","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003174716","display_name":"Istv\u00e1n S\u00e1r\u00e1ndi","orcid":"https://orcid.org/0000-0002-5686-3214"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"S\u00e1r\u00e1ndi, Istv\u00e1n","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5134225711","display_name":"Gerard Pons-Moll","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pons-Moll, Gerard","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.4758000075817108,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.4758000075817108,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.39010000228881836,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.043699998408555984,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/polygon-mesh","display_name":"Polygon mesh","score":0.7562999725341797},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.48660001158714294},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.4722999930381775},{"id":"https://openalex.org/keywords/prior-probability","display_name":"Prior probability","score":0.461899995803833},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.3702999949455261},{"id":"https://openalex.org/keywords/solid-modeling","display_name":"Solid modeling","score":0.32820001244544983},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.30390000343322754},{"id":"https://openalex.org/keywords/image-quality","display_name":"Image quality","score":0.30239999294281006}],"concepts":[{"id":"https://openalex.org/C31487907","wikidata":"https://www.wikidata.org/wiki/Q1154597","display_name":"Polygon mesh","level":2,"score":0.7562999725341797},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6952999830245972},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.625},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5504999756813049},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.48660001158714294},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.4722999930381775},{"id":"https://openalex.org/C177769412","wikidata":"https://www.wikidata.org/wiki/Q278090","display_name":"Prior probability","level":3,"score":0.461899995803833},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.40389999747276306},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.3702999949455261},{"id":"https://openalex.org/C108882727","wikidata":"https://www.wikidata.org/wiki/Q2991685","display_name":"Solid modeling","level":2,"score":0.32820001244544983},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.30390000343322754},{"id":"https://openalex.org/C55020928","wikidata":"https://www.wikidata.org/wiki/Q3813865","display_name":"Image quality","level":3,"score":0.30239999294281006},{"id":"https://openalex.org/C109950114","wikidata":"https://www.wikidata.org/wiki/Q4464732","display_name":"3D reconstruction","level":2,"score":0.29649999737739563},{"id":"https://openalex.org/C3019007443","wikidata":"https://www.wikidata.org/wiki/Q568742","display_name":"3d model","level":2,"score":0.29420000314712524},{"id":"https://openalex.org/C2780580889","wikidata":"https://www.wikidata.org/wiki/Q41363","display_name":"Panorama","level":2,"score":0.2939000129699707},{"id":"https://openalex.org/C141379421","wikidata":"https://www.wikidata.org/wiki/Q6094427","display_name":"Iterative reconstruction","level":2,"score":0.29249998927116394},{"id":"https://openalex.org/C181095308","wikidata":"https://www.wikidata.org/wiki/Q1541599","display_name":"Geometric primitive","level":2,"score":0.2892000079154968},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.28790000081062317},{"id":"https://openalex.org/C104065381","wikidata":"https://www.wikidata.org/wiki/Q1002535","display_name":"Geometric modeling","level":2,"score":0.27959999442100525},{"id":"https://openalex.org/C7305733","wikidata":"https://www.wikidata.org/wiki/Q207961","display_name":"Geometric shape","level":2,"score":0.2750999927520752},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.2596000134944916},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.257099986076355}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.19624","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.19624","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.19624","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.19624","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Reconstructing":[0],"physically":[1],"plausible":[2],"3D":[3,83],"human-scene":[4],"interactions":[5],"(HSI)":[6],"from":[7],"a":[8,13,63,152],"single":[9],"image":[10,145],"currently":[11],"presents":[12],"trade-off:":[14],"optimization":[15],"based":[16],"methods":[17,160,176],"offer":[18],"accurate":[19],"contact":[20],"but":[21],"are":[22,28],"slow":[23],"(~20s),":[24],"while":[25,186],"feed-forward":[26,53,159,175],"approaches":[27],"fast":[29,52],"yet":[30],"lack":[31],"explicit":[32],"interaction":[33,92,167,180],"reasoning,":[34],"producing":[35],"floating":[36],"and":[37,121,134,177,193],"interpenetration":[38],"artifacts.":[39],"Our":[40],"key":[41],"insight":[42],"is":[43],"that":[44,67,74,107,157],"geometry-based":[45],"human--scene":[46],"fitting":[47],"can":[48],"be":[49],"amortized":[50],"into":[51,94],"inference.":[54],"We":[55],"present":[56],"GRAFT":[57,89,137,165],"(Geometric":[58],"Refinement":[59],"And":[60],"Fitting":[61],"Transformer),":[62],"learned":[64,132],"HSI":[65,155],"prior":[66,156],"predicts":[68],"Interaction":[69],"Gradients:":[70],"corrective":[71],"parameter":[72],"updates":[73,118],"iteratively":[75],"refine":[76],"human":[77,119],"meshes":[78,120],"by":[79,169],"reasoning":[80],"about":[81],"their":[82],"relationship":[84],"to":[85,171,189],"the":[86,91,101,123,126],"surrounding":[87],"scene.":[88],"encodes":[90],"state":[93],"compact":[95],"body-anchored":[96],"tokens,":[97],"each":[98],"grounded":[99],"in":[100,196],"scene":[102],"geometry":[103,149],"via":[104],"Geometric":[105],"Probes":[106],"capture":[108],"spatial":[109],"relationships":[110],"with":[111,130,148],"nearby":[112],"surfaces.":[113],"A":[114],"lightweight":[115],"transformer":[116],"recurrently":[117],"re-probes":[122],"scene,":[124],"ensuring":[125],"final":[127],"pose":[128],"aligns":[129],"both":[131],"priors":[133],"observed":[135],"geometry.":[136],"operates":[138],"either":[139],"as":[140,151],"an":[141],"end-to-end":[142],"reconstructor":[143],"using":[144],"features,":[146],"or":[147],"alone":[150],"transferable":[153],"plug-and-play":[154],"improves":[158,166],"without":[161],"retraining.":[162],"Experiments":[163],"show":[164],"quality":[168,181],"up":[170],"113%":[172],"over":[173],"state-of-the-art":[174],"matches":[178],"optimization-based":[179],"at":[182],"${\\sim}50{\\times}$":[183],"lower":[184],"runtime,":[185],"generalizing":[187],"seamlessly":[188],"in-the-wild":[190],"multi-person":[191],"scenes":[192],"being":[194],"preferred":[195],"64.8%":[197],"of":[198],"three-way":[199],"user":[200],"study.":[201],"Project":[202],"page:":[203],"https://pradyumnaym.github.io/graft":[204],".":[205]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-23T00:00:00"}
