{"id":"https://openalex.org/W4394775924","doi":"https://doi.org/10.1109/3dv69130.2026.00071","title":"Reconstructing Hand-Held Objects in 3D from Images and Videos","display_name":"Reconstructing Hand-Held Objects in 3D from Images and Videos","publication_year":2026,"publication_date":"2026-03-20","ids":{"openalex":"https://openalex.org/W4394775924","doi":"https://doi.org/10.1109/3dv69130.2026.00071"},"language":"en","primary_location":{"id":"doi:10.1109/3dv69130.2026.00071","is_oa":false,"landing_page_url":"https://doi.org/10.1109/3dv69130.2026.00071","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2026 International Conference on 3D Vision (3DV)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2404.06507","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5008942444","display_name":"Jane Y. Wu","orcid":"https://orcid.org/0000-0003-1794-1213"},"institutions":[{"id":"https://openalex.org/I134446601","display_name":"Berkeley College","ror":"https://ror.org/02xewxa75","country_code":"US","type":"education","lineage":["https://openalex.org/I134446601"]},{"id":"https://openalex.org/I95457486","display_name":"University of California, Berkeley","ror":"https://ror.org/01an7q238","country_code":"US","type":"education","lineage":["https://openalex.org/I95457486"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jane Wu","raw_affiliation_strings":["UC Berkeley"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"UC Berkeley","institution_ids":["https://openalex.org/I134446601","https://openalex.org/I95457486"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052269532","display_name":"Georgios Pavlakos","orcid":"https://orcid.org/0000-0001-5821-1909"},"institutions":[{"id":"https://openalex.org/I86519309","display_name":"The University of Texas at Austin","ror":"https://ror.org/00hj54h04","country_code":"US","type":"education","lineage":["https://openalex.org/I86519309"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Georgios Pavlakos","raw_affiliation_strings":["UT Austin"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"UT Austin","institution_ids":["https://openalex.org/I86519309"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014407395","display_name":"Georgia Gkioxari","orcid":null},"institutions":[{"id":"https://openalex.org/I122411786","display_name":"California Institute of Technology","ror":"https://ror.org/05dxps055","country_code":"US","type":"education","lineage":["https://openalex.org/I122411786"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Georgia Gkioxari","raw_affiliation_strings":["Caltech"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Caltech","institution_ids":["https://openalex.org/I122411786"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5001594573","display_name":"Jitendra Malik","orcid":"https://orcid.org/0000-0003-3695-1580"},"institutions":[{"id":"https://openalex.org/I134446601","display_name":"Berkeley College","ror":"https://ror.org/02xewxa75","country_code":"US","type":"education","lineage":["https://openalex.org/I134446601"]},{"id":"https://openalex.org/I95457486","display_name":"University of California, Berkeley","ror":"https://ror.org/01an7q238","country_code":"US","type":"education","lineage":["https://openalex.org/I95457486"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jitendra Malik","raw_affiliation_strings":["UC Berkeley"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"UC Berkeley","institution_ids":["https://openalex.org/I134446601","https://openalex.org/I95457486"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.00115637,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"681","last_page":"692"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12874","display_name":"Digital Imaging for Blood Diseases","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9952999949455261,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.8245800733566284},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7828617691993713},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.7452932000160217},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7444437146186829},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5469040274620056},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.546289324760437},{"id":"https://openalex.org/keywords/rgb-color-model","display_name":"RGB color model","score":0.49835634231567383},{"id":"https://openalex.org/keywords/pixel","display_name":"Pixel","score":0.49563610553741455},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.45132768154144287},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.44954153895378113},{"id":"https://openalex.org/keywords/object-model","display_name":"Object model","score":0.41869065165519714},{"id":"https://openalex.org/keywords/computer-graphics","display_name":"Computer graphics (images)","score":0.3466287851333618},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.09274032711982727},{"id":"https://openalex.org/keywords/cartography","display_name":"Cartography","score":0.06663250923156738}],"concepts":[{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.8245800733566284},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7828617691993713},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.7452932000160217},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7444437146186829},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5469040274620056},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.546289324760437},{"id":"https://openalex.org/C82990744","wikidata":"https://www.wikidata.org/wiki/Q166194","display_name":"RGB color model","level":2,"score":0.49835634231567383},{"id":"https://openalex.org/C160633673","wikidata":"https://www.wikidata.org/wiki/Q355198","display_name":"Pixel","level":2,"score":0.49563610553741455},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.45132768154144287},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.44954153895378113},{"id":"https://openalex.org/C20894473","wikidata":"https://www.wikidata.org/wiki/Q1116105","display_name":"Object model","level":3,"score":0.41869065165519714},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.3466287851333618},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.09274032711982727},{"id":"https://openalex.org/C58640448","wikidata":"https://www.wikidata.org/wiki/Q42515","display_name":"Cartography","level":1,"score":0.06663250923156738},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/3dv69130.2026.00071","is_oa":false,"landing_page_url":"https://doi.org/10.1109/3dv69130.2026.00071","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2026 International Conference on 3D Vision (3DV)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2404.06507","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2404.06507","pdf_url":"https://arxiv.org/pdf/2404.06507","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2404.06507","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2404.06507","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2404.06507","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2404.06507","pdf_url":"https://arxiv.org/pdf/2404.06507","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3452063466","display_name":null,"funder_award_id":"N00014-21-1-2801","funder_id":"https://openalex.org/F4320337345","funder_display_name":"Office of Naval Research"},{"id":"https://openalex.org/G8876996369","display_name":null,"funder_award_id":"N00014","funder_id":"https://openalex.org/F4320337345","funder_display_name":"Office of Naval Research"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320333591","display_name":"Multidisciplinary University Research Initiative","ror":null},{"id":"https://openalex.org/F4320337345","display_name":"Office of Naval Research","ror":"https://ror.org/00rk2pe57"},{"id":"https://openalex.org/F4320337380","display_name":"Division of Mathematical Sciences","ror":"https://ror.org/051fftw81"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4287280733","https://openalex.org/W3213573742","https://openalex.org/W2128203364","https://openalex.org/W2026565050","https://openalex.org/W3136070008","https://openalex.org/W2108712229","https://openalex.org/W2161198505","https://openalex.org/W2367015181","https://openalex.org/W2048280641","https://openalex.org/W3035117168"],"abstract_inverted_index":{"Objects":[0],"manipulated":[1],"by":[2],"the":[3,18,23,27,41,57,62,66,124,171,174,192,199,233],"hand":[4,19,138,150],"(i.e.,":[5],"manipulanda)":[6],"are":[7],"particularly":[8],"challenging":[9],"to":[10,73,111,122,163],"reconstruct":[11,112],"from":[12],"Internet":[13,222],"videos.":[14],"Not":[15],"only":[16,31],"does":[17],"occlude":[20],"much":[21],"of":[22,37,61,68],"object,":[24,63],"but":[25],"also":[26],"object":[28,89,102,114,140,167,172,186],"is":[29,70,194],"often":[30],"visible":[32],"in":[33,48,80,96,116,173,206],"a":[34,84,105,143,156,161,165,207],"small":[35,71],"number":[36],"image":[38,146],"pixels.":[39],"At":[40],"same":[42],"time,":[43],"two":[44],"strong":[45],"anchors":[46],"emerge":[47],"this":[49,178],"setting:":[50],"(1)":[51],"estimated":[52],"3D":[53,101,149,166,203],"hands":[54],"help":[55],"disambiguate":[56],"location":[58],"and":[59,64,100,139,147,191,202,221,229],"scale":[60],"(2)":[65],"set":[67],"manipulanda":[69],"relative":[72],"all":[74,189],"possible":[75],"objects.":[76],"With":[77],"these":[78],"insights":[79],"mind,":[81],"we":[82,109,130,154,176],"present":[83,132],"scalable":[85],"paradigm":[86],"for":[87],"hand-held":[88,113],"reconstruction":[90],"that":[91,169,213],"builds":[92],"on":[93,219,232],"recent":[94],"breakthroughs":[95],"large":[97],"language/vision":[98],"models":[99,230],"datasets.":[103,224],"Given":[104],"monocular":[106],"RGB":[107,145],"video,":[108],"aim":[110],"geometry":[115,141,187],"3D,":[117],"over":[118],"time.":[119],"In":[120],"order":[121],"obtain":[123],"best":[125],"performing":[126],"single":[127,144],"frame":[128],"model,":[129],"first":[131],"MCC-Hand-Object":[133],"(MCCHO),":[134],"which":[135],"jointly":[136],"reconstructs":[137],"given":[142],"inferred":[148],"as":[151],"inputs.":[152],"Subsequently,":[153],"prompt":[155],"text-to-3D":[157],"generative":[158],"model":[159,168],"using":[160],"VLM":[162],"retrieve":[164],"matches":[170],"image(s);":[175],"call":[177],"alignment":[179],"Retrieval-Augmented":[180],"Reconstruction":[181],"(RAR).":[182],"RAR":[183],"provides":[184],"unified":[185],"across":[188],"frames,":[190],"result":[193],"rigidly":[195],"aligned":[196],"with":[197],"both":[198],"input":[200],"images":[201],"MCCHO":[204],"observations":[205],"temporally":[208],"consistent":[209],"manner.":[210],"Experiments":[211],"demonstrate":[212],"our":[214,227],"approach":[215],"achieves":[216],"state-of-theart":[217],"performance":[218],"lab":[220],"image/video":[223],"We":[225],"make":[226],"code":[228],"available":[231],"project":[234],"website:":[235],"https://janehwu.github.io/mcc-ho":[236]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2024-04-13T00:00:00"}
