{"id":"https://openalex.org/W4414829299","doi":"https://doi.org/10.48550/arxiv.2504.08654","title":"The Invisible EgoHand: 3D Hand Forecasting through EgoBody Pose Estimation","display_name":"The Invisible EgoHand: 3D Hand Forecasting through EgoBody Pose Estimation","publication_year":2025,"publication_date":"2025-04-11","ids":{"openalex":"https://openalex.org/W4414829299","doi":"https://doi.org/10.48550/arxiv.2504.08654"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2504.08654","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2504.08654","pdf_url":"https://arxiv.org/pdf/2504.08654","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2504.08654","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5076456457","display_name":"Masashi Hatano","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Hatano, Masashi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038683560","display_name":"Zhifan Zhu","orcid":"https://orcid.org/0000-0002-0508-128X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhu, Zhifan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005819073","display_name":"Hideo Sait\u00f4","orcid":"https://orcid.org/0000-0002-2421-9862"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Saito, Hideo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5003103666","display_name":"Dima Damen","orcid":"https://orcid.org/0000-0001-8804-6238"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Damen, Dima","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5076456457"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9860000014305115,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9860000014305115,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.9758999943733215,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10648","display_name":"Virtual Reality Applications and Impacts","score":0.9465000033378601,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pose","display_name":"Pose","score":0.6777999997138977},{"id":"https://openalex.org/keywords/articulated-body-pose-estimation","display_name":"Articulated body pose estimation","score":0.6676999926567078},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.6420000195503235},{"id":"https://openalex.org/keywords/trajectory","display_name":"Trajectory","score":0.5066999793052673},{"id":"https://openalex.org/keywords/perspective","display_name":"Perspective (graphical)","score":0.4706999957561493},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.4047999978065491},{"id":"https://openalex.org/keywords/reprojection-error","display_name":"Reprojection error","score":0.3862999975681305}],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7426000237464905},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.705299973487854},{"id":"https://openalex.org/C52102323","wikidata":"https://www.wikidata.org/wiki/Q1671968","display_name":"Pose","level":2,"score":0.6777999997138977},{"id":"https://openalex.org/C22100474","wikidata":"https://www.wikidata.org/wiki/Q4800952","display_name":"Articulated body pose estimation","level":4,"score":0.6676999926567078},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.6420000195503235},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6190999746322632},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.5066999793052673},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.4706999957561493},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.4047999978065491},{"id":"https://openalex.org/C23903533","wikidata":"https://www.wikidata.org/wiki/Q17122739","display_name":"Reprojection error","level":3,"score":0.3862999975681305},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.3831999897956848},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.3409000039100647},{"id":"https://openalex.org/C123403432","wikidata":"https://www.wikidata.org/wiki/Q654068","display_name":"Visibility","level":2,"score":0.3398999869823456},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.2924000024795532},{"id":"https://openalex.org/C36613465","wikidata":"https://www.wikidata.org/wiki/Q4636322","display_name":"3D pose estimation","level":3,"score":0.28999999165534973},{"id":"https://openalex.org/C48007421","wikidata":"https://www.wikidata.org/wiki/Q676252","display_name":"Motion capture","level":3,"score":0.25780001282691956},{"id":"https://openalex.org/C10161872","wikidata":"https://www.wikidata.org/wiki/Q557891","display_name":"Motion estimation","level":2,"score":0.25699999928474426},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.2515000104904175}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2504.08654","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2504.08654","pdf_url":"https://arxiv.org/pdf/2504.08654","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2504.08654","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2504.08654","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2504.08654","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2504.08654","pdf_url":"https://arxiv.org/pdf/2504.08654","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Forecasting":[0],"hand":[1,45,136,141,151,178,207,213],"motion":[2,114],"and":[3,26,71,82,107,115,142,153,177,185,197,210],"pose":[4,127,214],"from":[5,76],"an":[6,77],"egocentric":[7,78],"perspective":[8],"is":[9],"essential":[10],"for":[11,95,117,150,206,212],"understanding":[12],"human":[13],"intention.":[14],"However,":[15],"existing":[16],"methods":[17],"focus":[18],"solely":[19],"on":[20,135,169,182,187],"predicting":[21],"positions":[22,46],"without":[23],"considering":[24],"articulation,":[25],"only":[27],"when":[28,52,162],"the":[29,34,41,56,68,85,104,121,140,160,170,193,200],"hands":[30,75,119,163],"are":[31,54,164],"visible":[32],"in":[33,81,202],"field":[35,86],"of":[36,73,84,87,120,204],"view.":[37,58,88],"This":[38],"limitation":[39],"overlooks":[40],"fact":[42],"that":[43,158],"approximate":[44],"can":[47],"still":[48],"be":[49],"inferred":[50],"even":[51],"they":[53],"outside":[55],"camera's":[57],"In":[59],"this":[60],"paper,":[61],"we":[62],"propose":[63,90],"a":[64,91,147,154],"method":[65],"to":[66,132],"forecast":[67],"3D":[69,113],"trajectories":[70],"poses":[72,116],"both":[74,80,118],"video,":[79],"out":[83],"We":[89,124,138,166,180],"diffusion-based":[92],"transformer":[93],"architecture":[94],"Egocentric":[96],"Hand":[97],"Forecasting,":[98],"EgoH4,":[99],"which":[100],"takes":[101],"as":[102],"input":[103],"observation":[105],"sequence":[106],"camera":[108,122],"poses,":[109],"then":[110],"predicts":[111],"future":[112],"wearer.":[123],"leverage":[125],"full-body":[126],"information,":[128],"allowing":[129],"other":[130],"joints":[131,144,152],"provide":[133],"constraints":[134],"motion.":[137],"denoise":[139],"body":[143,176],"along":[145],"with":[146,175],"visibility":[148],"predictor":[149],"3D-to-2D":[155],"reprojection":[156],"loss":[157],"minimizes":[159],"error":[161],"in-view.":[165],"evaluate":[167,186],"EgoH4":[168,191],"Ego-Exo4D":[171],"dataset,":[172],"combining":[173],"subsets":[174],"annotations.":[179],"train":[181],"156K":[183],"sequences":[184],"34K":[188],"sequences,":[189],"respectively.":[190],"improves":[192],"performance":[194],"by":[195],"3.4cm":[196],"5.1cm":[198],"over":[199],"baseline":[201],"terms":[203],"ADE":[205],"trajectory":[208],"forecasting":[209],"MPJPE":[211],"forecasting.":[215],"Project":[216],"page:":[217],"https://masashi-hatano.github.io/EgoH4/":[218]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-04-14T08:04:32.555800","created_date":"2025-10-10T00:00:00"}
