{"id":"https://openalex.org/W4416286421","doi":"https://doi.org/10.1109/tpami.2025.3633453","title":"MADiff: Motion-Aware Mamba Diffusion Models for Hand Trajectory Prediction on Egocentric Videos","display_name":"MADiff: Motion-Aware Mamba Diffusion Models for Hand Trajectory Prediction on Egocentric Videos","publication_year":2025,"publication_date":"2025-11-17","ids":{"openalex":"https://openalex.org/W4416286421","doi":"https://doi.org/10.1109/tpami.2025.3633453","pmid":"https://pubmed.ncbi.nlm.nih.gov/41247909"},"language":"en","primary_location":{"id":"doi:10.1109/tpami.2025.3633453","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2025.3633453","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5059313602","display_name":"Junyi Ma","orcid":"https://orcid.org/0000-0002-2453-0001"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]},{"id":"https://openalex.org/I4210157642","display_name":"Institute of Automation","ror":"https://ror.org/056qj1t15","country_code":"DE","type":"facility","lineage":["https://openalex.org/I4210157642","https://openalex.org/I78650965"]}],"countries":["CN","DE"],"is_corresponding":true,"raw_author_name":"Junyi Ma","raw_affiliation_strings":["IRMV Lab, School of Automation and Intelligent Sensing, Shanghai Jiao Tong University, Shanghai, China","IRMV Lab, the Department of AutomationShanghai Jiao Tong University"],"affiliations":[{"raw_affiliation_string":"IRMV Lab, School of Automation and Intelligent Sensing, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]},{"raw_affiliation_string":"IRMV Lab, the Department of AutomationShanghai Jiao Tong University","institution_ids":["https://openalex.org/I4210157642"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032262344","display_name":"Xieyuanli Chen","orcid":"https://orcid.org/0000-0003-0955-6681"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]},{"id":"https://openalex.org/I4210145386","display_name":"National Intelligence University","ror":"https://ror.org/049sfwc36","country_code":"US","type":"education","lineage":["https://openalex.org/I4210145386"]}],"countries":["CN","US"],"is_corresponding":false,"raw_author_name":"Xieyuanli Chen","raw_affiliation_strings":["College of Intelligence Science and Technology, National University of Defense Technology, Changsha, China","College of Intelligence Science and TechnologyNational University of Defense Technology"],"affiliations":[{"raw_affiliation_string":"College of Intelligence Science and Technology, National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]},{"raw_affiliation_string":"College of Intelligence Science and TechnologyNational University of Defense Technology","institution_ids":["https://openalex.org/I4210145386"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009570447","display_name":"Wentao Bao","orcid":"https://orcid.org/0000-0003-2571-3341"},"institutions":[{"id":"https://openalex.org/I1298563314","display_name":"ActionAid","ror":"https://ror.org/01pgn1y88","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I1298563314"]},{"id":"https://openalex.org/I4210093880","display_name":"Research for Action","ror":"https://ror.org/00jc5v027","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I4210093880"]},{"id":"https://openalex.org/I87216513","display_name":"Michigan State University","ror":"https://ror.org/05hs6h993","country_code":"US","type":"education","lineage":["https://openalex.org/I87216513"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Wentao Bao","raw_affiliation_strings":["ACTION Lab, Department of Computer Science and Engineering, Michigan State University, MI, USA","ACTION Lab, the Department of Computer Science and EngineeringMichigan State University"],"affiliations":[{"raw_affiliation_string":"ACTION Lab, Department of Computer Science and Engineering, Michigan State University, MI, USA","institution_ids":["https://openalex.org/I4210093880","https://openalex.org/I87216513"]},{"raw_affiliation_string":"ACTION Lab, the Department of Computer Science and EngineeringMichigan State University","institution_ids":["https://openalex.org/I1298563314"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100610904","display_name":"Jingyi Xu","orcid":"https://orcid.org/0000-0001-6082-4181"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jingyi Xu","raw_affiliation_strings":["Department of Electronic Engineering, Shanghai Jiao Tong University, Shanghai, China","Department of Electronic EngineeringShanghai Jiao Tong University"],"affiliations":[{"raw_affiliation_string":"Department of Electronic Engineering, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]},{"raw_affiliation_string":"Department of Electronic EngineeringShanghai Jiao Tong University","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5107772128","display_name":"Hesheng Wang","orcid":"https://orcid.org/0000-0002-9959-1634"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]},{"id":"https://openalex.org/I4210157642","display_name":"Institute of Automation","ror":"https://ror.org/056qj1t15","country_code":"DE","type":"facility","lineage":["https://openalex.org/I4210157642","https://openalex.org/I78650965"]}],"countries":["CN","DE"],"is_corresponding":false,"raw_author_name":"Hesheng Wang","raw_affiliation_strings":["IRMV Lab, School of Automation and Intelligent Sensing, Shanghai Jiao Tong University, Shanghai, China","IRMV Lab, the Department of AutomationShanghai Jiao Tong University"],"affiliations":[{"raw_affiliation_string":"IRMV Lab, School of Automation and Intelligent Sensing, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]},{"raw_affiliation_string":"IRMV Lab, the Department of AutomationShanghai Jiao Tong University","institution_ids":["https://openalex.org/I4210157642"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5059313602"],"corresponding_institution_ids":["https://openalex.org/I183067930","https://openalex.org/I4210157642"],"apc_list":null,"apc_paid":null,"fwci":7.0483,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.97196464,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":98},"biblio":{"volume":"48","issue":"3","first_page":"3250","last_page":"3267"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9017000198364258,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9017000198364258,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.02459999918937683,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.024299999698996544,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.7063999772071838},{"id":"https://openalex.org/keywords/affordance","display_name":"Affordance","score":0.6141999959945679},{"id":"https://openalex.org/keywords/trajectory","display_name":"Trajectory","score":0.6126000285148621},{"id":"https://openalex.org/keywords/embodied-cognition","display_name":"Embodied cognition","score":0.4375999867916107},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.4066999852657318},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.37310001254081726},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.3666999936103821}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7573000192642212},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7305999994277954},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.7063999772071838},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6186000108718872},{"id":"https://openalex.org/C194995250","wikidata":"https://www.wikidata.org/wiki/Q531136","display_name":"Affordance","level":2,"score":0.6141999959945679},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.6126000285148621},{"id":"https://openalex.org/C100609095","wikidata":"https://www.wikidata.org/wiki/Q1335050","display_name":"Embodied cognition","level":2,"score":0.4375999867916107},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.4066999852657318},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.37310001254081726},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.3666999936103821},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.31700000166893005},{"id":"https://openalex.org/C2777735758","wikidata":"https://www.wikidata.org/wiki/Q817765","display_name":"Path (computing)","level":2,"score":0.3100999891757965},{"id":"https://openalex.org/C108154423","wikidata":"https://www.wikidata.org/wiki/Q1469792","display_name":"Salience (neuroscience)","level":2,"score":0.3077999949455261},{"id":"https://openalex.org/C2781271823","wikidata":"https://www.wikidata.org/wiki/Q138081","display_name":"Waypoint","level":2,"score":0.3070000112056732},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.2621000111103058},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.2612000107765198},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2524999976158142}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tpami.2025.3633453","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2025.3633453","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},{"id":"pmid:41247909","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/41247909","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on pattern analysis and machine intelligence","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":75,"referenced_works":["https://openalex.org/W1510835000","https://openalex.org/W2055111849","https://openalex.org/W2071634722","https://openalex.org/W2085261163","https://openalex.org/W2136668269","https://openalex.org/W2151103935","https://openalex.org/W2194775991","https://openalex.org/W2605973302","https://openalex.org/W2736345552","https://openalex.org/W2741156154","https://openalex.org/W2763331099","https://openalex.org/W2768683308","https://openalex.org/W2777926144","https://openalex.org/W2895299763","https://openalex.org/W2896457183","https://openalex.org/W2914885528","https://openalex.org/W2963337691","https://openalex.org/W3005621653","https://openalex.org/W3013785695","https://openalex.org/W3021065276","https://openalex.org/W3034891989","https://openalex.org/W3037046522","https://openalex.org/W3096609285","https://openalex.org/W3109667662","https://openalex.org/W3132408010","https://openalex.org/W3138516171","https://openalex.org/W3139491754","https://openalex.org/W3170924787","https://openalex.org/W3184612208","https://openalex.org/W3202237431","https://openalex.org/W3204872899","https://openalex.org/W3205786327","https://openalex.org/W3207758636","https://openalex.org/W4214751560","https://openalex.org/W4233641747","https://openalex.org/W4312255464","https://openalex.org/W4312309917","https://openalex.org/W4312769771","https://openalex.org/W4312923690","https://openalex.org/W4312928145","https://openalex.org/W4313024976","https://openalex.org/W4383108698","https://openalex.org/W4385245566","https://openalex.org/W4385789109","https://openalex.org/W4385801288","https://openalex.org/W4386065350","https://openalex.org/W4386066475","https://openalex.org/W4386072118","https://openalex.org/W4386075525","https://openalex.org/W4386076108","https://openalex.org/W4386076596","https://openalex.org/W4386172462","https://openalex.org/W4386180992","https://openalex.org/W4387741824","https://openalex.org/W4388430502","https://openalex.org/W4389518872","https://openalex.org/W4390872031","https://openalex.org/W4390872045","https://openalex.org/W4390872828","https://openalex.org/W4390889757","https://openalex.org/W4393078841","https://openalex.org/W4394596846","https://openalex.org/W4394625615","https://openalex.org/W4394625740","https://openalex.org/W4396215030","https://openalex.org/W4396594800","https://openalex.org/W4400527593","https://openalex.org/W4402660087","https://openalex.org/W4402775763","https://openalex.org/W4402996870","https://openalex.org/W4403337227","https://openalex.org/W4403488223","https://openalex.org/W4403908521","https://openalex.org/W4405386924","https://openalex.org/W4416748449"],"related_works":[],"abstract_inverted_index":{"Understanding":[0],"human":[1,33,48],"intentions":[2,49],"and":[3,42,71,141,155,175],"actions":[4],"through":[5],"egocentric":[6,21,59],"videos":[7,60],"is":[8,55,65,115,127],"important":[9],"on":[10,168],"the":[11,72,80,112,123,137,173,190],"path":[12],"to":[13,77,129,158,189],"embodied":[14],"artificial":[15],"intelligence.":[16],"As":[17],"a":[18,28,91,149],"branch":[19],"of":[20,74,82],"vision":[22],"techniques,":[23],"hand":[24,83,93,102,186],"trajectory":[25,94],"prediction":[26,95],"plays":[27],"vital":[29],"role":[30],"in":[31,39,111],"comprehending":[32],"motion":[34],"patterns,":[35],"benefiting":[36],"downstream":[37],"tasks":[38],"extended":[40],"reality":[41],"robot":[43],"manipulation.":[44],"However,":[45],"capturing":[46],"high-level":[47,160],"consistent":[50],"with":[51,104,172],"reasonable":[52,185],"temporal":[53],"causality":[54],"challenging":[56],"when":[57],"only":[58],"are":[61],"available.":[62],"This":[63],"difficulty":[64],"exacerbated":[66],"under":[67],"camera":[68,124],"egomotion":[69,126],"interference":[70],"absence":[73],"affordance":[75,145],"labels":[76],"explicitly":[78],"guide":[79],"optimization":[81],"waypoint":[84],"distribution.":[85],"In":[86],"this":[87],"work,":[88],"we":[89,147],"propose":[90],"novel":[92],"method":[96],"dubbed":[97],"MADiff,":[98],"which":[99],"forecasts":[100],"future":[101],"waypoints":[103],"diffusion":[105],"models.":[106],"The":[107],"devised":[108],"denoising":[109],"operation":[110],"latent":[113],"space":[114],"achieved":[116],"by":[117],"our":[118,176],"proposed":[119],"motion-aware":[120],"Mamba,":[121],"where":[122],"wearer's":[125],"integrated":[128],"achieve":[130],"motion-driven":[131],"selective":[132],"scan":[133],"(MDSS).":[134],"To":[135],"discern":[136],"relationship":[138],"between":[139],"hands":[140],"scenarios":[142],"without":[143],"explicit":[144],"supervision,":[146],"leverage":[148],"foundation":[150],"model":[151],"that":[152,181],"fuses":[153],"visual":[154],"language":[156],"features":[157],"capture":[159],"semantics":[161],"from":[162],"video":[163],"clips.":[164],"Comprehensive":[165],"experiments":[166],"conducted":[167],"five":[169],"public":[170],"datasets":[171],"existing":[174],"new":[177],"evaluation":[178],"metrics":[179],"demonstrate":[180],"MADiff":[182],"predicts":[183],"comparably":[184],"trajectories":[187],"compared":[188],"state-of-the-art":[191],"baselines.":[192]},"counts_by_year":[{"year":2025,"cited_by_count":5}],"updated_date":"2026-03-09T08:58:05.943551","created_date":"2025-11-17T00:00:00"}
