{"id":"https://openalex.org/W7138076132","doi":"https://doi.org/10.1609/aaai.v40i12.38012","title":"DiffusionPose: Markov-Optimized Diffusion Model for Human Pose Estimation","display_name":"DiffusionPose: Markov-Optimized Diffusion Model for Human Pose Estimation","publication_year":2026,"publication_date":"2026-03-14","ids":{"openalex":"https://openalex.org/W7138076132","doi":"https://doi.org/10.1609/aaai.v40i12.38012"},"language":null,"primary_location":{"id":"doi:10.1609/aaai.v40i12.38012","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i12.38012","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/38012/41974","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://ojs.aaai.org/index.php/AAAI/article/download/38012/41974","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5129682684","display_name":"Zhigang Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhigang Wang","raw_affiliation_strings":["The State Key Laboratory of Blockchain and Data Security, Zhejiang University"],"affiliations":[{"raw_affiliation_string":"The State Key Laboratory of Blockchain and Data Security, Zhejiang University","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129728194","display_name":"Zhenguang Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I1302611135","display_name":"Ministry of Public Security of the People's Republic of China","ror":"https://ror.org/00bt9we26","country_code":"CN","type":"government","lineage":["https://openalex.org/I1302611135"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhenguang Liu","raw_affiliation_strings":["The State Key Laboratory of Blockchain and Data Security, Zhejiang University\nShandong Rendui Network Co., Ltd.\nHangzhou High-Tech Zone (Binjiang) Institute of Blockchain and Data Security"],"affiliations":[{"raw_affiliation_string":"The State Key Laboratory of Blockchain and Data Security, Zhejiang University\nShandong Rendui Network Co., Ltd.\nHangzhou High-Tech Zone (Binjiang) Institute of Blockchain and Data Security","institution_ids":["https://openalex.org/I1302611135"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100777508","display_name":"Shaojing Fan","orcid":"https://orcid.org/0000-0002-7744-1133"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Shaojing Fan","raw_affiliation_strings":["Department of Electrical and Computer Engineering, National University of Singapore"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, National University of Singapore","institution_ids":["https://openalex.org/I165932596"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129722807","display_name":"Sifan Wu","orcid":null},"institutions":[{"id":"https://openalex.org/I194450716","display_name":"Jilin University","ror":"https://ror.org/00js3aw79","country_code":"CN","type":"education","lineage":["https://openalex.org/I194450716"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Sifan Wu","raw_affiliation_strings":["College of Computer Science and Technology, Jilin University\nKey Laboratory of Symbolic Computation and Knowledge Engineering of Ministry of Education, Jilin University"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology, Jilin University\nKey Laboratory of Symbolic Computation and Knowledge Engineering of Ministry of Education, Jilin University","institution_ids":["https://openalex.org/I194450716"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5068056273","display_name":"Yingying Jiao","orcid":null},"institutions":[{"id":"https://openalex.org/I55712492","display_name":"Zhejiang University of Technology","ror":"https://ror.org/02djqfd08","country_code":"CN","type":"education","lineage":["https://openalex.org/I55712492"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yingying Jiao","raw_affiliation_strings":["College of Computer Science and Technology, Zhejiang University of Technology"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology, Zhejiang University of Technology","institution_ids":["https://openalex.org/I55712492"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5129682684"],"corresponding_institution_ids":["https://openalex.org/I76130692"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.37425595,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"40","issue":"12","first_page":"10412","last_page":"10420"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.7791000008583069,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.7791000008583069,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10114","display_name":"Balance, Gait, and Falls Prevention","score":0.02419999986886978,"subfield":{"id":"https://openalex.org/subfields/3612","display_name":"Physical Therapy, Sports Therapy and Rehabilitation"},"field":{"id":"https://openalex.org/fields/36","display_name":"Health Professions"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T11023","display_name":"Prosthetics and Rehabilitation Robotics","score":0.017999999225139618,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pose","display_name":"Pose","score":0.6933000087738037},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.645799994468689},{"id":"https://openalex.org/keywords/articulated-body-pose-estimation","display_name":"Articulated body pose estimation","score":0.5956000089645386},{"id":"https://openalex.org/keywords/3d-pose-estimation","display_name":"3D pose estimation","score":0.5734000205993652},{"id":"https://openalex.org/keywords/noise-reduction","display_name":"Noise reduction","score":0.4977000057697296},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.4544999897480011},{"id":"https://openalex.org/keywords/hidden-markov-model","display_name":"Hidden Markov model","score":0.45080000162124634},{"id":"https://openalex.org/keywords/diffusion-process","display_name":"Diffusion process","score":0.4009999930858612}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6935999989509583},{"id":"https://openalex.org/C52102323","wikidata":"https://www.wikidata.org/wiki/Q1671968","display_name":"Pose","level":2,"score":0.6933000087738037},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.667900025844574},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.645799994468689},{"id":"https://openalex.org/C22100474","wikidata":"https://www.wikidata.org/wiki/Q4800952","display_name":"Articulated body pose estimation","level":4,"score":0.5956000089645386},{"id":"https://openalex.org/C36613465","wikidata":"https://www.wikidata.org/wiki/Q4636322","display_name":"3D pose estimation","level":3,"score":0.5734000205993652},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.4977000057697296},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.4544999897480011},{"id":"https://openalex.org/C23224414","wikidata":"https://www.wikidata.org/wiki/Q176769","display_name":"Hidden Markov model","level":2,"score":0.45080000162124634},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4260999858379364},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.41269999742507935},{"id":"https://openalex.org/C68710425","wikidata":"https://www.wikidata.org/wiki/Q5275442","display_name":"Diffusion process","level":3,"score":0.4009999930858612},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.37880000472068787},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.3596999943256378},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.34940001368522644},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.3379000127315521},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.33489999175071716},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.30660000443458557},{"id":"https://openalex.org/C155846161","wikidata":"https://www.wikidata.org/wiki/Q1143367","display_name":"Graphical model","level":2,"score":0.2858000099658966},{"id":"https://openalex.org/C29265498","wikidata":"https://www.wikidata.org/wiki/Q7047719","display_name":"Noise measurement","level":3,"score":0.28139999508857727},{"id":"https://openalex.org/C98763669","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov chain","level":2,"score":0.27880001068115234},{"id":"https://openalex.org/C2778045648","wikidata":"https://www.wikidata.org/wiki/Q176827","display_name":"Markov random field","level":4,"score":0.27730000019073486},{"id":"https://openalex.org/C137836250","wikidata":"https://www.wikidata.org/wiki/Q984063","display_name":"Optimization problem","level":2,"score":0.2703000009059906},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.2567000091075897}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1609/aaai.v40i12.38012","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i12.38012","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/38012/41974","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1609/aaai.v40i12.38012","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i12.38012","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/38012/41974","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1121271761","display_name":null,"funder_award_id":"Program","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2087396116","display_name":null,"funder_award_id":"China","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3317480652","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3657713562","display_name":null,"funder_award_id":"62372402","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5994120800","display_name":null,"funder_award_id":"Natural","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W7138076132.pdf","grobid_xml":"https://content.openalex.org/works/W7138076132.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Video-based":[0],"human":[1],"pose":[2,37,57,71,111],"estimation":[3,72],"has":[4],"long":[5],"been":[6],"a":[7,66,127],"nontrivial":[8],"task":[9],"due":[10],"to":[11,35,88,106,130,139,175],"its":[12],"dynamic":[13],"nature":[14],"and":[15,22,55,91],"challenging":[16,160],"detection":[17,42],"scenarios":[18],"such":[19],"as":[20],"occlusion":[21],"defocus.":[23],"Inspired":[24],"by":[25,172],"the":[26,83,102,108,115,132,137,164,167,176,183],"success":[27],"of":[28,110,117,120,166],"diffusion":[29,46,75,104,179],"models,":[30],"researchers":[31],"have":[32],"applied":[33],"them":[34],"video":[36,70,161],"estimation,":[38],"outperforming":[39],"traditional":[40],"joint":[41,171],"methods.":[43],"However,":[44],"existing":[45],"model-based":[47,180],"methods":[48],"still":[49],"face":[50],"challenges":[51],"like":[52],"slow":[53],"convergence":[54],"unstable":[56],"generation.":[58],"To":[59],"tackle":[60],"these":[61],"issues,":[62],"we":[63],"propose":[64],"DiffusionPose,":[65],"novel":[67],"framework":[68],"for":[69],"that":[73],"integrates":[74],"models":[76],"with":[77,86],"optimization":[78],"strategies:":[79],"(1)":[80],"We":[81,96,124],"combine":[82],"emerging":[84],"Mamba":[85],"Transformers":[87],"balance":[89],"global":[90],"local":[92],"spatio-temporal":[93],"modeling.":[94],"(2)":[95],"integrate":[97],"Markov":[98,128],"Random":[99],"Fields":[100],"into":[101],"reverse":[103],"process":[105],"enhance":[107],"denoising":[109,134],"heatmaps,":[112],"particularly":[113],"addressing":[114],"issue":[116],"confused":[118],"generation":[119],"occluded":[121],"joints.":[122],"(3)":[123],"mathematically":[125],"formulate":[126],"objective":[129],"supervise":[131],"heatmap":[133],"process,":[135],"enabling":[136],"model":[138],"generate":[140],"anatomically":[141],"plausible":[142],"skeletons.":[143],"Our":[144],"method":[145,181],"achieves":[146],"state-of-the-art":[147],"performance":[148],"on":[149,182],"three":[150],"large-scale":[151],"benchmark":[152],"datasets.":[153],"Interestingly,":[154],"it":[155],"shows":[156],"surprising":[157],"robustness":[158],"in":[159],"scenarios,":[162],"improving":[163],"accuracy":[165],"most":[168],"difficult":[169],"ankle":[170],"16.9%":[173],"compared":[174],"previous":[177],"best":[178],"Challenging-PoseTrack":[184],"dataset.":[185]},"counts_by_year":[],"updated_date":"2026-04-03T22:45:19.894376","created_date":"2026-03-18T00:00:00"}
