{"id":"https://openalex.org/W4386065736","doi":"https://doi.org/10.1109/cvpr52729.2023.00215","title":"DistilPose: Tokenized Pose Regression with Heatmap Distillation","display_name":"DistilPose: Tokenized Pose Regression with Heatmap Distillation","publication_year":2023,"publication_date":"2023-06-01","ids":{"openalex":"https://openalex.org/W4386065736","doi":"https://doi.org/10.1109/cvpr52729.2023.00215"},"language":"en","primary_location":{"id":"doi:10.1109/cvpr52729.2023.00215","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cvpr52729.2023.00215","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5014036987","display_name":"Suhang Ye","orcid":null},"institutions":[{"id":"https://openalex.org/I191208505","display_name":"Xiamen University","ror":"https://ror.org/00mcjh785","country_code":"CN","type":"education","lineage":["https://openalex.org/I191208505"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Suhang Ye","raw_affiliation_strings":["Xiamen University,Key Laboratory of Multimedia Trusted Perception and Efficient Computing, Ministry of Education of China","Key Laboratory of Multimedia Trusted Perception and Efficient Computing, Ministry of Education of China, Xiamen University"],"affiliations":[{"raw_affiliation_string":"Xiamen University,Key Laboratory of Multimedia Trusted Perception and Efficient Computing, Ministry of Education of China","institution_ids":["https://openalex.org/I191208505"]},{"raw_affiliation_string":"Key Laboratory of Multimedia Trusted Perception and Efficient Computing, Ministry of Education of China, Xiamen University","institution_ids":["https://openalex.org/I191208505"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100685570","display_name":"Yingyi Zhang","orcid":"https://orcid.org/0000-0003-1398-8903"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yingyi Zhang","raw_affiliation_strings":["Tencent Youtu Lab"],"affiliations":[{"raw_affiliation_string":"Tencent Youtu Lab","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100679572","display_name":"Jie Hu","orcid":"https://orcid.org/0000-0002-3187-1656"},"institutions":[{"id":"https://openalex.org/I191208505","display_name":"Xiamen University","ror":"https://ror.org/00mcjh785","country_code":"CN","type":"education","lineage":["https://openalex.org/I191208505"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jie Hu","raw_affiliation_strings":["Xiamen University,Key Laboratory of Multimedia Trusted Perception and Efficient Computing, Ministry of Education of China","Key Laboratory of Multimedia Trusted Perception and Efficient Computing, Ministry of Education of China, Xiamen University"],"affiliations":[{"raw_affiliation_string":"Xiamen University,Key Laboratory of Multimedia Trusted Perception and Efficient Computing, Ministry of Education of China","institution_ids":["https://openalex.org/I191208505"]},{"raw_affiliation_string":"Key Laboratory of Multimedia Trusted Perception and Efficient Computing, Ministry of Education of China, Xiamen University","institution_ids":["https://openalex.org/I191208505"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014628588","display_name":"Liujuan Cao","orcid":"https://orcid.org/0000-0002-7645-9606"},"institutions":[{"id":"https://openalex.org/I191208505","display_name":"Xiamen University","ror":"https://ror.org/00mcjh785","country_code":"CN","type":"education","lineage":["https://openalex.org/I191208505"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Liujuan Cao","raw_affiliation_strings":["Xiamen University,Key Laboratory of Multimedia Trusted Perception and Efficient Computing, Ministry of Education of China","Key Laboratory of Multimedia Trusted Perception and Efficient Computing, Ministry of Education of China, Xiamen University"],"affiliations":[{"raw_affiliation_string":"Xiamen University,Key Laboratory of Multimedia Trusted Perception and Efficient Computing, Ministry of Education of China","institution_ids":["https://openalex.org/I191208505"]},{"raw_affiliation_string":"Key Laboratory of Multimedia Trusted Perception and Efficient Computing, Ministry of Education of China, Xiamen University","institution_ids":["https://openalex.org/I191208505"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012257365","display_name":"Shengchuan Zhang","orcid":"https://orcid.org/0000-0002-0824-4945"},"institutions":[{"id":"https://openalex.org/I191208505","display_name":"Xiamen University","ror":"https://ror.org/00mcjh785","country_code":"CN","type":"education","lineage":["https://openalex.org/I191208505"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shengchuan Zhang","raw_affiliation_strings":["Xiamen University,Key Laboratory of Multimedia Trusted Perception and Efficient Computing, Ministry of Education of China","Key Laboratory of Multimedia Trusted Perception and Efficient Computing, Ministry of Education of China, Xiamen University"],"affiliations":[{"raw_affiliation_string":"Xiamen University,Key Laboratory of Multimedia Trusted Perception and Efficient Computing, Ministry of Education of China","institution_ids":["https://openalex.org/I191208505"]},{"raw_affiliation_string":"Key Laboratory of Multimedia Trusted Perception and Efficient Computing, Ministry of Education of China, Xiamen University","institution_ids":["https://openalex.org/I191208505"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091517359","display_name":"Lei Shen","orcid":"https://orcid.org/0000-0002-3154-0574"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lei Shen","raw_affiliation_strings":["Tencent Youtu Lab"],"affiliations":[{"raw_affiliation_string":"Tencent Youtu Lab","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100384874","display_name":"Jun Wang","orcid":"https://orcid.org/0000-0003-1581-8369"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jun Wang","raw_affiliation_strings":["Tencent WeChat Pay Lab33"],"affiliations":[{"raw_affiliation_string":"Tencent WeChat Pay Lab33","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086397952","display_name":"Shouhong Ding","orcid":"https://orcid.org/0000-0002-3175-3553"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shouhong Ding","raw_affiliation_strings":["Tencent Youtu Lab"],"affiliations":[{"raw_affiliation_string":"Tencent Youtu Lab","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5016080094","display_name":"Rongrong Ji","orcid":"https://orcid.org/0000-0001-9163-2932"},"institutions":[{"id":"https://openalex.org/I191208505","display_name":"Xiamen University","ror":"https://ror.org/00mcjh785","country_code":"CN","type":"education","lineage":["https://openalex.org/I191208505"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Rongrong Ji","raw_affiliation_strings":["Xiamen University,Key Laboratory of Multimedia Trusted Perception and Efficient Computing, Ministry of Education of China","Key Laboratory of Multimedia Trusted Perception and Efficient Computing, Ministry of Education of China, Xiamen University"],"affiliations":[{"raw_affiliation_string":"Xiamen University,Key Laboratory of Multimedia Trusted Perception and Efficient Computing, Ministry of Education of China","institution_ids":["https://openalex.org/I191208505"]},{"raw_affiliation_string":"Key Laboratory of Multimedia Trusted Perception and Efficient Computing, Ministry of Education of China, Xiamen University","institution_ids":["https://openalex.org/I191208505"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5014036987"],"corresponding_institution_ids":["https://openalex.org/I191208505"],"apc_list":null,"apc_paid":null,"fwci":3.5666,"has_fulltext":false,"cited_by_count":29,"citation_normalized_percentile":{"value":0.94503135,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"2163","last_page":"2172"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11227","display_name":"Diabetic Foot Ulcer Assessment and Management","score":0.9955000281333923,"subfield":{"id":"https://openalex.org/subfields/2712","display_name":"Endocrinology, Diabetes and Metabolism"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T11398","display_name":"Hand Gesture Recognition Systems","score":0.9930999875068665,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8030742406845093},{"id":"https://openalex.org/keywords/regression","display_name":"Regression","score":0.6128338575363159},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5877947807312012},{"id":"https://openalex.org/keywords/regression-analysis","display_name":"Regression analysis","score":0.5487698316574097},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5233007073402405},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4898471534252167},{"id":"https://openalex.org/keywords/flops","display_name":"FLOPS","score":0.4639294743537903},{"id":"https://openalex.org/keywords/cross-validation","display_name":"Cross-validation","score":0.4120227098464966},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.38290753960609436},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.32546883821487427},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.23807069659233093},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.08380496501922607},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.08171644806861877}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8030742406845093},{"id":"https://openalex.org/C83546350","wikidata":"https://www.wikidata.org/wiki/Q1139051","display_name":"Regression","level":2,"score":0.6128338575363159},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5877947807312012},{"id":"https://openalex.org/C152877465","wikidata":"https://www.wikidata.org/wiki/Q208042","display_name":"Regression analysis","level":2,"score":0.5487698316574097},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5233007073402405},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4898471534252167},{"id":"https://openalex.org/C3826847","wikidata":"https://www.wikidata.org/wiki/Q188768","display_name":"FLOPS","level":2,"score":0.4639294743537903},{"id":"https://openalex.org/C27181475","wikidata":"https://www.wikidata.org/wiki/Q541014","display_name":"Cross-validation","level":2,"score":0.4120227098464966},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.38290753960609436},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.32546883821487427},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.23807069659233093},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.08380496501922607},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.08171644806861877},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cvpr52729.2023.00215","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cvpr52729.2023.00215","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.6299999952316284,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[{"id":"https://openalex.org/G4229650515","display_name":null,"funder_award_id":"2022ZD0118202","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"},{"id":"https://openalex.org/G6075090814","display_name":null,"funder_award_id":"62025603","funder_id":"https://openalex.org/F4320336125","funder_display_name":"National Science Fund for Distinguished Young Scholars"},{"id":"https://openalex.org/G734838997","display_name":null,"funder_award_id":"U21B2037,U22B2051,62176222,62176223,62176226,62072386,62072387,62072389,62002305,62272401","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320323021","display_name":"Nankai University","ror":"https://ror.org/01y1kjr75"},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null},{"id":"https://openalex.org/F4320336125","display_name":"National Science Fund for Distinguished Young Scholars","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":44,"referenced_works":["https://openalex.org/W1821462560","https://openalex.org/W1861492603","https://openalex.org/W1936750108","https://openalex.org/W1983363688","https://openalex.org/W2113325037","https://openalex.org/W2119350939","https://openalex.org/W2136391815","https://openalex.org/W2307770531","https://openalex.org/W2578797046","https://openalex.org/W2916798096","https://openalex.org/W2963402313","https://openalex.org/W2963598138","https://openalex.org/W2964062189","https://openalex.org/W2988211500","https://openalex.org/W2993728126","https://openalex.org/W3010526057","https://openalex.org/W3034742259","https://openalex.org/W3034750257","https://openalex.org/W3158818292","https://openalex.org/W3172801447","https://openalex.org/W3176892444","https://openalex.org/W3187458216","https://openalex.org/W3203925315","https://openalex.org/W4200254818","https://openalex.org/W4214508443","https://openalex.org/W4224992933","https://openalex.org/W4229890965","https://openalex.org/W4285300683","https://openalex.org/W4292787098","https://openalex.org/W4312914534","https://openalex.org/W4313119505","https://openalex.org/W4385245566","https://openalex.org/W6638523607","https://openalex.org/W6639102338","https://openalex.org/W6697925102","https://openalex.org/W6739901393","https://openalex.org/W6745881451","https://openalex.org/W6750378959","https://openalex.org/W6760424586","https://openalex.org/W6769884363","https://openalex.org/W6794073987","https://openalex.org/W6796721132","https://openalex.org/W6809664228","https://openalex.org/W6810565296"],"related_works":["https://openalex.org/W4289356671","https://openalex.org/W2389155397","https://openalex.org/W2165884543","https://openalex.org/W2312753042","https://openalex.org/W3186837933","https://openalex.org/W2368989808","https://openalex.org/W2034959125","https://openalex.org/W2355687852","https://openalex.org/W3174513558","https://openalex.org/W2114200869"],"abstract_inverted_index":{"In":[0,37],"the":[1,52,62,67,72,85,115,121,124,132],"field":[2],"of":[3,14,24,30,64,88,123],"human":[4,44],"pose":[5,45],"estimation,":[6],"regression-based":[7,57,91,125,183],"methods":[8,18],"have":[9],"been":[10],"dominated":[11],"in":[12,22],"terms":[13,23],"speed,":[15],"while":[16,96,127],"heatmap-based":[17,55,89],"are":[19],"far":[20],"ahead":[21],"performance.":[25],"How":[26],"to":[27,71],"take":[28],"advantage":[29],"both":[31],"schemes":[32],"remains":[33],"a":[34,42,178],"challenging":[35],"problem.":[36],"this":[38],"paper,":[39],"we":[40],"propose":[41],"novel":[43],"estimation":[46],"framework":[47],"termed":[48],"DistilPose,":[49],"which":[50,148],"bridges":[51],"gaps":[53],"between":[54],"and":[56,80,90,103,145,154],"methods.":[58],"Specifically,":[59,130],"DistilPose":[60,117],"maximizes":[61],"transfer":[63,99],"knowledge":[65],"from":[66,105],"teacher":[68,106,160],"model":[69,74,161],"(heatmap-based)":[70],"student":[73,109],"(regression-based)":[75],"through":[76],"Token-distilling":[77],"Encoder":[78],"(TDE)":[79],"Simulated":[81,97],"Heatmaps.":[82],"TDE":[83],"aligns":[84],"feature":[86],"spaces":[87],"models":[92,126],"by":[93],"introducing":[94],"tokenization,":[95],"Heatmaps":[98],"explicit":[100],"guidance":[101],"(distribution":[102],"confidence)":[104],"heatmaps":[107],"into":[108],"models.":[110,184],"Extensive":[111],"experiments":[112],"show":[113],"that":[114],"proposed":[116],"can":[118],"significantly":[119],"improve":[120],"performance":[122,166],"maintaining":[128],"efficiency.":[129],"on":[131,173],"MSCOCO":[133,174],"validation":[134,175],"dataset,":[135,176],"DistilPose-S":[136],"obtains":[137,170],"71.6%":[138],"mAP":[139,172],"with":[140,162],"5.36M":[141],"parameters,":[142],"2.38":[143],"GFLOPs,":[144],"40.2":[146],"FPS,":[147],"saves":[149],"12.95\u00d7,":[150],"7.16\u00d7":[151],"computational":[152],"cost":[153],"is":[155],"4.9\u00d7":[156],"faster":[157],"than":[158],"its":[159],"only":[163],"0.9":[164],"points":[165],"drop.":[167],"Furthermore,":[168],"DistilPose-L":[169],"74.4%":[171],"achieving":[177],"new":[179],"state-of-the-art":[180],"among":[181],"predominant":[182],"Code":[185],"will":[186],"be":[187],"available":[188],"at":[189],"https://github.com/yshMars/DistilPose.":[190]},"counts_by_year":[{"year":2025,"cited_by_count":13},{"year":2024,"cited_by_count":11},{"year":2023,"cited_by_count":5}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
