{"id":"https://openalex.org/W4312851679","doi":"https://doi.org/10.1109/tcsvt.2022.3213206","title":"UformPose: A U-Shaped Hierarchical Multi-Scale Keypoint-Aware Framework for Human Pose Estimation","display_name":"UformPose: A U-Shaped Hierarchical Multi-Scale Keypoint-Aware Framework for Human Pose Estimation","publication_year":2022,"publication_date":"2022-10-10","ids":{"openalex":"https://openalex.org/W4312851679","doi":"https://doi.org/10.1109/tcsvt.2022.3213206"},"language":"en","primary_location":{"id":"doi:10.1109/tcsvt.2022.3213206","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2022.3213206","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5082708885","display_name":"Youjie Wang","orcid":"https://orcid.org/0000-0001-7031-2972"},"institutions":[{"id":"https://openalex.org/I119045251","display_name":"Huaqiao University","ror":"https://ror.org/03frdh605","country_code":"CN","type":"education","lineage":["https://openalex.org/I119045251"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"You-Jie Wang","raw_affiliation_strings":["Key Laboratory for Computer Vision and Pattern Recognition and the College of Computer Science and Technology, Huaqiao University, Xiamen, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory for Computer Vision and Pattern Recognition and the College of Computer Science and Technology, Huaqiao University, Xiamen, China","institution_ids":["https://openalex.org/I119045251"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091302785","display_name":"Yanmin Luo","orcid":"https://orcid.org/0000-0001-7596-3299"},"institutions":[{"id":"https://openalex.org/I119045251","display_name":"Huaqiao University","ror":"https://ror.org/03frdh605","country_code":"CN","type":"education","lineage":["https://openalex.org/I119045251"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yan-Min Luo","raw_affiliation_strings":["Key Laboratory for Computer Vision and Pattern Recognition and the College of Computer Science and Technology, Huaqiao University, Xiamen, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory for Computer Vision and Pattern Recognition and the College of Computer Science and Technology, Huaqiao University, Xiamen, China","institution_ids":["https://openalex.org/I119045251"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002400033","display_name":"Guihu Bai","orcid":null},"institutions":[{"id":"https://openalex.org/I119045251","display_name":"Huaqiao University","ror":"https://ror.org/03frdh605","country_code":"CN","type":"education","lineage":["https://openalex.org/I119045251"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Gui-Hu Bai","raw_affiliation_strings":["Key Laboratory for Computer Vision and Pattern Recognition and the College of Computer Science and Technology, Huaqiao University, Xiamen, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory for Computer Vision and Pattern Recognition and the College of Computer Science and Technology, Huaqiao University, Xiamen, China","institution_ids":["https://openalex.org/I119045251"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5089868194","display_name":"Jing-Ming Guo","orcid":"https://orcid.org/0000-0002-8041-6326"},"institutions":[{"id":"https://openalex.org/I154864474","display_name":"National Taiwan University of Science and Technology","ror":"https://ror.org/00q09pe49","country_code":"TW","type":"education","lineage":["https://openalex.org/I154864474"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Jing-Ming Guo","raw_affiliation_strings":["Department of Electrical Engineering, National Taiwan University of Science and Technology, Taipei, Taiwan"],"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, National Taiwan University of Science and Technology, Taipei, Taiwan","institution_ids":["https://openalex.org/I154864474"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5082708885"],"corresponding_institution_ids":["https://openalex.org/I119045251"],"apc_list":null,"apc_paid":null,"fwci":2.0132,"has_fulltext":false,"cited_by_count":22,"citation_normalized_percentile":{"value":0.88238692,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":100},"biblio":{"volume":"33","issue":"4","first_page":"1697","last_page":"1709"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7840306162834167},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.7597554922103882},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7219762206077576},{"id":"https://openalex.org/keywords/pose","display_name":"Pose","score":0.7204108834266663},{"id":"https://openalex.org/keywords/pyramid","display_name":"Pyramid (geometry)","score":0.6851342916488647},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5329201221466064},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.4430190920829773},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.41979825496673584},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.41863563656806946},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.4176506996154785},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.41338881850242615},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.40448102355003357},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.09643247723579407},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.067446768283844}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7840306162834167},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.7597554922103882},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7219762206077576},{"id":"https://openalex.org/C52102323","wikidata":"https://www.wikidata.org/wiki/Q1671968","display_name":"Pose","level":2,"score":0.7204108834266663},{"id":"https://openalex.org/C142575187","wikidata":"https://www.wikidata.org/wiki/Q3358290","display_name":"Pyramid (geometry)","level":2,"score":0.6851342916488647},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5329201221466064},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.4430190920829773},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.41979825496673584},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.41863563656806946},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.4176506996154785},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.41338881850242615},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.40448102355003357},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.09643247723579407},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.067446768283844},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C58640448","wikidata":"https://www.wikidata.org/wiki/Q42515","display_name":"Cartography","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcsvt.2022.3213206","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2022.3213206","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Partnerships for the goals","score":0.5199999809265137,"id":"https://metadata.un.org/sdg/17"}],"awards":[{"id":"https://openalex.org/G8006388478","display_name":null,"funder_award_id":"2020J01082","funder_id":"https://openalex.org/F4320321878","funder_display_name":"Natural Science Foundation of Fujian Province"}],"funders":[{"id":"https://openalex.org/F4320321878","display_name":"Natural Science Foundation of Fujian Province","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":60,"referenced_works":["https://openalex.org/W1522301498","https://openalex.org/W1861492603","https://openalex.org/W1901129140","https://openalex.org/W2112796928","https://openalex.org/W2175012183","https://openalex.org/W2194775991","https://openalex.org/W2307770531","https://openalex.org/W2559085405","https://openalex.org/W2617321867","https://openalex.org/W2891330063","https://openalex.org/W2907137919","https://openalex.org/W2916798096","https://openalex.org/W2942932288","https://openalex.org/W2962820842","https://openalex.org/W2962954622","https://openalex.org/W2963073614","https://openalex.org/W2963150697","https://openalex.org/W2963402313","https://openalex.org/W2963598138","https://openalex.org/W2963781481","https://openalex.org/W2964105113","https://openalex.org/W2964221239","https://openalex.org/W2964297864","https://openalex.org/W2964304707","https://openalex.org/W2986760165","https://openalex.org/W3022710535","https://openalex.org/W3034399482","https://openalex.org/W3034750257","https://openalex.org/W3039961680","https://openalex.org/W3092462694","https://openalex.org/W3117707723","https://openalex.org/W3131500599","https://openalex.org/W3136416617","https://openalex.org/W3138516171","https://openalex.org/W3159818808","https://openalex.org/W3171707680","https://openalex.org/W3176892444","https://openalex.org/W3199613405","https://openalex.org/W3203572876","https://openalex.org/W3203925315","https://openalex.org/W3206810688","https://openalex.org/W4213207977","https://openalex.org/W4214588794","https://openalex.org/W4229911490","https://openalex.org/W4287259027","https://openalex.org/W4293584584","https://openalex.org/W4312950730","https://openalex.org/W6631190155","https://openalex.org/W6729677316","https://openalex.org/W6730410022","https://openalex.org/W6739901393","https://openalex.org/W6750227808","https://openalex.org/W6754577284","https://openalex.org/W6757658208","https://openalex.org/W6761440607","https://openalex.org/W6784094891","https://openalex.org/W6787906798","https://openalex.org/W6791517108","https://openalex.org/W6801589178","https://openalex.org/W6802010497"],"related_works":["https://openalex.org/W2123263858","https://openalex.org/W3127959533","https://openalex.org/W4249847449","https://openalex.org/W2894986065","https://openalex.org/W44395729","https://openalex.org/W4387967917","https://openalex.org/W4287600488","https://openalex.org/W4206776094","https://openalex.org/W1996690921","https://openalex.org/W3121197456"],"abstract_inverted_index":{"Human":[0],"pose":[1,34,143],"estimation":[2,35,144],"is":[3,64],"a":[4,32,65],"fundamental":[5],"yet":[6],"challenging":[7],"task":[8],"in":[9,163],"computer":[10],"vision.":[11],"However,":[12],"difficult":[13],"scenarios":[14],"such":[15],"as":[16],"invisible":[17],"keypoints,":[18],"occlusions":[19],"and":[20,55,81,126,152],"small-scale":[21],"persons":[22],"are":[23],"still":[24],"not":[25],"well-handed.":[26],"In":[27],"this":[28],"paper,":[29],"we":[30,113],"present":[31],"novel":[33],"framework":[36,139],"named":[37],"UformPose":[38,45],"which":[39,123],"targets":[40],"to":[41,72,93],"relieve":[42],"these":[43],"issues.":[44],"has":[46],"two":[47],"core":[48],"designs:":[49],"Shared":[50],"Feature":[51],"Pyramid":[52],"Stem":[53],"(SFPS)":[54],"U-shaped":[56],"hierarchical":[57],"Multi-scale":[58],"Keypoint-aware":[59],"Attention":[60],"Module":[61],"(U-MKAM).":[62],"SFPS":[63],"feature":[66,103],"pyramid":[67],"stem":[68],"with":[69],"shared":[70,83],"mechanism":[71,84],"learn":[73],"stronger":[74],"low-level":[75],"features":[76],"at":[77],"the":[78,82,106,115,128,135,141,147,158],"initial":[79],"stage,":[80],"can":[85],"facilitate":[86],"cross-resolution":[87],"commonality":[88],"learning.":[89],"Our":[90],"U-MKAM":[91],"attempts":[92],"generate":[94],"high-quality":[95],"high-resolution":[96],"representations":[97],"by":[98,109],"integrating":[99],"all":[100],"levels":[101],"of":[102,105,117,137,160],"representation":[104],"backbone":[107],"layer":[108],"layer.":[110],"More":[111],"importantly,":[112],"utilize":[114],"flexibility":[116],"attention":[118],"operations":[119],"for":[120],"keypoint-aware":[121],"modeling,":[122],"explicitly":[124],"captures":[125],"trades-offs":[127],"dependencies":[129],"between":[130],"keypoints.":[131],"We":[132],"empirically":[133],"demonstrate":[134,157],"effectiveness":[136],"our":[138,161],"through":[140],"competitive":[142],"results":[145],"on":[146,155],"COCO":[148],"dataset.":[149],"Extensive":[150],"experiments":[151],"visual":[153],"analysis":[154],"CrowdPose":[156],"robustness":[159],"model":[162],"crowd":[164],"scenes.":[165]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":5},{"year":2024,"cited_by_count":9},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
