{"id":"https://openalex.org/W4387272119","doi":"https://doi.org/10.1109/tmm.2023.3321438","title":"Global and Local Spatio-Temporal Encoder for 3D Human Pose Estimation","display_name":"Global and Local Spatio-Temporal Encoder for 3D Human Pose Estimation","publication_year":2023,"publication_date":"2023-10-02","ids":{"openalex":"https://openalex.org/W4387272119","doi":"https://doi.org/10.1109/tmm.2023.3321438"},"language":"en","primary_location":{"id":"doi:10.1109/tmm.2023.3321438","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2023.3321438","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5001918537","display_name":"Yong Wang","orcid":"https://orcid.org/0000-0002-7847-3807"},"institutions":[{"id":"https://openalex.org/I50632499","display_name":"Chongqing University of Technology","ror":"https://ror.org/04vgbd477","country_code":"CN","type":"education","lineage":["https://openalex.org/I50632499"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yong Wang","raw_affiliation_strings":["School of Artificial Intelligence, Chongqing University of Technology, Chongqing, China"],"raw_orcid":"https://orcid.org/0000-0002-7847-3807","affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, Chongqing University of Technology, Chongqing, China","institution_ids":["https://openalex.org/I50632499"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023482373","display_name":"Hongbo Kang","orcid":"https://orcid.org/0000-0001-5771-3886"},"institutions":[{"id":"https://openalex.org/I50632499","display_name":"Chongqing University of Technology","ror":"https://ror.org/04vgbd477","country_code":"CN","type":"education","lineage":["https://openalex.org/I50632499"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hongbo Kang","raw_affiliation_strings":["School of Artificial Intelligence, Chongqing University of Technology, Chongqing, China"],"raw_orcid":"https://orcid.org/0000-0001-5771-3886","affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, Chongqing University of Technology, Chongqing, China","institution_ids":["https://openalex.org/I50632499"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028793404","display_name":"Doudou Wu","orcid":"https://orcid.org/0000-0002-5189-8565"},"institutions":[{"id":"https://openalex.org/I50632499","display_name":"Chongqing University of Technology","ror":"https://ror.org/04vgbd477","country_code":"CN","type":"education","lineage":["https://openalex.org/I50632499"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Doudou Wu","raw_affiliation_strings":["School of Artificial Intelligence, Chongqing University of Technology, Chongqing, China"],"raw_orcid":"https://orcid.org/0000-0002-5189-8565","affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, Chongqing University of Technology, Chongqing, China","institution_ids":["https://openalex.org/I50632499"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026184280","display_name":"Wenming Yang","orcid":"https://orcid.org/0000-0002-2506-1286"},"institutions":[{"id":"https://openalex.org/I3131625388","display_name":"University Town of Shenzhen","ror":"https://ror.org/05f5j6225","country_code":"CN","type":"education","lineage":["https://openalex.org/I3131625388"]},{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenming Yang","raw_affiliation_strings":["Shenzhen International Graduate School, Department of Electronic Engineering, Tsinghua University, Shenzhen, China"],"raw_orcid":"https://orcid.org/0000-0002-2506-1286","affiliations":[{"raw_affiliation_string":"Shenzhen International Graduate School, Department of Electronic Engineering, Tsinghua University, Shenzhen, China","institution_ids":["https://openalex.org/I3131625388","https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5002794703","display_name":"Longbin Zhang","orcid":"https://orcid.org/0000-0001-8785-5885"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Longbin Zhang","raw_affiliation_strings":["School of Mechanical and Aerospace Engineering, Rehabilitation Research Institute of Singapore, Nanyang Technological University, Singapore"],"raw_orcid":"https://orcid.org/0000-0001-8785-5885","affiliations":[{"raw_affiliation_string":"School of Mechanical and Aerospace Engineering, Rehabilitation Research Institute of Singapore, Nanyang Technological University, Singapore","institution_ids":["https://openalex.org/I172675005"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5001918537"],"corresponding_institution_ids":["https://openalex.org/I50632499"],"apc_list":null,"apc_paid":null,"fwci":3.2294,"has_fulltext":false,"cited_by_count":28,"citation_normalized_percentile":{"value":0.93781938,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":"26","issue":null,"first_page":"4039","last_page":"4049"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12740","display_name":"Gait Recognition and Analysis","score":0.9955999851226807,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11227","display_name":"Diabetic Foot Ulcer Assessment and Management","score":0.993399977684021,"subfield":{"id":"https://openalex.org/subfields/2712","display_name":"Endocrinology, Diabetes and Metabolism"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8106875419616699},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.7923307418823242},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5641918182373047},{"id":"https://openalex.org/keywords/spatial-correlation","display_name":"Spatial correlation","score":0.5249112844467163},{"id":"https://openalex.org/keywords/correlation","display_name":"Correlation","score":0.4832042455673218},{"id":"https://openalex.org/keywords/encoding","display_name":"Encoding (memory)","score":0.47720012068748474},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.46790608763694763},{"id":"https://openalex.org/keywords/spatial-analysis","display_name":"Spatial analysis","score":0.45064103603363037},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.36255893111228943},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.32002031803131104},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.07976531982421875}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8106875419616699},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.7923307418823242},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5641918182373047},{"id":"https://openalex.org/C150060386","wikidata":"https://www.wikidata.org/wiki/Q7574054","display_name":"Spatial correlation","level":2,"score":0.5249112844467163},{"id":"https://openalex.org/C117220453","wikidata":"https://www.wikidata.org/wiki/Q5172842","display_name":"Correlation","level":2,"score":0.4832042455673218},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.47720012068748474},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.46790608763694763},{"id":"https://openalex.org/C159620131","wikidata":"https://www.wikidata.org/wiki/Q1938983","display_name":"Spatial analysis","level":2,"score":0.45064103603363037},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.36255893111228943},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.32002031803131104},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.07976531982421875},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tmm.2023.3321438","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2023.3321438","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3370211328","display_name":null,"funder_award_id":"62171251","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":58,"referenced_works":["https://openalex.org/W2101032778","https://openalex.org/W2554247908","https://openalex.org/W2593146028","https://openalex.org/W2611932403","https://openalex.org/W2612706635","https://openalex.org/W2751690145","https://openalex.org/W2769237672","https://openalex.org/W2797184202","https://openalex.org/W2799211965","https://openalex.org/W2906502833","https://openalex.org/W2916798096","https://openalex.org/W2962824791","https://openalex.org/W2962896489","https://openalex.org/W2963225971","https://openalex.org/W2963598138","https://openalex.org/W2964221239","https://openalex.org/W2964318832","https://openalex.org/W2970285700","https://openalex.org/W2972662547","https://openalex.org/W2981660954","https://openalex.org/W2982627166","https://openalex.org/W3014509175","https://openalex.org/W3034448411","https://openalex.org/W3034581612","https://openalex.org/W3085139254","https://openalex.org/W3096609285","https://openalex.org/W3098473649","https://openalex.org/W3098612954","https://openalex.org/W3106838237","https://openalex.org/W3106882556","https://openalex.org/W3121523901","https://openalex.org/W3126541466","https://openalex.org/W3131500599","https://openalex.org/W3136525061","https://openalex.org/W3183950642","https://openalex.org/W3195639294","https://openalex.org/W3205327953","https://openalex.org/W3205873049","https://openalex.org/W4213019189","https://openalex.org/W4225557002","https://openalex.org/W4282964781","https://openalex.org/W4285259379","https://openalex.org/W4287177665","https://openalex.org/W4296355237","https://openalex.org/W4312249545","https://openalex.org/W4312417903","https://openalex.org/W4312797994","https://openalex.org/W4385245566","https://openalex.org/W6631190155","https://openalex.org/W6767176642","https://openalex.org/W6779089016","https://openalex.org/W6780226713","https://openalex.org/W6784333009","https://openalex.org/W6788135285","https://openalex.org/W6790375769","https://openalex.org/W6790690058","https://openalex.org/W6796761347","https://openalex.org/W6838740678"],"related_works":["https://openalex.org/W1950940422","https://openalex.org/W4283822356","https://openalex.org/W2129146436","https://openalex.org/W2032507829","https://openalex.org/W2147282173","https://openalex.org/W1988032185","https://openalex.org/W2898021863","https://openalex.org/W3003272824","https://openalex.org/W2521335480","https://openalex.org/W3121692546"],"abstract_inverted_index":{"Transformers":[0],"have":[1],"been":[2],"used":[3],"for":[4],"3D":[5],"human":[6,27,44],"pose":[7],"estimation":[8],"with":[9,128,150,178,193,210],"excellent":[10],"performance;":[11],"however,":[12],"most":[13],"transformers":[14],"focus":[15],"on":[16,34,157],"encoding":[17],"the":[18,26,35,43,60,79,91,108,117,167,173,186,203],"global":[19,80,92],"spatio-temporal":[20],"correlation":[21,38],"of":[22,39,83,95,113,169,175,189],"all":[23,84,96],"joints":[24,85],"in":[25,42,86,116,166],"body":[28],"and":[29,53,69,90,110,135,153,163,195],"there":[30],"are":[31,75,183],"few":[32],"studies":[33],"local":[36,118],"Spatio-temporal":[37,61],"each":[40,114,139],"joint":[41,115],"body.":[45],"In":[46],"this":[47],"article,":[48],"we":[49,122],"propose":[50,123],"a":[51,64,70,87,124],"Global":[52,65,71],"Local":[54,100],"Spatio-Temporal":[55,101],"Encoder":[56,67,73,102],"(GLSTE)":[57],"to":[58,77,106,131],"model":[59,204],"correlation.":[62],"Specifically,":[63],"Spatial":[66],"(GSE)":[68],"Temporal":[72],"(GTE)":[74],"constructed":[76,105],"capture":[78,107],"spatial":[81,109,134],"information":[82,94,112,137,209],"single":[88],"frame":[89],"temporal":[93,111,136],"frames,":[97],"respectively.":[98],"A":[99],"(LSTE)":[103],"is":[104],"N":[119],"frames.":[120],"Furthermore,":[121],"parallel":[125],"attention":[126],"module":[127],"weight":[129],"sharing":[130],"better":[132,184],"incorporate":[133],"into":[138],"node":[140],"simultaneously.":[141],"Extensive":[142],"experiments":[143],"show":[144],"that":[145,202],"GLSTE":[146],"outperforms":[147],"state-of-the-art":[148],"methods":[149,192],"fewer":[151],"parameters":[152],"less":[154],"computational":[155],"overhead":[156],"two":[158],"challenging":[159],"datasets:":[160],"Human3.6":[161,170],"M":[162,171],"MPI-INF-3DHP.":[164],"Especially":[165],"evaluation":[168],"dataset,":[172],"results":[174],"our":[176],"method":[177],"27":[179],"frames":[180,197],"as":[181,198],"input":[182],"than":[185],"vast":[187],"majority":[188],"recent":[190],"SOTA":[191],"81":[194],"243":[196],"input,":[199],"which":[200],"indicates":[201],"can":[205],"learn":[206],"more":[207],"useful":[208],"smaller":[211],"inputs.":[212]},"counts_by_year":[{"year":2026,"cited_by_count":8},{"year":2025,"cited_by_count":12},{"year":2024,"cited_by_count":8}],"updated_date":"2026-05-07T13:39:58.223016","created_date":"2025-10-10T00:00:00"}
