{"id":"https://openalex.org/W7125921522","doi":"https://doi.org/10.1109/smc58881.2025.11343686","title":"TTTFormer: Token Pruning-based Spatio-Temporal Topology Transformer for 3D Human Pose Estimation","display_name":"TTTFormer: Token Pruning-based Spatio-Temporal Topology Transformer for 3D Human Pose Estimation","publication_year":2025,"publication_date":"2025-10-05","ids":{"openalex":"https://openalex.org/W7125921522","doi":"https://doi.org/10.1109/smc58881.2025.11343686"},"language":null,"primary_location":{"id":"doi:10.1109/smc58881.2025.11343686","is_oa":false,"landing_page_url":"https://doi.org/10.1109/smc58881.2025.11343686","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Systems, Man, and Cybernetics (SMC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100769848","display_name":"Yifu Li","orcid":"https://orcid.org/0000-0002-7077-7689"},"institutions":[{"id":"https://openalex.org/I139660479","display_name":"Central South University","ror":"https://ror.org/00f1zfq44","country_code":"CN","type":"education","lineage":["https://openalex.org/I139660479"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yifu Li","raw_affiliation_strings":["Central South University,School of Computer Science and Engineering,Changsha,China,410075"],"affiliations":[{"raw_affiliation_string":"Central South University,School of Computer Science and Engineering,Changsha,China,410075","institution_ids":["https://openalex.org/I139660479"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101406800","display_name":"Jun Yu","orcid":"https://orcid.org/0000-0002-9142-0929"},"institutions":[{"id":"https://openalex.org/I139660479","display_name":"Central South University","ror":"https://ror.org/00f1zfq44","country_code":"CN","type":"education","lineage":["https://openalex.org/I139660479"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiaxuan Yu","raw_affiliation_strings":["Central South University,School of Computer Science and Engineering,Changsha,China,410075"],"affiliations":[{"raw_affiliation_string":"Central South University,School of Computer Science and Engineering,Changsha,China,410075","institution_ids":["https://openalex.org/I139660479"]}]},{"author_position":"last","author":{"id":null,"display_name":"Zhigang Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I139660479","display_name":"Central South University","ror":"https://ror.org/00f1zfq44","country_code":"CN","type":"education","lineage":["https://openalex.org/I139660479"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhigang Chen","raw_affiliation_strings":["Central South University,School of Computer Science and Engineering,Changsha,China,410075"],"affiliations":[{"raw_affiliation_string":"Central South University,School of Computer Science and Engineering,Changsha,China,410075","institution_ids":["https://openalex.org/I139660479"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5100769848"],"corresponding_institution_ids":["https://openalex.org/I139660479"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.70472409,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"848","last_page":"855"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9570000171661377,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9570000171661377,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.013899999670684338,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12740","display_name":"Gait Recognition and Analysis","score":0.009499999694526196,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/security-token","display_name":"Security token","score":0.6198999881744385},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.5776000022888184},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.5526000261306763},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.5389000177383423},{"id":"https://openalex.org/keywords/pose","display_name":"Pose","score":0.48179998993873596},{"id":"https://openalex.org/keywords/topology","display_name":"Topology (electrical circuits)","score":0.4781999886035919},{"id":"https://openalex.org/keywords/rendering","display_name":"Rendering (computer graphics)","score":0.396699994802475}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7289000153541565},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.6198999881744385},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.5776000022888184},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.5526000261306763},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.5389000177383423},{"id":"https://openalex.org/C52102323","wikidata":"https://www.wikidata.org/wiki/Q1671968","display_name":"Pose","level":2,"score":0.48179998993873596},{"id":"https://openalex.org/C184720557","wikidata":"https://www.wikidata.org/wiki/Q7825049","display_name":"Topology (electrical circuits)","level":2,"score":0.4781999886035919},{"id":"https://openalex.org/C205711294","wikidata":"https://www.wikidata.org/wiki/Q176953","display_name":"Rendering (computer graphics)","level":2,"score":0.396699994802475},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3675999939441681},{"id":"https://openalex.org/C199845137","wikidata":"https://www.wikidata.org/wiki/Q145490","display_name":"Network topology","level":2,"score":0.3384999930858612},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3327000141143799},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.319599986076355},{"id":"https://openalex.org/C66024118","wikidata":"https://www.wikidata.org/wiki/Q1122506","display_name":"Computational model","level":2,"score":0.3012000024318695},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.2946000099182129},{"id":"https://openalex.org/C185429906","wikidata":"https://www.wikidata.org/wiki/Q1130160","display_name":"Estimator","level":2,"score":0.2833999991416931},{"id":"https://openalex.org/C174348530","wikidata":"https://www.wikidata.org/wiki/Q188635","display_name":"Bridging (networking)","level":2,"score":0.263700008392334},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.2574000060558319}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/smc58881.2025.11343686","is_oa":false,"landing_page_url":"https://doi.org/10.1109/smc58881.2025.11343686","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Systems, Man, and Cybernetics (SMC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":25,"referenced_works":["https://openalex.org/W2101032778","https://openalex.org/W2781181706","https://openalex.org/W2895689136","https://openalex.org/W2964221239","https://openalex.org/W2964318832","https://openalex.org/W2966735886","https://openalex.org/W2991247554","https://openalex.org/W2997288107","https://openalex.org/W3034581612","https://openalex.org/W3103184573","https://openalex.org/W3106838237","https://openalex.org/W3136525061","https://openalex.org/W3180037928","https://openalex.org/W3188906027","https://openalex.org/W4225557002","https://openalex.org/W4312249545","https://openalex.org/W4312417903","https://openalex.org/W4312614783","https://openalex.org/W4312797994","https://openalex.org/W4313068951","https://openalex.org/W4382457852","https://openalex.org/W4386083126","https://openalex.org/W4390873166","https://openalex.org/W4402715909","https://openalex.org/W4402727550"],"related_works":[],"abstract_inverted_index":{"In":[0],"recent":[1],"years,":[2],"Transformer-based":[3],"methods":[4,19],"have":[5,20],"remained":[6],"the":[7,26,97,101,109,119,135,171],"dominant":[8],"approach":[9,155],"for":[10,44],"3D":[11,36,165],"human":[12],"pose":[13],"estimation":[14],"(3D":[15],"HPE).":[16],"While":[17],"these":[18],"achieved":[21],"continuous":[22],"improvements":[23],"in":[24,134,163],"accuracy,":[25],"inherently":[27],"high":[28,120],"computational":[29,121,152],"complexity":[30],"of":[31,63,100,123,193],"Transformer":[32,59],"modules":[33],"makes":[34],"current":[35],"HPE":[37,166],"models":[38],"excessively":[39],"resource-intensive,":[40],"rendering":[41],"them":[42],"impractical":[43],"deployment":[45],"on":[46,170],"resource-constrained":[47],"devices.":[48],"To":[49],"address":[50],"this":[51],"challenge,":[52],"we":[53,129],"propose":[54],"Token":[55,71,136],"Pruning-based":[56,72,137],"Spatio-Temporal":[57,65,73,138],"Topology":[58,66,91],"(TTTFormer),":[60],"which":[61,140],"consists":[62],"a":[64,70,89,131,157,191],"Encoder":[67],"(STTE)":[68],"and":[69,88,161,182,195],"Decoder.":[74],"The":[75,184],"STTE":[76,110],"incorporates":[77],"Spatial":[78],"Position":[79],"Embedding":[80],"(SPE)":[81],"to":[82,94,111,117,151],"model":[83,177,189],"spatial":[84],"correlations":[85],"between":[86,159],"joints":[87],"Temporal":[90],"Block":[92],"(TTB)":[93],"effectively":[95],"capture":[96],"temporal":[98],"relationships":[99],"same":[102],"joint":[103],"across":[104],"frames.":[105],"These":[106],"components":[107],"enable":[108],"extract":[112],"richer":[113],"spatio-temporal":[114],"features.":[115],"Furthermore,":[116],"mitigate":[118],"cost":[122],"transformers":[124],"when":[125],"handling":[126],"long":[127],"sequences,":[128],"introduce":[130],"lightweight":[132],"design":[133],"Decoder,":[139],"preserves":[141],"representative":[142],"tokens":[143],"while":[144],"discarding":[145],"redundant":[146],"ones":[147],"that":[148,175,187],"contribute":[149],"disproportionately":[150],"over-head.":[153],"This":[154],"achieves":[156,190],"balance":[158],"efficiency":[160,181],"accuracy":[162],"complex":[164],"tasks.":[167],"Extensive":[168],"experiments":[169],"Human3.6M":[172],"dataset":[173],"demonstrate":[174],"our":[176,188],"significantly":[178],"enhances":[179],"both":[180],"precision.":[183],"results":[185],"show":[186],"MPJPE":[192],"40.8mm":[194],"better":[196],"performance":[197],"with":[198],"364M":[199],"FLOPs":[200],"per":[201],"frame.":[202]},"counts_by_year":[],"updated_date":"2026-03-25T23:56:10.502304","created_date":"2026-01-29T00:00:00"}
