{"id":"https://openalex.org/W7133483982","doi":"https://doi.org/10.3390/robotics15030054","title":"STAG-Net: A Lightweight Spatial\u2013Temporal Attention GCN for Real-Time 6D Human Pose Estimation in Human\u2013Robot Collaboration Scenarios","display_name":"STAG-Net: A Lightweight Spatial\u2013Temporal Attention GCN for Real-Time 6D Human Pose Estimation in Human\u2013Robot Collaboration Scenarios","publication_year":2026,"publication_date":"2026-03-04","ids":{"openalex":"https://openalex.org/W7133483982","doi":"https://doi.org/10.3390/robotics15030054"},"language":"en","primary_location":{"id":"doi:10.3390/robotics15030054","is_oa":true,"landing_page_url":"https://doi.org/10.3390/robotics15030054","pdf_url":"https://www.mdpi.com/2218-6581/15/3/54/pdf?version=1772622809","source":{"id":"https://openalex.org/S4210232487","display_name":"Robotics","issn_l":"2218-6581","issn":["2218-6581"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Robotics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.mdpi.com/2218-6581/15/3/54/pdf?version=1772622809","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Chunxin Yang","orcid":"https://orcid.org/0009-0009-8176-9068"},"institutions":[{"id":"https://openalex.org/I14396692","display_name":"Tokyo University of Information Sciences","ror":"https://ror.org/044bdx604","country_code":"JP","type":"education","lineage":["https://openalex.org/I14396692"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Chunxin Yang","raw_affiliation_strings":["Interfaculty Initiative in Information Studies, Graduate School of Interdisciplinary Information Studies, The University of Tokyo, Tokyo 113-0033, Japan"],"raw_orcid":"https://orcid.org/0009-0009-8176-9068","affiliations":[{"raw_affiliation_string":"Interfaculty Initiative in Information Studies, Graduate School of Interdisciplinary Information Studies, The University of Tokyo, Tokyo 113-0033, Japan","institution_ids":["https://openalex.org/I14396692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066074539","display_name":"Ruoyu Jia","orcid":null},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Ruoyu Jia","raw_affiliation_strings":["Graduate School of Engineering, The University of Tokyo, Tokyo 113-0033, Japan"],"raw_orcid":"https://orcid.org/0000-0002-6221-2899","affiliations":[{"raw_affiliation_string":"Graduate School of Engineering, The University of Tokyo, Tokyo 113-0033, Japan","institution_ids":["https://openalex.org/I74801974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108757059","display_name":"Qitong Guo","orcid":null},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Qitong Guo","raw_affiliation_strings":["Graduate School of Engineering, The University of Tokyo, Tokyo 113-0033, Japan"],"raw_orcid":"https://orcid.org/0009-0002-9415-802X","affiliations":[{"raw_affiliation_string":"Graduate School of Engineering, The University of Tokyo, Tokyo 113-0033, Japan","institution_ids":["https://openalex.org/I74801974"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Xiaohang Shi","orcid":"https://orcid.org/0009-0009-1565-238X"},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Xiaohang Shi","raw_affiliation_strings":["Graduate School of Engineering, The University of Tokyo, Tokyo 113-0033, Japan"],"raw_orcid":"https://orcid.org/0009-0009-1565-238X","affiliations":[{"raw_affiliation_string":"Graduate School of Engineering, The University of Tokyo, Tokyo 113-0033, Japan","institution_ids":["https://openalex.org/I74801974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101412704","display_name":"Masahiro Hirano","orcid":"https://orcid.org/0009-0005-4544-1955"},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Masahiro Hirano","raw_affiliation_strings":["Institute of Industrial Science, The University of Tokyo, Tokyo 153-8505, Japan"],"raw_orcid":"https://orcid.org/0009-0005-4544-1955","affiliations":[{"raw_affiliation_string":"Institute of Industrial Science, The University of Tokyo, Tokyo 153-8505, Japan","institution_ids":["https://openalex.org/I74801974"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5128051017","display_name":"Yuji Yamakawa","orcid":null},"institutions":[{"id":"https://openalex.org/I14396692","display_name":"Tokyo University of Information Sciences","ror":"https://ror.org/044bdx604","country_code":"JP","type":"education","lineage":["https://openalex.org/I14396692"]},{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Yuji Yamakawa","raw_affiliation_strings":["Graduate School of Interdisciplinary Information Studies, The University of Tokyo, Tokyo 113-0033, Japan"],"raw_orcid":"https://orcid.org/0000-0002-2880-7055","affiliations":[{"raw_affiliation_string":"Graduate School of Interdisciplinary Information Studies, The University of Tokyo, Tokyo 113-0033, Japan","institution_ids":["https://openalex.org/I14396692","https://openalex.org/I74801974"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I14396692"],"apc_list":{"value":1600,"currency":"CHF","value_usd":1732},"apc_paid":{"value":1600,"currency":"CHF","value_usd":1732},"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.42907432,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"15","issue":"3","first_page":"54","last_page":"54"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9160000085830688,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9160000085830688,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.05730000138282776,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.006000000052154064,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pose","display_name":"Pose","score":0.7257000207901001},{"id":"https://openalex.org/keywords/joint","display_name":"Joint (building)","score":0.6862000226974487},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.5619000196456909},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.5465999841690063},{"id":"https://openalex.org/keywords/orientation","display_name":"Orientation (vector space)","score":0.5436999797821045},{"id":"https://openalex.org/keywords/rgb-color-model","display_name":"RGB color model","score":0.5436000227928162},{"id":"https://openalex.org/keywords/sensitivity","display_name":"Sensitivity (control systems)","score":0.453000009059906}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7357000112533569},{"id":"https://openalex.org/C52102323","wikidata":"https://www.wikidata.org/wiki/Q1671968","display_name":"Pose","level":2,"score":0.7257000207901001},{"id":"https://openalex.org/C18555067","wikidata":"https://www.wikidata.org/wiki/Q8375051","display_name":"Joint (building)","level":2,"score":0.6862000226974487},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.60589998960495},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.5619000196456909},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.5465999841690063},{"id":"https://openalex.org/C16345878","wikidata":"https://www.wikidata.org/wiki/Q107472979","display_name":"Orientation (vector space)","level":2,"score":0.5436999797821045},{"id":"https://openalex.org/C82990744","wikidata":"https://www.wikidata.org/wiki/Q166194","display_name":"RGB color model","level":2,"score":0.5436000227928162},{"id":"https://openalex.org/C21200559","wikidata":"https://www.wikidata.org/wiki/Q7451068","display_name":"Sensitivity (control systems)","level":2,"score":0.453000009059906},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4180000126361847},{"id":"https://openalex.org/C151201525","wikidata":"https://www.wikidata.org/wiki/Q177239","display_name":"Limit (mathematics)","level":2,"score":0.39329999685287476},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.3237999975681305},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3237000107765198},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3181000053882599},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.28760001063346863},{"id":"https://openalex.org/C108882727","wikidata":"https://www.wikidata.org/wiki/Q2991685","display_name":"Solid modeling","level":2,"score":0.28060001134872437},{"id":"https://openalex.org/C48007421","wikidata":"https://www.wikidata.org/wiki/Q676252","display_name":"Motion capture","level":3,"score":0.27140000462532043},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.25609999895095825}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.3390/robotics15030054","is_oa":true,"landing_page_url":"https://doi.org/10.3390/robotics15030054","pdf_url":"https://www.mdpi.com/2218-6581/15/3/54/pdf?version=1772622809","source":{"id":"https://openalex.org/S4210232487","display_name":"Robotics","issn_l":"2218-6581","issn":["2218-6581"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Robotics","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:50ee0de9d5414be88dbd2de2bcef8008","is_oa":true,"landing_page_url":"https://doaj.org/article/50ee0de9d5414be88dbd2de2bcef8008","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Robotics, Vol 15, Iss 3, p 54 (2026)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.3390/robotics15030054","is_oa":true,"landing_page_url":"https://doi.org/10.3390/robotics15030054","pdf_url":"https://www.mdpi.com/2218-6581/15/3/54/pdf?version=1772622809","source":{"id":"https://openalex.org/S4210232487","display_name":"Robotics","issn_l":"2218-6581","issn":["2218-6581"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Robotics","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W7133483982.pdf","grobid_xml":"https://content.openalex.org/works/W7133483982.grobid-xml"},"referenced_works_count":50,"referenced_works":["https://openalex.org/W2016959837","https://openalex.org/W2099333815","https://openalex.org/W2101032778","https://openalex.org/W2554247908","https://openalex.org/W2583585015","https://openalex.org/W2610034660","https://openalex.org/W2612706635","https://openalex.org/W2769237672","https://openalex.org/W2797184202","https://openalex.org/W2798646183","https://openalex.org/W2895689136","https://openalex.org/W2949924544","https://openalex.org/W2962896489","https://openalex.org/W2963076818","https://openalex.org/W2963995996","https://openalex.org/W2964016027","https://openalex.org/W2964221239","https://openalex.org/W2964318832","https://openalex.org/W2966735886","https://openalex.org/W2970285700","https://openalex.org/W2972662547","https://openalex.org/W3023681781","https://openalex.org/W3034448411","https://openalex.org/W3093002101","https://openalex.org/W3097623574","https://openalex.org/W3106882556","https://openalex.org/W3126541466","https://openalex.org/W3136525061","https://openalex.org/W3167491448","https://openalex.org/W3173811519","https://openalex.org/W3196805674","https://openalex.org/W3202716970","https://openalex.org/W3204956438","https://openalex.org/W4205556443","https://openalex.org/W4225557002","https://openalex.org/W4226057760","https://openalex.org/W4312249545","https://openalex.org/W4312845873","https://openalex.org/W4313068951","https://openalex.org/W4385801222","https://openalex.org/W4386076353","https://openalex.org/W4386076485","https://openalex.org/W4386083126","https://openalex.org/W4390873166","https://openalex.org/W4390874423","https://openalex.org/W4394597906","https://openalex.org/W4396747546","https://openalex.org/W4396857019","https://openalex.org/W4403488737","https://openalex.org/W4409186742"],"related_works":[],"abstract_inverted_index":{"Most":[0],"existing":[1],"research":[2],"in":[3,40,60,91,173],"human":[4,20],"pose":[5],"estimation":[6],"focuses":[7],"on":[8,82,186],"predicting":[9],"joint":[10,26,55,125],"positions,":[11],"paying":[12],"limited":[13],"attention":[14,115],"to":[15,47],"recovering":[16],"the":[17,143,191,196],"full":[18],"6D":[19],"pose,":[21],"which":[22,87,166],"comprises":[23],"both":[24],"3D":[25],"positions":[27,56,126],"and":[28,44,117,127,139,193],"bone":[29,64,128],"orientations.":[30,62],"Position-only":[31],"methods":[32,80],"treat":[33],"joints":[34],"as":[35,95],"independent":[36],"points,":[37],"often":[38],"resulting":[39],"structurally":[41],"implausible":[42],"poses":[43,51],"increased":[45],"sensitivity":[46],"depth":[48],"ambiguities\u2014cases":[49],"where":[50],"share":[52],"nearly":[53],"identical":[54],"but":[57],"differ":[58],"significantly":[59],"limb":[61],"Incorporating":[63],"orientation":[65],"information":[66],"helps":[67],"enforce":[68],"geometric":[69],"consistency,":[70],"yielding":[71],"more":[72],"anatomically":[73],"plausible":[74],"skeletal":[75,134],"structures.":[76],"Additionally,":[77],"many":[78],"state-of-the-art":[79],"rely":[81],"large,":[83],"computationally":[84,140],"expensive":[85],"models,":[86],"limit":[88],"their":[89],"applicability":[90],"real-time":[92],"scenarios,":[93],"such":[94],"human\u2013robot":[96],"collaboration.":[97],"In":[98,157],"this":[99],"work,":[100],"we":[101,159],"propose":[102],"STAG-Net,":[103],"a":[104,161,180],"novel":[105],"2D-to-6D":[106],"lifting":[107],"network":[108],"that":[109],"integrates":[110],"Graph":[111],"Convolutional":[112,119],"Networks":[113,120],"(GCNs),":[114],"mechanisms,":[116],"Temporal":[118],"(TCNs).":[121],"By":[122],"simultaneously":[123],"learning":[124],"orientations,":[129],"STAG-Net":[130,146],"promotes":[131],"geometrically":[132],"consistent":[133],"structures":[135],"while":[136,171],"remaining":[137],"lightweight":[138,162],"efficient.":[141],"On":[142],"Human3.6M":[144],"benchmark,":[145],"achieves":[147,167],"an":[148],"MPJPE":[149,170],"of":[150,195],"41.8":[151],"mm":[152,169],"using":[153,179],"243":[154],"input":[155],"frames.":[156],"addition,":[158],"introduce":[160],"single-frame":[163],"variant,":[164],"STG-Net,":[165],"50.8":[168],"operating":[172],"real":[174],"time":[175],"at":[176],"60":[177],"FPS":[178],"single":[181],"RGB":[182],"camera.":[183],"Extensive":[184],"experiments":[185],"multiple":[187],"large-scale":[188],"datasets":[189],"demonstrate":[190],"effectiveness":[192],"efficiency":[194],"proposed":[197],"approach.":[198]},"counts_by_year":[],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2026-03-05T00:00:00"}
