{"id":"https://openalex.org/W4391408867","doi":"https://doi.org/10.1145/3627631.3627640","title":"STTGC-Net: Spatial-Temporal Transformer with Graph Convolution for Skeleton-Based Action Recognition","display_name":"STTGC-Net: Spatial-Temporal Transformer with Graph Convolution for Skeleton-Based Action Recognition","publication_year":2023,"publication_date":"2023-12-15","ids":{"openalex":"https://openalex.org/W4391408867","doi":"https://doi.org/10.1145/3627631.3627640"},"language":"en","primary_location":{"id":"doi:10.1145/3627631.3627640","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3627631.3627640","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Fourteenth Indian Conference on Computer Vision, Graphics and Image Processing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5093834073","display_name":"Tanishka Yagneshwar","orcid":"https://orcid.org/0009-0008-7470-1578"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Tanishka Yagneshwar","raw_affiliation_strings":["Computer Science and Engineering, Shiv Nadar Institute of Eminence, IN"],"affiliations":[{"raw_affiliation_string":"Computer Science and Engineering, Shiv Nadar Institute of Eminence, IN","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5070435685","display_name":"Snehasis Mukherjee","orcid":"https://orcid.org/0000-0002-2196-8980"},"institutions":[{"id":"https://openalex.org/I26604189","display_name":"Shiv Nadar University","ror":"https://ror.org/05aqahr97","country_code":"IN","type":"education","lineage":["https://openalex.org/I26604189"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Snehasis Mukherjee","raw_affiliation_strings":["Computer Science and Engineering, Shiv Nadar Institute of Eminence, Greater Noida, India, IN"],"affiliations":[{"raw_affiliation_string":"Computer Science and Engineering, Shiv Nadar Institute of Eminence, Greater Noida, India, IN","institution_ids":["https://openalex.org/I26604189"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5093834073"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.2456,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.5579811,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"10"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11398","display_name":"Hand Gesture Recognition Systems","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12740","display_name":"Gait Recognition and Analysis","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.740143358707428},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.5700982809066772},{"id":"https://openalex.org/keywords/action-recognition","display_name":"Action recognition","score":0.5601530075073242},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.49954748153686523},{"id":"https://openalex.org/keywords/convolution","display_name":"Convolution (computer science)","score":0.4833950102329254},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.48124027252197266},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4354478120803833},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.2764151990413666},{"id":"https://openalex.org/keywords/voltage","display_name":"Voltage","score":0.14278194308280945},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.095905601978302},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.06049090623855591},{"id":"https://openalex.org/keywords/electrical-engineering","display_name":"Electrical engineering","score":0.05839329957962036}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.740143358707428},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.5700982809066772},{"id":"https://openalex.org/C2987834672","wikidata":"https://www.wikidata.org/wiki/Q4677630","display_name":"Action recognition","level":3,"score":0.5601530075073242},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.49954748153686523},{"id":"https://openalex.org/C45347329","wikidata":"https://www.wikidata.org/wiki/Q5166604","display_name":"Convolution (computer science)","level":3,"score":0.4833950102329254},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.48124027252197266},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4354478120803833},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.2764151990413666},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.14278194308280945},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.095905601978302},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.06049090623855591},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.05839329957962036},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3627631.3627640","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3627631.3627640","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Fourteenth Indian Conference on Computer Vision, Graphics and Image Processing","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":43,"referenced_works":["https://openalex.org/W2048821851","https://openalex.org/W2056898157","https://openalex.org/W2183161252","https://openalex.org/W2284126738","https://openalex.org/W2558333741","https://openalex.org/W2606294640","https://openalex.org/W2607707631","https://openalex.org/W2716916105","https://openalex.org/W2751841288","https://openalex.org/W2792140610","https://openalex.org/W2793547936","https://openalex.org/W2944006115","https://openalex.org/W2948058585","https://openalex.org/W2948246283","https://openalex.org/W2948729509","https://openalex.org/W2962730651","https://openalex.org/W2963076818","https://openalex.org/W2964134613","https://openalex.org/W2966210862","https://openalex.org/W2978884181","https://openalex.org/W3034999503","https://openalex.org/W3035050855","https://openalex.org/W3035149912","https://openalex.org/W3035225512","https://openalex.org/W3049455300","https://openalex.org/W3081111248","https://openalex.org/W3093411241","https://openalex.org/W3096609285","https://openalex.org/W3106615203","https://openalex.org/W3120179362","https://openalex.org/W3153880451","https://openalex.org/W3170841864","https://openalex.org/W3174836262","https://openalex.org/W3203634062","https://openalex.org/W3205898195","https://openalex.org/W4205432963","https://openalex.org/W4214612132","https://openalex.org/W4221166048","https://openalex.org/W4295957147","https://openalex.org/W4320015918","https://openalex.org/W4324119270","https://openalex.org/W4380997409","https://openalex.org/W4386065445"],"related_works":["https://openalex.org/W2182785089","https://openalex.org/W4312178642","https://openalex.org/W4387838477","https://openalex.org/W2067193074","https://openalex.org/W4303411729","https://openalex.org/W2965803933","https://openalex.org/W4211202157","https://openalex.org/W4283332100","https://openalex.org/W4361193049","https://openalex.org/W4287181611"],"abstract_inverted_index":{"Skeleton":[0],"data":[1,67],"plays":[2],"an":[3,126,190],"important":[4],"role":[5],"in":[6,81,102,144,167,249],"human":[7,18],"action":[8,26,143,146],"recognition":[9,27],"due":[10,31,61],"to":[11,32,62,65,138,220],"the":[12,22,33,43,96,110,115,122,145,164,168,176,179,222,239,244,257,261,273],"compact":[13],"and":[14,85,105,119,136,205,212,231,238,263,276],"distinct":[15],"information":[16,174,234],"of":[17,35,46,114,121,260],"poses":[19],"provided":[20],"by":[21,269],"skeleton":[23,59,93],"data.":[24],"Skeleton-based":[25],"is":[28,286],"gaining":[29],"interest":[30],"availability":[34],"Kinect":[36],"cameras":[37],"at":[38,235],"a":[39,141,159],"reasonable":[40],"price.":[41],"With":[42],"growing":[44],"popularity":[45],"Geometric":[47],"deep":[48],"learning,":[49],"Graph":[50,75,197,209],"Convolutional":[51,76,210],"networks":[52],"(GCN)":[53],"are":[54,79,217],"extensively":[55],"used":[56],"for":[57],"processing":[58],"data,":[60,90,169],"their":[63],"ability":[64],"model":[66,268],"topology.":[68],"It":[69],"has":[70],"been":[71],"found":[72],"that":[73,129,200],"Spatial-Temporal":[74,193,208,213],"Networks":[77,211],"(ST-GCN)":[78],"efficient":[80],"learning":[82],"both":[83],"spatial":[84,116],"temporal":[86,228],"dependencies":[87],"on":[88,140,272],"non-Euclidean":[89],"such":[91],"as":[92],"graphs.":[94],"However,":[95,156],"state-of-the-art":[97,282],"ST-GCN":[98],"models":[99],"lack":[100,125],"flexibility":[101],"feature":[103],"extraction":[104],"do":[106],"not":[107],"explicitly":[108],"consider":[109],"high-order":[111],"Spatio-Temporal":[112],"significance":[113],"connection":[117],"topology":[118,251],"intensity":[120],"joints.":[123],"They":[124],"attention":[127,241],"module":[128,242],"can":[130,151,171,201],"help":[131],"us":[132],"learn":[133],"together":[134],"when":[135],"where":[137],"concentrate":[139],"certain":[142],"sequence.":[147],"The":[148,225,284],"transformer-based":[149],"methods":[150],"effectively":[152],"capture":[153,203,227],"long-distance":[154],"dependencies.":[155],"using":[157],"just":[158],"traditional":[160],"transformer":[161,240],"approach":[162],"overlooks":[163],"graph":[165],"structure":[166],"which":[170,255,280],"provide":[172],"valuable":[173],"about":[175],"inter-relationships":[177],"among":[178],"joint":[180,247],"points":[181],"during":[182],"actions.":[183],"To":[184],"address":[185],"this":[186],"problem,":[187],"we":[188],"propose":[189],"architecture":[191],"named":[192],"Transformer":[194,214],"Network":[195],"with":[196],"Convolution":[198],"(STTGC-Net),":[199],"flexibly":[202],"local":[204,232],"global":[206,250],"contexts.":[207],"Attention":[215],"Modules":[216],"sequentially":[218],"fused":[219],"create":[221],"proposed":[223],"framework.":[224],"ST-GCNs":[226],"dynamics,":[229],"hierarchy,":[230],"topological":[233],"several":[236],"levels,":[237],"displays":[243],"correlations":[245],"between":[246],"pairs":[248],"via":[252],"dynamic":[253],"attention,":[254],"resolves":[256],"mentioned":[258],"constraints":[259],"GCN":[262],"transformer.":[264],"We":[265],"validate":[266],"our":[267],"conducting":[270],"tests":[271],"NTU":[274,277],"60":[275],"120":[278],"datasets,":[279],"achieve":[281],"performance.":[283],"code":[285],"available":[287],"through":[288],"github.":[289]},"counts_by_year":[{"year":2025,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
