{"id":"https://openalex.org/W3015483809","doi":"https://doi.org/10.1109/tip.2020.2984904","title":"STA-CNN: Convolutional Spatial-Temporal Attention Learning for Action Recognition","display_name":"STA-CNN: Convolutional Spatial-Temporal Attention Learning for Action Recognition","publication_year":2020,"publication_date":"2020-01-01","ids":{"openalex":"https://openalex.org/W3015483809","doi":"https://doi.org/10.1109/tip.2020.2984904","mag":"3015483809","pmid":"https://pubmed.ncbi.nlm.nih.gov/32275599"},"language":"en","primary_location":{"id":"doi:10.1109/tip.2020.2984904","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tip.2020.2984904","pdf_url":null,"source":{"id":"https://openalex.org/S4210173141","display_name":"IEEE Transactions on Image Processing","issn_l":"1057-7149","issn":["1057-7149","1941-0042"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Image Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100748251","display_name":"Hao Yang","orcid":"https://orcid.org/0000-0003-3590-4491"},"institutions":[{"id":"https://openalex.org/I4210141517","display_name":"Nuctech (China)","ror":"https://ror.org/057vhsp23","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210141517"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Hao Yang","raw_affiliation_strings":["R&D Center of Artificial Intelligent, Nuctech Company Ltd., Beijing, China"],"affiliations":[{"raw_affiliation_string":"R&D Center of Artificial Intelligent, Nuctech Company Ltd., Beijing, China","institution_ids":["https://openalex.org/I4210141517"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005377211","display_name":"Chunfeng Yuan","orcid":"https://orcid.org/0000-0003-2219-4961"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chunfeng Yuan","raw_affiliation_strings":["National Laboratory of Pattern Recognition, Institute of Automation, Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"National Laboratory of Pattern Recognition, Institute of Automation, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100425669","display_name":"Li Zhang","orcid":"https://orcid.org/0000-0002-9321-3421"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Li Zhang","raw_affiliation_strings":["Department of Engineering Physics, Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Department of Engineering Physics, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100526684","display_name":"Yunda Sun","orcid":"https://orcid.org/0009-0000-3926-540X"},"institutions":[{"id":"https://openalex.org/I4210141517","display_name":"Nuctech (China)","ror":"https://ror.org/057vhsp23","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210141517"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yunda Sun","raw_affiliation_strings":["R&D Center of Artificial Intelligent, Nuctech Company Ltd., Beijing, China"],"affiliations":[{"raw_affiliation_string":"R&D Center of Artificial Intelligent, Nuctech Company Ltd., Beijing, China","institution_ids":["https://openalex.org/I4210141517"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114549594","display_name":"Weiming Hu","orcid":"https://orcid.org/0000-0001-9237-8825"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210097554","display_name":"Center for Excellence in Brain Science and Intelligence Technology","ror":"https://ror.org/00vpwhm04","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210097554"]},{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]},{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Weiming Hu","raw_affiliation_strings":["National Laboratory of Pattern Recognition, Chinese Academy of Science Center for Excellence in Brain Science and Intelligence Technology, Institute of Automation, Chinese Academy of Sciences, Beijing, China","School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"National Laboratory of Pattern Recognition, Chinese Academy of Science Center for Excellence in Brain Science and Intelligence Technology, Institute of Automation, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210097554","https://openalex.org/I4210112150","https://openalex.org/I19820366"]},{"raw_affiliation_string":"School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I4210165038"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5078239319","display_name":"Stephen J. Maybank","orcid":"https://orcid.org/0000-0003-2113-9119"},"institutions":[{"id":"https://openalex.org/I98259816","display_name":"Birkbeck, University of London","ror":"https://ror.org/02mb95055","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I98259816"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Stephen J. Maybank","raw_affiliation_strings":["Department of Computer Science and Information Systems, Birkbeck College, University of London, London, U.K"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Information Systems, Birkbeck College, University of London, London, U.K","institution_ids":["https://openalex.org/I98259816"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5100748251"],"corresponding_institution_ids":["https://openalex.org/I4210141517"],"apc_list":null,"apc_paid":null,"fwci":5.2996,"has_fulltext":false,"cited_by_count":80,"citation_normalized_percentile":{"value":0.96601234,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":100},"biblio":{"volume":"29","issue":null,"first_page":"5783","last_page":"5793"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9943000078201294,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.847392201423645},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.786605715751648},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7850035429000854},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.7806739211082458},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.6830853223800659},{"id":"https://openalex.org/keywords/pooling","display_name":"Pooling","score":0.6145209670066833},{"id":"https://openalex.org/keywords/optical-flow","display_name":"Optical flow","score":0.4376704692840576},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.42469507455825806},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.4152244031429291},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3678719699382782},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.1238783597946167}],"concepts":[{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.847392201423645},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.786605715751648},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7850035429000854},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.7806739211082458},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.6830853223800659},{"id":"https://openalex.org/C70437156","wikidata":"https://www.wikidata.org/wiki/Q7228652","display_name":"Pooling","level":2,"score":0.6145209670066833},{"id":"https://openalex.org/C155542232","wikidata":"https://www.wikidata.org/wiki/Q736111","display_name":"Optical flow","level":3,"score":0.4376704692840576},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.42469507455825806},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.4152244031429291},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3678719699382782},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.1238783597946167}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/tip.2020.2984904","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tip.2020.2984904","pdf_url":null,"source":{"id":"https://openalex.org/S4210173141","display_name":"IEEE Transactions on Image Processing","issn_l":"1057-7149","issn":["1057-7149","1941-0042"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Image Processing","raw_type":"journal-article"},{"id":"pmid:32275599","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/32275599","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on image processing : a publication of the IEEE Signal Processing Society","raw_type":null},{"id":"pmh:oai:eprints.bbk.ac.uk.oai2:31357","is_oa":false,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4306400466","display_name":"BIROn (Birkbeck, University of London)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I98259816","host_organization_name":"Birkbeck, University of London","host_organization_lineage":["https://openalex.org/I98259816"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":null,"raw_type":"PeerReviewed"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","score":0.7599999904632568,"display_name":"Reduced inequalities"}],"awards":[{"id":"https://openalex.org/G1477894522","display_name":null,"funder_award_id":"61472421","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2064497395","display_name":null,"funder_award_id":"61672519","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G247125729","display_name":null,"funder_award_id":"61472420","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3962180610","display_name":null,"funder_award_id":"61370185","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4306649430","display_name":null,"funder_award_id":"U1636218","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4391384632","display_name":null,"funder_award_id":"61472063","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4600069119","display_name":null,"funder_award_id":"61100099","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7184778669","display_name":null,"funder_award_id":"2017YFB1002801","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7625721555","display_name":null,"funder_award_id":"XDB02070003","funder_id":"https://openalex.org/F4320321133","funder_display_name":"Chinese Academy of Sciences"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320321133","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":79,"referenced_works":["https://openalex.org/W24089286","https://openalex.org/W764651262","https://openalex.org/W787785461","https://openalex.org/W874179280","https://openalex.org/W1484210532","https://openalex.org/W1514535095","https://openalex.org/W1522734439","https://openalex.org/W1686810756","https://openalex.org/W1744759976","https://openalex.org/W1821462560","https://openalex.org/W1899185266","https://openalex.org/W1977995219","https://openalex.org/W1983364832","https://openalex.org/W2016053056","https://openalex.org/W2064675550","https://openalex.org/W2097117768","https://openalex.org/W2108598243","https://openalex.org/W2126579184","https://openalex.org/W2133564696","https://openalex.org/W2147527908","https://openalex.org/W2156303437","https://openalex.org/W2163605009","https://openalex.org/W2194775991","https://openalex.org/W2235034809","https://openalex.org/W2295107390","https://openalex.org/W2308045930","https://openalex.org/W2339712187","https://openalex.org/W2342662179","https://openalex.org/W2398232863","https://openalex.org/W2401154299","https://openalex.org/W2467483865","https://openalex.org/W2472293097","https://openalex.org/W2505121268","https://openalex.org/W2508429489","https://openalex.org/W2554302513","https://openalex.org/W2594613244","https://openalex.org/W2612445135","https://openalex.org/W2734515856","https://openalex.org/W2779380177","https://openalex.org/W2798472916","https://openalex.org/W2886620625","https://openalex.org/W2898553394","https://openalex.org/W2941460356","https://openalex.org/W2950907316","https://openalex.org/W2951527505","https://openalex.org/W2962835968","https://openalex.org/W2962899219","https://openalex.org/W2962934715","https://openalex.org/W2963125010","https://openalex.org/W2963246338","https://openalex.org/W2963315828","https://openalex.org/W2963370182","https://openalex.org/W2963446712","https://openalex.org/W2963465031","https://openalex.org/W2963524571","https://openalex.org/W2963645879","https://openalex.org/W2963731876","https://openalex.org/W2963901033","https://openalex.org/W2963996492","https://openalex.org/W2964308564","https://openalex.org/W2980913109","https://openalex.org/W2992457155","https://openalex.org/W4288112001","https://openalex.org/W4294557331","https://openalex.org/W4297775537","https://openalex.org/W6600983433","https://openalex.org/W6622789128","https://openalex.org/W6628927728","https://openalex.org/W6630875275","https://openalex.org/W6637373629","https://openalex.org/W6637740493","https://openalex.org/W6638523607","https://openalex.org/W6679434410","https://openalex.org/W6682137061","https://openalex.org/W6682864246","https://openalex.org/W6684191040","https://openalex.org/W6684983439","https://openalex.org/W6724782142","https://openalex.org/W6737664043"],"related_works":["https://openalex.org/W2953234277","https://openalex.org/W2626256601","https://openalex.org/W147410782","https://openalex.org/W2900413183","https://openalex.org/W4390975304","https://openalex.org/W3022252430","https://openalex.org/W4287804464","https://openalex.org/W3103989898","https://openalex.org/W2965546495","https://openalex.org/W4401096132"],"abstract_inverted_index":{"Convolutional":[0,17,56],"Neural":[1,18,57],"Networks":[2,19],"have":[3,38],"achieved":[4],"excellent":[5],"successes":[6],"for":[7,24],"object":[8],"recognition":[9],"in":[10,27,95,123,156],"still":[11,46],"images.":[12,47],"However,":[13],"the":[14,21,34,62,69,104,119,129,152,157,164,170],"improvement":[15],"of":[16,169],"over":[20],"traditional":[22],"methods":[23],"recognizing":[25],"actions":[26,94],"videos":[28,36],"is":[29,135],"not":[30],"so":[31],"significant,":[32],"because":[33],"raw":[35],"usually":[37],"much":[39],"more":[40],"redundant":[41],"or":[42],"irrelevant":[43],"information":[44,122],"than":[45],"In":[48],"this":[49],"paper,":[50],"we":[51],"propose":[52],"a":[53,78,83,88,144],"Spatial-Temporal":[54],"Attentive":[55],"Network":[58],"(STA-CNN)":[59],"which":[60],"selects":[61],"discriminative":[63,105,153],"temporal":[64,106],"segments":[65,107],"and":[66,82,110,133,176],"focuses":[67],"on":[68,151,167],"informative":[70],"spatial":[71],"regions":[72,132,155],"automatically.":[73],"The":[74,97,113,160],"STA-CNN":[75,161],"model":[76,162],"incorporates":[77],"Temporal":[79,99],"Attention":[80,85,100,115],"Mechanism":[81,86,101,116],"Spatial":[84,114],"into":[87],"unified":[89],"convolutional":[90],"network":[91],"to":[92,127,149],"recognize":[93],"videos.":[96,112],"novel":[98],"automatically":[102],"mines":[103],"from":[108],"long":[109],"noisy":[111],"firstly":[117],"exploits":[118],"instantaneous":[120],"motion":[121,130],"optical":[124],"flow":[125],"features":[126],"locate":[128],"salient":[131],"it":[134],"then":[136],"trained":[137],"by":[138],"an":[139],"auxiliary":[140],"classification":[141],"loss":[142],"with":[143],"Global":[145],"Average":[146],"Pooling":[147],"layer":[148],"focus":[150],"non-motion":[154],"video":[158],"frame.":[159],"achieves":[163],"state-of-the-art":[165],"performance":[166],"two":[168],"most":[171],"challenging":[172],"datasets,":[173],"UCF-101":[174],"(95.8%)":[175],"HMDB-51":[177],"(71.5%).":[178]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":13},{"year":2024,"cited_by_count":10},{"year":2023,"cited_by_count":15},{"year":2022,"cited_by_count":20},{"year":2021,"cited_by_count":16},{"year":2020,"cited_by_count":3}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
