{"id":"https://openalex.org/W2970564558","doi":"https://doi.org/10.1109/icip.2019.8803586","title":"Spatial Temporal Attentional Glimpse for Human Activity Classification in Video","display_name":"Spatial Temporal Attentional Glimpse for Human Activity Classification in Video","publication_year":2019,"publication_date":"2019-08-26","ids":{"openalex":"https://openalex.org/W2970564558","doi":"https://doi.org/10.1109/icip.2019.8803586","mag":"2970564558"},"language":"en","primary_location":{"id":"doi:10.1109/icip.2019.8803586","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icip.2019.8803586","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE International Conference on Image Processing (ICIP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5053389316","display_name":"Jiangtao Kong","orcid":null},"institutions":[{"id":"https://openalex.org/I37796252","display_name":"Beijing University of Technology","ror":"https://ror.org/037b1pp87","country_code":"CN","type":"education","lineage":["https://openalex.org/I37796252"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jiangtao Kong","raw_affiliation_strings":["Beijing University of Technology"],"affiliations":[{"raw_affiliation_string":"Beijing University of Technology","institution_ids":["https://openalex.org/I37796252"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082235101","display_name":"Rongchao Xu","orcid":"https://orcid.org/0000-0002-1542-5162"},"institutions":[{"id":"https://openalex.org/I37796252","display_name":"Beijing University of Technology","ror":"https://ror.org/037b1pp87","country_code":"CN","type":"education","lineage":["https://openalex.org/I37796252"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Rongchao Xu","raw_affiliation_strings":["Beijing University of Technology"],"affiliations":[{"raw_affiliation_string":"Beijing University of Technology","institution_ids":["https://openalex.org/I37796252"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076090670","display_name":"Junliang Xing","orcid":"https://orcid.org/0000-0001-6801-0510"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Junliang Xing","raw_affiliation_strings":["Institute of Automation, Chinese Academy of Sciences"],"affiliations":[{"raw_affiliation_string":"Institute of Automation, Chinese Academy of Sciences","institution_ids":["https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100399953","display_name":"Kai Li","orcid":"https://orcid.org/0000-0002-9027-0914"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kai Li","raw_affiliation_strings":["Institute of Automation, Chinese Academy of Sciences"],"affiliations":[{"raw_affiliation_string":"Institute of Automation, Chinese Academy of Sciences","institution_ids":["https://openalex.org/I19820366"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100392071","display_name":"W. F. Mader","orcid":"https://orcid.org/0000-0002-7344-998X"},"institutions":[{"id":"https://openalex.org/I37796252","display_name":"Beijing University of Technology","ror":"https://ror.org/037b1pp87","country_code":"CN","type":"education","lineage":["https://openalex.org/I37796252"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Ma","raw_affiliation_strings":["Beijing University of Technology"],"affiliations":[{"raw_affiliation_string":"Beijing University of Technology","institution_ids":["https://openalex.org/I37796252"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5053389316"],"corresponding_institution_ids":["https://openalex.org/I37796252"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.08432369,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"7","issue":null,"first_page":"4040","last_page":"4044"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9955000281333923,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9943000078201294,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8053982257843018},{"id":"https://openalex.org/keywords/pooling","display_name":"Pooling","score":0.7856314182281494},{"id":"https://openalex.org/keywords/block","display_name":"Block (permutation group theory)","score":0.6848978996276855},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6226860880851746},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.4936445951461792},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.44986841082572937},{"id":"https://openalex.org/keywords/tensor","display_name":"Tensor (intrinsic definition)","score":0.43804579973220825},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.4164232611656189},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3904265761375427},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.1701982319355011},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.06945738196372986}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8053982257843018},{"id":"https://openalex.org/C70437156","wikidata":"https://www.wikidata.org/wiki/Q7228652","display_name":"Pooling","level":2,"score":0.7856314182281494},{"id":"https://openalex.org/C2777210771","wikidata":"https://www.wikidata.org/wiki/Q4927124","display_name":"Block (permutation group theory)","level":2,"score":0.6848978996276855},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6226860880851746},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.4936445951461792},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.44986841082572937},{"id":"https://openalex.org/C155281189","wikidata":"https://www.wikidata.org/wiki/Q3518150","display_name":"Tensor (intrinsic definition)","level":2,"score":0.43804579973220825},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.4164232611656189},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3904265761375427},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.1701982319355011},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.06945738196372986},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icip.2019.8803586","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icip.2019.8803586","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE International Conference on Image Processing (ICIP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Sustainable cities and communities","id":"https://metadata.un.org/sdg/11","score":0.4099999964237213}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W1522734439","https://openalex.org/W1600744878","https://openalex.org/W1799366690","https://openalex.org/W1836465849","https://openalex.org/W1980287119","https://openalex.org/W2002096058","https://openalex.org/W2072566913","https://openalex.org/W2097073572","https://openalex.org/W2144513243","https://openalex.org/W2156303437","https://openalex.org/W2162897826","https://openalex.org/W2194775991","https://openalex.org/W2619947201","https://openalex.org/W2752782242","https://openalex.org/W2949117887","https://openalex.org/W2963091558","https://openalex.org/W2963403868","https://openalex.org/W2963524571","https://openalex.org/W4385245566","https://openalex.org/W6638444622","https://openalex.org/W6638667902","https://openalex.org/W6681151457","https://openalex.org/W6682864246","https://openalex.org/W6739901393","https://openalex.org/W6743731764","https://openalex.org/W6955071965"],"related_works":["https://openalex.org/W2953234277","https://openalex.org/W2626256601","https://openalex.org/W147410782","https://openalex.org/W2900413183","https://openalex.org/W4390975304","https://openalex.org/W3022252430","https://openalex.org/W4287804464","https://openalex.org/W3103989898","https://openalex.org/W3211292372","https://openalex.org/W2810679507"],"abstract_inverted_index":{"Recently,":[0],"the":[1,7,11,29,44,69,93,132,137,140,143,146,150],"Convolutional":[2],"Networks":[3],"(ConvNet)":[4],"has":[5],"become":[6],"dominated":[8],"approach":[9],"to":[10,64,71,114,125,157],"human":[12],"activity":[13],"classification":[14],"problem.":[15,163],"We":[16,120],"investigate":[17],"current":[18],"standard":[19],"ConvNet":[20],"architectures":[21],"and":[22,101,116,149],"pinpoint":[23],"one":[24],"of":[25],"their":[26,104],"main":[27],"limitations:":[28],"spatial-temporal":[30,48,85],"dependency":[31],"is":[32,75,80,111],"simply":[33],"captured":[34],"by":[35,83],"global":[36],"pooling":[37],"operation,":[38],"which":[39,79],"may":[40],"not":[41],"well":[42],"capture":[43],"complex":[45],"long":[46],"term":[47],"relationships":[49],"in":[50,118],"videos.":[51],"For":[52],"this":[53,66,72,162],"work,":[54],"we":[55],"propose":[56],"a":[57,76,84],"Spatial":[58,88],"Temporal":[59,89],"Attentional":[60],"Glimpse":[61,90],"(STAG)":[62],"module":[63,74,110],"overcome":[65],"shortcoming.":[67],"Specifically,":[68],"input":[70],"STAG":[73,109,133],"3D":[77],"tensor":[78,95],"first":[81],"processed":[82],"attention":[86],"block.":[87],"block":[91,134],"decomposes":[92],"resulting":[94],"into":[96],"two":[97],"low":[98],"dimensional":[99],"tensors":[100],"then":[102],"fuses":[103],"operation":[105],"results.":[106],"The":[107],"proposed":[108],"pluggable,":[112],"easy":[113],"learn,":[115],"effective":[117],"computation.":[119],"conduct":[121],"extended":[122],"ablation":[123],"studies":[124,160],"show":[126],"that":[127],"our":[128],"model":[129],"incorporated":[130],"with":[131],"substantially":[135],"improves":[136],"performance":[138],"over":[139],"state-of-the-art.":[141],"All":[142],"experimental":[144],"results,":[145],"trained":[147],"models,":[148],"complete":[151],"source":[152],"codes":[153],"will":[154],"be":[155],"released":[156],"facilitate":[158],"further":[159],"on":[161]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
