{"id":"https://openalex.org/W3098155805","doi":"https://doi.org/10.3233/faia200754","title":"Hierarchy Spatial-Temporal Transformer for Action Recognition in Short Videos","display_name":"Hierarchy Spatial-Temporal Transformer for Action Recognition in Short Videos","publication_year":2020,"publication_date":"2020-11-09","ids":{"openalex":"https://openalex.org/W3098155805","doi":"https://doi.org/10.3233/faia200754","mag":"3098155805"},"language":"en","primary_location":{"id":"doi:10.3233/faia200754","is_oa":true,"landing_page_url":"https://doi.org/10.3233/faia200754","pdf_url":"https://ebooks.iospress.nl/pdf/doi/10.3233/FAIA200754","source":{"id":"https://openalex.org/S4210201731","display_name":"Frontiers in artificial intelligence and applications","issn_l":"0922-6389","issn":["0922-6389","1879-8314"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Artificial Intelligence and Applications","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://ebooks.iospress.nl/pdf/doi/10.3233/FAIA200754","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5029118616","display_name":"Guoyong Cai","orcid":"https://orcid.org/0000-0002-5705-1189"},"institutions":[{"id":"https://openalex.org/I5343935","display_name":"Guilin University of Electronic Technology","ror":"https://ror.org/05arjae42","country_code":"CN","type":"education","lineage":["https://openalex.org/I5343935"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Guoyong Cai","raw_affiliation_strings":["GuangXi Key Laboratory of Trusted Software, Guilin University of Electronic Technology, Guilin, China"],"affiliations":[{"raw_affiliation_string":"GuangXi Key Laboratory of Trusted Software, Guilin University of Electronic Technology, Guilin, China","institution_ids":["https://openalex.org/I5343935"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5085652260","display_name":"Yumeng Cai","orcid":null},"institutions":[{"id":"https://openalex.org/I5343935","display_name":"Guilin University of Electronic Technology","ror":"https://ror.org/05arjae42","country_code":"CN","type":"education","lineage":["https://openalex.org/I5343935"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yumeng Cai","raw_affiliation_strings":["GuangXi Key Laboratory of Trusted Software, Guilin University of Electronic Technology, Guilin, China"],"affiliations":[{"raw_affiliation_string":"GuangXi Key Laboratory of Trusted Software, Guilin University of Electronic Technology, Guilin, China","institution_ids":["https://openalex.org/I5343935"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5029118616"],"corresponding_institution_ids":["https://openalex.org/I5343935"],"apc_list":null,"apc_paid":null,"fwci":0.1235,"has_fulltext":true,"cited_by_count":2,"citation_normalized_percentile":{"value":0.53316617,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":95},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9810000061988831,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13647","display_name":"AI and Big Data Applications","score":0.9743000268936157,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7275214195251465},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6763775944709778},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.6128503680229187},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5215256810188293},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.4979884624481201},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.47009584307670593},{"id":"https://openalex.org/keywords/feature-learning","display_name":"Feature learning","score":0.41419267654418945},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.08103376626968384}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7275214195251465},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6763775944709778},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.6128503680229187},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5215256810188293},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.4979884624481201},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.47009584307670593},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.41419267654418945},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.08103376626968384},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.3233/faia200754","is_oa":true,"landing_page_url":"https://doi.org/10.3233/faia200754","pdf_url":"https://ebooks.iospress.nl/pdf/doi/10.3233/FAIA200754","source":{"id":"https://openalex.org/S4210201731","display_name":"Frontiers in artificial intelligence and applications","issn_l":"0922-6389","issn":["0922-6389","1879-8314"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Artificial Intelligence and Applications","raw_type":"book-chapter"}],"best_oa_location":{"id":"doi:10.3233/faia200754","is_oa":true,"landing_page_url":"https://doi.org/10.3233/faia200754","pdf_url":"https://ebooks.iospress.nl/pdf/doi/10.3233/FAIA200754","source":{"id":"https://openalex.org/S4210201731","display_name":"Frontiers in artificial intelligence and applications","issn_l":"0922-6389","issn":["0922-6389","1879-8314"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Artificial Intelligence and Applications","raw_type":"book-chapter"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3098155805.pdf","grobid_xml":"https://content.openalex.org/works/W3098155805.grobid-xml"},"referenced_works_count":39,"referenced_works":["https://openalex.org/W28988658","https://openalex.org/W1522734439","https://openalex.org/W1686810756","https://openalex.org/W1983364832","https://openalex.org/W2016053056","https://openalex.org/W2097117768","https://openalex.org/W2126579184","https://openalex.org/W2194775991","https://openalex.org/W2394849137","https://openalex.org/W2593722617","https://openalex.org/W2597958930","https://openalex.org/W2604730366","https://openalex.org/W2619082050","https://openalex.org/W2724359148","https://openalex.org/W2761659801","https://openalex.org/W2770465006","https://openalex.org/W2770565591","https://openalex.org/W2772114784","https://openalex.org/W2779380177","https://openalex.org/W2799176631","https://openalex.org/W2922509574","https://openalex.org/W2962934715","https://openalex.org/W2963091558","https://openalex.org/W2963125010","https://openalex.org/W2963155035","https://openalex.org/W2963247196","https://openalex.org/W2963524571","https://openalex.org/W2963645879","https://openalex.org/W2963820951","https://openalex.org/W2964084343","https://openalex.org/W2964214371","https://openalex.org/W3095433202","https://openalex.org/W4237044863","https://openalex.org/W4385245566","https://openalex.org/W6674914833","https://openalex.org/W6687483927","https://openalex.org/W6739901393","https://openalex.org/W6746034047","https://openalex.org/W6760640297"],"related_works":["https://openalex.org/W2055243143","https://openalex.org/W4206178588","https://openalex.org/W4287635093","https://openalex.org/W3094491777","https://openalex.org/W3214715529","https://openalex.org/W4386159726","https://openalex.org/W2905271011","https://openalex.org/W3164948662","https://openalex.org/W4289536128","https://openalex.org/W3153597579"],"abstract_inverted_index":{"Short":[0],"videos":[1],"action":[2],"recognition":[3],"based":[4,21,77],"on":[5,22,78],"deep":[6],"learning":[7,120],"has":[8,36],"made":[9],"a":[10,37,56,112,147],"series":[11],"of":[12,16,40,66],"important":[13],"progress;":[14],"most":[15],"the":[17,64,103,133,156,164,171],"proposed":[18,165],"methods":[19],"are":[20],"3D":[23,34],"Convolution":[24],"neural":[25],"networks":[26,45],"(3D":[27],"CNN)":[28],"and":[29,42,62,82,98,158],"Two":[30,43,79],"Stream":[31,44,80],"architecture.":[32],"However,":[33],"CNN":[35],"large":[38],"number":[39],"parameters":[41],"cannot":[46],"learn":[47,59],"features":[48,61],"well":[49],"enough.":[50],"This":[51],"work":[52],"aims":[53],"to":[54,58,126,145],"build":[55],"network":[57],"better":[60,168],"reduce":[63],"scale":[65],"parameters.":[67],"A":[68],"Hierarchy":[69,92],"Spatial-Temporal":[70],"Transformer":[71],"model":[72,86,166],"is":[73,76,87,108,121,139],"proposed,":[74],"which":[75],"architecture":[81],"hierarchy":[83],"inference.":[84],"The":[85],"divided":[88],"into":[89,111],"three":[90],"modules:":[91],"Residual":[93],"Reformer,":[94],"Spatial":[95],"Attention":[96,100],"Module,":[97],"Temporal-Spatial":[99],"Module.":[101],"In":[102],"model,":[104],"each":[105],"frame\u2019s":[106],"image":[107],"firstly":[109],"transformed":[110],"spatial":[113,118,124,129,136],"visual":[114],"feature":[115,119,130,137,143],"map.":[116],"Secondly,":[117],"performed":[122],"by":[123],"attention":[125,128,135],"generating":[127],"maps.":[131],"Finally,":[132],"generated":[134],"map":[138],"incorporated":[140],"with":[141],"temporal":[142],"vectors":[144],"generate":[146],"final":[148],"representation":[149],"for":[150],"classification":[151],"experiments.":[152],"Experiment":[153],"results":[154],"in":[155],"hmdb51":[157],"ucf101":[159],"data":[160],"set":[161],"showed":[162],"that":[163],"achieved":[167],"accuracy":[169],"than":[170],"state-of-art":[172],"baseline":[173],"models":[174]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2021,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
