{"id":"https://openalex.org/W4401991044","doi":"https://doi.org/10.1109/icmew63481.2024.10645423","title":"A Survey on Backbones for Deep Video Action Recognition","display_name":"A Survey on Backbones for Deep Video Action Recognition","publication_year":2024,"publication_date":"2024-07-15","ids":{"openalex":"https://openalex.org/W4401991044","doi":"https://doi.org/10.1109/icmew63481.2024.10645423"},"language":"en","primary_location":{"id":"doi:10.1109/icmew63481.2024.10645423","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icmew63481.2024.10645423","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Multimedia and Expo Workshops (ICMEW)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101410184","display_name":"Zixuan Tang","orcid":"https://orcid.org/0000-0002-7394-8666"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zixuan Tang","raw_affiliation_strings":["School of Intelligent Systems Engineering, Sun Yat-sen University,Shenzhen,China,518107"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Intelligent Systems Engineering, Sun Yat-sen University,Shenzhen,China,518107","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039534380","display_name":"Youjun Zhao","orcid":"https://orcid.org/0009-0002-6507-1099"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Youjun Zhao","raw_affiliation_strings":["School of Intelligent Systems Engineering, Sun Yat-sen University,Shenzhen,China,518107"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Intelligent Systems Engineering, Sun Yat-sen University,Shenzhen,China,518107","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074489530","display_name":"Yuhang Wen","orcid":"https://orcid.org/0000-0001-6644-4075"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuhang Wen","raw_affiliation_strings":["School of Intelligent Systems Engineering, Sun Yat-sen University,Shenzhen,China,518107"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Intelligent Systems Engineering, Sun Yat-sen University,Shenzhen,China,518107","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5103181239","display_name":"Meng\u2010Yuan Liu","orcid":"https://orcid.org/0000-0001-6100-8741"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mengyuan Liu","raw_affiliation_strings":["Peking University, Shenzhen Graduate School,National Key Laboratory of General Artificial Intelligence,Shenzhen,China,518055"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Peking University, Shenzhen Graduate School,National Key Laboratory of General Artificial Intelligence,Shenzhen,China,518055","institution_ids":["https://openalex.org/I20231570"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5101410184"],"corresponding_institution_ids":["https://openalex.org/I157773358"],"apc_list":null,"apc_paid":null,"fwci":0.9304,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.75862069,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9973000288009644,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/action-recognition","display_name":"Action recognition","score":0.69378262758255},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6804965734481812},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.47983404994010925},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4701291024684906},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3651975393295288}],"concepts":[{"id":"https://openalex.org/C2987834672","wikidata":"https://www.wikidata.org/wiki/Q4677630","display_name":"Action recognition","level":3,"score":0.69378262758255},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6804965734481812},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.47983404994010925},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4701291024684906},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3651975393295288},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icmew63481.2024.10645423","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icmew63481.2024.10645423","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Multimedia and Expo Workshops (ICMEW)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Gender equality","id":"https://metadata.un.org/sdg/5","score":0.5799999833106995}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":49,"referenced_works":["https://openalex.org/W874179280","https://openalex.org/W1522734439","https://openalex.org/W1744759976","https://openalex.org/W1944615693","https://openalex.org/W1983364832","https://openalex.org/W2016053056","https://openalex.org/W2126579184","https://openalex.org/W2156303437","https://openalex.org/W2312646659","https://openalex.org/W2507009361","https://openalex.org/W2556024076","https://openalex.org/W2580899942","https://openalex.org/W2608988379","https://openalex.org/W2619947201","https://openalex.org/W2625366777","https://openalex.org/W2883429621","https://openalex.org/W2904122085","https://openalex.org/W2962934715","https://openalex.org/W2963091558","https://openalex.org/W2963155035","https://openalex.org/W2963524571","https://openalex.org/W2963820951","https://openalex.org/W2990152177","https://openalex.org/W2990503944","https://openalex.org/W3034572008","https://openalex.org/W3126721948","https://openalex.org/W3137120824","https://openalex.org/W3138516171","https://openalex.org/W3170860705","https://openalex.org/W3210279979","https://openalex.org/W4211092666","https://openalex.org/W4214612132","https://openalex.org/W4214614183","https://openalex.org/W4236965008","https://openalex.org/W4246193833","https://openalex.org/W4287122452","https://openalex.org/W4310921506","https://openalex.org/W4312560592","https://openalex.org/W4312658081","https://openalex.org/W4312772544","https://openalex.org/W4386057769","https://openalex.org/W4386076625","https://openalex.org/W4389116311","https://openalex.org/W6682864246","https://openalex.org/W6750211549","https://openalex.org/W6790307280","https://openalex.org/W6797206543","https://openalex.org/W6797263693","https://openalex.org/W6853398349"],"related_works":["https://openalex.org/W2772917594","https://openalex.org/W2036807459","https://openalex.org/W2058170566","https://openalex.org/W2755342338","https://openalex.org/W2166024367","https://openalex.org/W3116076068","https://openalex.org/W2229312674","https://openalex.org/W2951359407","https://openalex.org/W2079911747","https://openalex.org/W1969923398"],"abstract_inverted_index":{"Action":[0],"recognition":[1,20,52],"is":[2,106],"a":[3,137],"key":[4],"technology":[5],"in":[6,18,63,74,94,131],"building":[7],"interactive":[8],"metaverses.":[9],"With":[10],"the":[11,30,39,115],"rapid":[12],"development":[13],"of":[14,41,97],"deep":[15,56],"learning,":[16],"methods":[17,42,53,62],"action":[19,51],"have":[21],"also":[22],"achieved":[23],"great":[24],"advancement.":[25],"Researchers":[26],"design":[27],"and":[28,43,69,81,124,134],"implement":[29],"backbones":[31],"referring":[32],"to":[33,38],"multiple":[34],"standpoints,":[35],"which":[36,91,113],"leads":[37],"diversity":[40],"encountering":[44],"new":[45],"challenges.":[46],"This":[47],"paper":[48],"reviews":[49],"several":[50],"based":[54],"on":[55],"neural":[57],"networks.":[58],"We":[59,127],"introduce":[60,114],"these":[61],"three":[64],"parts:":[65],"1)":[66],"Two-Streams":[67],"networks":[68],"their":[70],"variants,":[71],"which,":[72],"specifically":[73],"this":[75,132],"paper,":[76],"use":[77],"RGB":[78,98],"video":[79,125],"frame":[80],"optical":[82],"flow":[83],"modality":[84,99],"as":[85],"input;":[86],"2)":[87],"3D":[88],"convolutional":[89],"networks,":[90],"make":[92],"efforts":[93],"taking":[95],"advantage":[96],"directly":[100],"while":[101],"extracting":[102],"different":[103],"motion":[104],"information":[105],"no":[107],"longer":[108],"necessary;":[109],"3)":[110],"Transformer-based":[111],"methods,":[112],"model":[116],"from":[117],"natural":[118],"language":[119],"processing":[120],"into":[121],"computer":[122],"vision":[123],"understanding.":[126],"offer":[128],"objective":[129],"sights":[130],"review":[133],"hopefully":[135],"provide":[136],"reference":[138],"for":[139],"future":[140],"research.":[141]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":1}],"updated_date":"2026-05-05T08:41:31.759640","created_date":"2025-10-10T00:00:00"}
