{"id":"https://openalex.org/W4283390251","doi":"https://doi.org/10.1007/s00530-022-00961-3","title":"Multi-head attention-based two-stream EfficientNet for action recognition","display_name":"Multi-head attention-based two-stream EfficientNet for action recognition","publication_year":2022,"publication_date":"2022-06-24","ids":{"openalex":"https://openalex.org/W4283390251","doi":"https://doi.org/10.1007/s00530-022-00961-3"},"language":"en","primary_location":{"id":"doi:10.1007/s00530-022-00961-3","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s00530-022-00961-3","pdf_url":"https://link.springer.com/content/pdf/10.1007/s00530-022-00961-3.pdf","source":{"id":"https://openalex.org/S112262039","display_name":"Multimedia Systems","issn_l":"0942-4962","issn":["0942-4962","1432-1882"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Multimedia Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/s00530-022-00961-3.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101131416","display_name":"Aihua Zhou","orcid":null},"institutions":[{"id":"https://openalex.org/I17442442","display_name":"State Grid Corporation of China (China)","ror":"https://ror.org/05twwhs70","country_code":"CN","type":"company","lineage":["https://openalex.org/I17442442"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Aihua Zhou","raw_affiliation_strings":["State Grid Key Laboratory of Information and Network Security, Nanjing, China","State Grid Smart Grid Research Institute CO., LTD, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"State Grid Key Laboratory of Information and Network Security, Nanjing, China","institution_ids":[]},{"raw_affiliation_string":"State Grid Smart Grid Research Institute CO., LTD, Beijing, China","institution_ids":["https://openalex.org/I17442442"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035467487","display_name":"Yujun Ma","orcid":"https://orcid.org/0000-0002-8014-0067"},"institutions":[{"id":"https://openalex.org/I51158804","display_name":"Massey University","ror":"https://ror.org/052czxv31","country_code":"NZ","type":"education","lineage":["https://openalex.org/I51158804"]}],"countries":["NZ"],"is_corresponding":true,"raw_author_name":"Yujun Ma","raw_affiliation_strings":["School of Mathematical and Computational Sciences, Massey University, Auckland, New Zealand"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Mathematical and Computational Sciences, Massey University, Auckland, New Zealand","institution_ids":["https://openalex.org/I51158804"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070396907","display_name":"Wanting Ji","orcid":"https://orcid.org/0000-0003-2406-3156"},"institutions":[{"id":"https://openalex.org/I118803816","display_name":"Liaoning University","ror":"https://ror.org/03xpwj629","country_code":"CN","type":"education","lineage":["https://openalex.org/I118803816"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wanting Ji","raw_affiliation_strings":["School of Information, Liaoning University, Shenyang, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Information, Liaoning University, Shenyang, China","institution_ids":["https://openalex.org/I118803816"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101835777","display_name":"Ming Zong","orcid":"https://orcid.org/0000-0001-5425-6667"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ming Zong","raw_affiliation_strings":["National Engineering Research Center for Software Engineering, Peking University, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National Engineering Research Center for Software Engineering, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019594660","display_name":"Pei Yang","orcid":"https://orcid.org/0000-0001-8926-9695"},"institutions":[{"id":"https://openalex.org/I17442442","display_name":"State Grid Corporation of China (China)","ror":"https://ror.org/05twwhs70","country_code":"CN","type":"company","lineage":["https://openalex.org/I17442442"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Pei Yang","raw_affiliation_strings":["State Grid Key Laboratory of Information and Network Security, Nanjing, China","State Grid Smart Grid Research Institute CO., LTD, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"State Grid Key Laboratory of Information and Network Security, Nanjing, China","institution_ids":[]},{"raw_affiliation_string":"State Grid Smart Grid Research Institute CO., LTD, Beijing, China","institution_ids":["https://openalex.org/I17442442"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101860728","display_name":"Min Wu","orcid":"https://orcid.org/0009-0007-8206-3855"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Min Wu","raw_affiliation_strings":["Bejing Institute of Computer Technology and Applications, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Bejing Institute of Computer Technology and Applications, Beijing, China","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100674094","display_name":"Mingzhe Liu","orcid":"https://orcid.org/0000-0001-7054-997X"},"institutions":[{"id":"https://openalex.org/I31595395","display_name":"Chengdu University of Technology","ror":"https://ror.org/05pejbw21","country_code":"CN","type":"education","lineage":["https://openalex.org/I31595395"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mingzhe Liu","raw_affiliation_strings":["State Key Laboratory of Geohazard Prevention and Geo-Environment Protection, Chengdu University of Technology, Chengdu, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Geohazard Prevention and Geo-Environment Protection, Chengdu University of Technology, Chengdu, China","institution_ids":["https://openalex.org/I31595395"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5035467487"],"corresponding_institution_ids":["https://openalex.org/I51158804"],"apc_list":null,"apc_paid":null,"fwci":4.6694,"has_fulltext":true,"cited_by_count":55,"citation_normalized_percentile":{"value":0.96068491,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":"29","issue":"2","first_page":"487","last_page":"498"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11398","display_name":"Hand Gesture Recognition Systems","score":0.9955999851226807,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12740","display_name":"Gait Recognition and Analysis","score":0.9948999881744385,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8407350778579712},{"id":"https://openalex.org/keywords/softmax-function","display_name":"Softmax function","score":0.6944032311439514},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5706269145011902},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.5643336772918701},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.5513795614242554},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5374771356582642},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.5213157534599304},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4707256853580475},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.45461782813072205}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8407350778579712},{"id":"https://openalex.org/C188441871","wikidata":"https://www.wikidata.org/wiki/Q7554146","display_name":"Softmax function","level":3,"score":0.6944032311439514},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5706269145011902},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.5643336772918701},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.5513795614242554},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5374771356582642},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.5213157534599304},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4707256853580475},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.45461782813072205},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/s00530-022-00961-3","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s00530-022-00961-3","pdf_url":"https://link.springer.com/content/pdf/10.1007/s00530-022-00961-3.pdf","source":{"id":"https://openalex.org/S112262039","display_name":"Multimedia Systems","issn_l":"0942-4962","issn":["0942-4962","1432-1882"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Multimedia Systems","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1007/s00530-022-00961-3","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s00530-022-00961-3","pdf_url":"https://link.springer.com/content/pdf/10.1007/s00530-022-00961-3.pdf","source":{"id":"https://openalex.org/S112262039","display_name":"Multimedia Systems","issn_l":"0942-4962","issn":["0942-4962","1432-1882"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Multimedia Systems","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320320816","display_name":"Massey University","ror":"https://ror.org/052czxv31"},{"id":"https://openalex.org/F4320326707","display_name":"State Grid Corporation of China","ror":"https://ror.org/05twwhs70"},{"id":"https://openalex.org/F4320335967","display_name":"Science and Technology Project of State Grid","ror":null}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4283390251.pdf","grobid_xml":"https://content.openalex.org/works/W4283390251.grobid-xml"},"referenced_works_count":59,"referenced_works":["https://openalex.org/W1514535095","https://openalex.org/W1522734439","https://openalex.org/W1944615693","https://openalex.org/W1947481528","https://openalex.org/W1981781955","https://openalex.org/W1983364832","https://openalex.org/W2021829585","https://openalex.org/W2105101328","https://openalex.org/W2108598243","https://openalex.org/W2126579184","https://openalex.org/W2194775991","https://openalex.org/W2235034809","https://openalex.org/W2267186426","https://openalex.org/W2342662179","https://openalex.org/W2507009361","https://openalex.org/W2743317799","https://openalex.org/W2770446450","https://openalex.org/W2892189026","https://openalex.org/W2909973745","https://openalex.org/W2946820375","https://openalex.org/W2946948417","https://openalex.org/W2951454267","https://openalex.org/W2962899219","https://openalex.org/W2963163009","https://openalex.org/W2963218601","https://openalex.org/W2963465031","https://openalex.org/W2963524571","https://openalex.org/W2963563276","https://openalex.org/W2963645879","https://openalex.org/W2963731876","https://openalex.org/W2963820951","https://openalex.org/W2963886665","https://openalex.org/W2964191259","https://openalex.org/W2965521953","https://openalex.org/W2990541775","https://openalex.org/W2996298259","https://openalex.org/W2998384080","https://openalex.org/W2999794487","https://openalex.org/W3013853001","https://openalex.org/W3022398175","https://openalex.org/W3035526303","https://openalex.org/W3036066034","https://openalex.org/W3042064084","https://openalex.org/W3045856199","https://openalex.org/W3047725879","https://openalex.org/W3081260473","https://openalex.org/W3082283937","https://openalex.org/W3090628358","https://openalex.org/W3107664750","https://openalex.org/W3115205610","https://openalex.org/W3119627071","https://openalex.org/W3128936536","https://openalex.org/W3173621652","https://openalex.org/W3185888983","https://openalex.org/W3185917994","https://openalex.org/W4200621741","https://openalex.org/W4210900105","https://openalex.org/W4214516465","https://openalex.org/W4312775149"],"related_works":["https://openalex.org/W3107204728","https://openalex.org/W4287591324","https://openalex.org/W4226420367","https://openalex.org/W2980176872","https://openalex.org/W2962876041","https://openalex.org/W3090555870","https://openalex.org/W3108503355","https://openalex.org/W2899027234","https://openalex.org/W3095506574","https://openalex.org/W3190449293"],"abstract_inverted_index":{"Abstract":[0],"Recent":[1],"years":[2],"have":[3],"witnessed":[4],"the":[5,60,84,103,108,113,128,142,151,163,167,177],"popularity":[6],"of":[7,27,59,64,70,131],"using":[8,93],"two-stream":[9,18],"convolutional":[10,19],"neural":[11,20],"networks":[12],"for":[13,52,183],"action":[14,22,53,110,144,184],"recognition.":[15,185],"However,":[16],"existing":[17],"network-based":[21],"recognition":[23],"approaches":[24,182],"are":[25],"incapable":[26],"distinguishing":[28],"some":[29],"roughly":[30],"similar":[31,159],"actions":[32],"in":[33,155],"videos":[34],"such":[35],"as":[36],"sneezing":[37],"and":[38,77,86,133,149,170],"yawning.":[39],"To":[40],"solve":[41],"this":[42],"problem,":[43],"we":[44],"propose":[45],"a":[46,74,78,96,122],"Multi-head":[47],"Attention-based":[48],"Two-stream":[49],"EfficientNet":[50],"(MAT-EffNet)":[51],"recognition,":[54],"which":[55,81,126],"can":[56,139],"take":[57],"advantage":[58],"efficient":[61],"feature":[62],"extraction":[63],"EfficientNet.":[65,94],"The":[66,116,136],"proposed":[67,137,164],"network":[68,165],"consists":[69],"two":[71,104],"streams":[72,105],"(i.e.,":[73],"spatial":[75,85,132],"stream":[76],"temporal":[79,87,134],"stream),":[80],"first":[82],"extract":[83],"features":[88],"from":[89,112],"consecutive":[90],"frames":[91,148],"by":[92],"Then,":[95],"multi-head":[97],"attention":[98,152],"mechanism":[99],"is":[100,119],"utilized":[101],"on":[102,141,166],"to":[106,157],"capture":[107],"key":[109,143],"information":[111,145],"extracted":[114],"features.":[115],"final":[117],"prediction":[118],"obtained":[120],"via":[121],"late":[123],"average":[124],"fusion,":[125],"averages":[127],"softmax":[129],"score":[130],"streams.":[135],"MAT-EffNet":[138,178],"focus":[140],"at":[146],"different":[147],"compute":[150],"multiple":[153],"times,":[154],"parallel,":[156],"distinguish":[158],"actions.":[160],"We":[161],"test":[162],"UCF101,":[168],"HMDB51":[169],"Kinetics-400":[171],"datasets.":[172],"Experimental":[173],"results":[174],"show":[175],"that":[176],"outperforms":[179],"other":[180],"state-of-the-art":[181]},"counts_by_year":[{"year":2026,"cited_by_count":9},{"year":2025,"cited_by_count":18},{"year":2024,"cited_by_count":20},{"year":2023,"cited_by_count":8}],"updated_date":"2026-06-02T09:04:35.204637","created_date":"2025-10-10T00:00:00"}
