{"id":"https://openalex.org/W3045186380","doi":"https://doi.org/10.1109/tpami.2021.3076522","title":"Depthwise Spatio-Temporal STFT Convolutional Neural Networks for Human Action Recognition","display_name":"Depthwise Spatio-Temporal STFT Convolutional Neural Networks for Human Action Recognition","publication_year":2021,"publication_date":"2021-01-01","ids":{"openalex":"https://openalex.org/W3045186380","doi":"https://doi.org/10.1109/tpami.2021.3076522","mag":"3045186380","pmid":"https://pubmed.ncbi.nlm.nih.gov/33914681"},"language":"en","primary_location":{"id":"doi:10.1109/tpami.2021.3076522","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2021.3076522","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},"type":"preprint","indexed_in":["crossref","datacite","pubmed"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://export.arxiv.org/pdf/2007.11365","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5061474465","display_name":"Sudhakar Kumawat","orcid":"https://orcid.org/0000-0002-6057-2276"},"institutions":[{"id":"https://openalex.org/I98285908","display_name":"Osaka University","ror":"https://ror.org/035t8zc32","country_code":"JP","type":"education","lineage":["https://openalex.org/I98285908"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Sudhakar Kumawat","raw_affiliation_strings":["Institute for Datability Science, Osaka University, 13013 Suita, Osaka, Japan, (e-mail: sudhakar.bm07@gmail.com)","[Institute for Datability Science, Osaka University, 13013 Suita, Osaka, Japan, (e-mail: sudhakar.bm07@gmail.com)]"],"affiliations":[{"raw_affiliation_string":"Institute for Datability Science, Osaka University, 13013 Suita, Osaka, Japan, (e-mail: sudhakar.bm07@gmail.com)","institution_ids":["https://openalex.org/I98285908"]},{"raw_affiliation_string":"[Institute for Datability Science, Osaka University, 13013 Suita, Osaka, Japan, (e-mail: sudhakar.bm07@gmail.com)]","institution_ids":["https://openalex.org/I98285908"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101503357","display_name":"Manisha Verma","orcid":"https://orcid.org/0000-0002-5202-4325"},"institutions":[{"id":"https://openalex.org/I98285908","display_name":"Osaka University","ror":"https://ror.org/035t8zc32","country_code":"JP","type":"education","lineage":["https://openalex.org/I98285908"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Manisha Verma","raw_affiliation_strings":["Institute for Datability Science, Osaka University, 13013 Suita, Osaka, Japan, (e-mail: mverma@ids.osaka-u.ac.jp)","[Institute for Datability Science, Osaka University, 13013 Suita, Osaka, Japan, (e-mail: mverma@ids.osaka-u.ac.jp)]"],"affiliations":[{"raw_affiliation_string":"Institute for Datability Science, Osaka University, 13013 Suita, Osaka, Japan, (e-mail: mverma@ids.osaka-u.ac.jp)","institution_ids":["https://openalex.org/I98285908"]},{"raw_affiliation_string":"[Institute for Datability Science, Osaka University, 13013 Suita, Osaka, Japan, (e-mail: mverma@ids.osaka-u.ac.jp)]","institution_ids":["https://openalex.org/I98285908"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065649079","display_name":"Yuta Nakashima","orcid":"https://orcid.org/0000-0001-8000-3567"},"institutions":[{"id":"https://openalex.org/I98285908","display_name":"Osaka University","ror":"https://ror.org/035t8zc32","country_code":"JP","type":"education","lineage":["https://openalex.org/I98285908"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Yuta Nakashima","raw_affiliation_strings":["Institute for Datability Science, Osaka University, 13013 Suita, Osaka, Japan, (e-mail: n-yuta@ids.osaka-u.ac.jp)"],"affiliations":[{"raw_affiliation_string":"Institute for Datability Science, Osaka University, 13013 Suita, Osaka, Japan, (e-mail: n-yuta@ids.osaka-u.ac.jp)","institution_ids":["https://openalex.org/I98285908"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5070142969","display_name":"Shanmuganathan Raman","orcid":"https://orcid.org/0000-0003-2718-7891"},"institutions":[{"id":"https://openalex.org/I27674431","display_name":"Indian Institute of Technology Gandhinagar","ror":"https://ror.org/0036p5w23","country_code":"IN","type":"education","lineage":["https://openalex.org/I27674431"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Shanmuganathan Raman","raw_affiliation_strings":["Electrical Engineering, Indian Institute of Technology Gandhinagar, 242275 Gandhinagar, Gujarat, India, 382355 (e-mail: shanmuga@iitgn.ac.in)"],"affiliations":[{"raw_affiliation_string":"Electrical Engineering, Indian Institute of Technology Gandhinagar, 242275 Gandhinagar, Gujarat, India, 382355 (e-mail: shanmuga@iitgn.ac.in)","institution_ids":["https://openalex.org/I27674431"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5061474465"],"corresponding_institution_ids":["https://openalex.org/I98285908"],"apc_list":null,"apc_paid":null,"fwci":0.51109739,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.62887371,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":"44","issue":"9","first_page":"1","last_page":"1"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11398","display_name":"Hand Gesture Recognition Systems","score":0.9958999752998352,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.7715198993682861},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7362276315689087},{"id":"https://openalex.org/keywords/short-time-fourier-transform","display_name":"Short-time Fourier transform","score":0.7222627401351929},{"id":"https://openalex.org/keywords/overfitting","display_name":"Overfitting","score":0.7042685747146606},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6975623965263367},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.6761324405670166},{"id":"https://openalex.org/keywords/kernel","display_name":"Kernel (algebra)","score":0.658297598361969},{"id":"https://openalex.org/keywords/convolution","display_name":"Convolution (computer science)","score":0.5838606357574463},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5184563994407654},{"id":"https://openalex.org/keywords/block","display_name":"Block (permutation group theory)","score":0.48639658093452454},{"id":"https://openalex.org/keywords/fourier-transform","display_name":"Fourier transform","score":0.42983508110046387},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.42376774549484253},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.19731876254081726},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1587125062942505},{"id":"https://openalex.org/keywords/fourier-analysis","display_name":"Fourier analysis","score":0.05892753601074219}],"concepts":[{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.7715198993682861},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7362276315689087},{"id":"https://openalex.org/C166386157","wikidata":"https://www.wikidata.org/wiki/Q1477735","display_name":"Short-time Fourier transform","level":4,"score":0.7222627401351929},{"id":"https://openalex.org/C22019652","wikidata":"https://www.wikidata.org/wiki/Q331309","display_name":"Overfitting","level":3,"score":0.7042685747146606},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6975623965263367},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.6761324405670166},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.658297598361969},{"id":"https://openalex.org/C45347329","wikidata":"https://www.wikidata.org/wiki/Q5166604","display_name":"Convolution (computer science)","level":3,"score":0.5838606357574463},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5184563994407654},{"id":"https://openalex.org/C2777210771","wikidata":"https://www.wikidata.org/wiki/Q4927124","display_name":"Block (permutation group theory)","level":2,"score":0.48639658093452454},{"id":"https://openalex.org/C102519508","wikidata":"https://www.wikidata.org/wiki/Q6520159","display_name":"Fourier transform","level":2,"score":0.42983508110046387},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.42376774549484253},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.19731876254081726},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1587125062942505},{"id":"https://openalex.org/C203024314","wikidata":"https://www.wikidata.org/wiki/Q1365258","display_name":"Fourier analysis","level":3,"score":0.05892753601074219},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D005583","descriptor_name":"Fourier Analysis","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006802","descriptor_name":"Human Activities","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D010363","descriptor_name":"Pattern Recognition, Automated","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D005583","descriptor_name":"Fourier Analysis","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006802","descriptor_name":"Human Activities","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D010363","descriptor_name":"Pattern Recognition, Automated","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D005583","descriptor_name":"Fourier Analysis","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006802","descriptor_name":"Human Activities","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D010363","descriptor_name":"Pattern Recognition, Automated","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true}],"locations_count":4,"locations":[{"id":"doi:10.1109/tpami.2021.3076522","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2021.3076522","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},{"id":"pmid:33914681","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/33914681","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on pattern analysis and machine intelligence","raw_type":null},{"id":"mag:3045186380","is_oa":true,"landing_page_url":"http://export.arxiv.org/pdf/2007.11365","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},{"id":"doi:10.48550/arxiv.2007.11365","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2007.11365","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article-journal"}],"best_oa_location":{"id":"mag:3045186380","is_oa":true,"landing_page_url":"http://export.arxiv.org/pdf/2007.11365","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":86,"referenced_works":["https://openalex.org/W24089286","https://openalex.org/W639708223","https://openalex.org/W1522734439","https://openalex.org/W1578985305","https://openalex.org/W1582347098","https://openalex.org/W1938864827","https://openalex.org/W2016053056","https://openalex.org/W2097117768","https://openalex.org/W2100115174","https://openalex.org/W2126579184","https://openalex.org/W2156303437","https://openalex.org/W2163605009","https://openalex.org/W2168137677","https://openalex.org/W2194775991","https://openalex.org/W2279098554","https://openalex.org/W2308045930","https://openalex.org/W2342662179","https://openalex.org/W2412782625","https://openalex.org/W2507009361","https://openalex.org/W2531409750","https://openalex.org/W2549139847","https://openalex.org/W2553594924","https://openalex.org/W2553902701","https://openalex.org/W2583938035","https://openalex.org/W2592929672","https://openalex.org/W2612445135","https://openalex.org/W2613718673","https://openalex.org/W2625366777","https://openalex.org/W2736596806","https://openalex.org/W2745519816","https://openalex.org/W2746726611","https://openalex.org/W2752782242","https://openalex.org/W2770804203","https://openalex.org/W2798472916","https://openalex.org/W2798535712","https://openalex.org/W2799146007","https://openalex.org/W2799176631","https://openalex.org/W2809562466","https://openalex.org/W2883429621","https://openalex.org/W2883534172","https://openalex.org/W2883780447","https://openalex.org/W2884797191","https://openalex.org/W2893150766","https://openalex.org/W2895243423","https://openalex.org/W2904072229","https://openalex.org/W2910603373","https://openalex.org/W2930709109","https://openalex.org/W2962684187","https://openalex.org/W2962934715","https://openalex.org/W2962980542","https://openalex.org/W2963087201","https://openalex.org/W2963091558","https://openalex.org/W2963125010","https://openalex.org/W2963155035","https://openalex.org/W2963163009","https://openalex.org/W2963326767","https://openalex.org/W2963420686","https://openalex.org/W2963457877","https://openalex.org/W2963524571","https://openalex.org/W2963616706","https://openalex.org/W2963645879","https://openalex.org/W2963743626","https://openalex.org/W2963820951","https://openalex.org/W2964094092","https://openalex.org/W2964191259","https://openalex.org/W2964452879","https://openalex.org/W2981385151","https://openalex.org/W2981548405","https://openalex.org/W2984287396","https://openalex.org/W2988396473","https://openalex.org/W2988630963","https://openalex.org/W2990152177","https://openalex.org/W2990503944","https://openalex.org/W3009812836","https://openalex.org/W3016221831","https://openalex.org/W3034572008","https://openalex.org/W4246193833","https://openalex.org/W6600983433","https://openalex.org/W6682864246","https://openalex.org/W6685802191","https://openalex.org/W6695314431","https://openalex.org/W6737664043","https://openalex.org/W6742667445","https://openalex.org/W6753955284","https://openalex.org/W6756539395","https://openalex.org/W6955071965"],"related_works":["https://openalex.org/W3159557112","https://openalex.org/W2971742398","https://openalex.org/W2930709109","https://openalex.org/W3004500412","https://openalex.org/W2755843045","https://openalex.org/W3010074710","https://openalex.org/W3128140182","https://openalex.org/W2964590182","https://openalex.org/W2748434587","https://openalex.org/W3030420691","https://openalex.org/W3164049065","https://openalex.org/W2788945907","https://openalex.org/W2907719996","https://openalex.org/W3041169370","https://openalex.org/W2937887488","https://openalex.org/W2883723049","https://openalex.org/W2527636115","https://openalex.org/W2897077592","https://openalex.org/W2516608830","https://openalex.org/W2963828468"],"abstract_inverted_index":{"Conventional":[0],"3D":[1,54,61,109,146,178],"convolutional":[2,44,55,147],"neural":[3],"networks":[4],"(CNNs)":[5],"are":[6,140],"computationally":[7],"expensive,":[8],"memory":[9],"intensive,":[10],"prone":[11],"to":[12,21,52,116,123,131,188],"overfitting,":[13],"and":[14,57,121,149,163,170],"most":[15],"importantly,":[16],"there":[17],"is":[18],"a":[19,40,80,90],"need":[20],"improve":[22],"their":[23,136],"feature":[24,137],"learning":[25,97,138],"capabilities.":[26],"To":[27],"address":[28],"these":[29],"issues,":[30],"we":[31],"propose":[32],"spatio-temporal":[33],"short":[34],"term":[35],"Fourier":[36,77],"transform":[37],"(STFT)":[38],"blocks,":[39],"new":[41],"class":[42],"of":[43,67,92],"blocks":[45,102,176],"that":[46,71,174],"can":[47],"serve":[48],"as":[49],"an":[50],"alternative":[51],"the":[53,105,132,144,189],"layer":[56,148],"its":[58,150],"variants":[59],"in":[60,108],"CNNs.":[62,110],"An":[63],"STFT":[64,81,101,175],"block":[65],"consists":[66],"non-trainable":[68],"convolution":[69],"layers":[70],"capture":[72],"spatially":[73],"and/or":[74],"temporally":[75],"local":[76],"information":[78],"using":[79],"kernel":[82],"at":[83],"multiple":[84],"low":[85],"frequency":[86],"points,":[87],"followed":[88],"by":[89],"set":[91],"trainable":[93],"linear":[94],"weights":[95],"for":[96],"channel":[98],"correlations.":[99],"The":[100],"significantly":[103,141],"reduce":[104],"space-time":[106],"complexity":[107],"In":[111],"general,":[112],"they":[113],"use":[114],"3.5":[115],"4.5":[117],"times":[118,125],"less":[119,126],"parameters":[120],"1.5":[122],"1.8":[124],"computational":[127],"costs":[128],"when":[129],"compared":[130,187],"state-of-the-art":[133,190],"methods.":[134,191],"Furthermore,":[135],"capabilities":[139],"better":[142,185],"than":[143],"conventional":[145],"variants.":[151],"Our":[152],"extensive":[153],"evaluation":[154],"on":[155,181],"seven":[156],"action":[157],"recognition":[158],"datasets,":[159],"including":[160],"Something-something":[161],"v1":[162],"v2,":[164],"Jester,":[165],"Diving-48,":[166],"Kinetics-400,":[167],"UCF":[168],"101,":[169],"HMDB":[171],"51,":[172],"demonstrate":[173],"based":[177],"CNNs":[179],"achieve":[180],"par":[182],"or":[183],"even":[184],"performance":[186]},"counts_by_year":[{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
