{"id":"https://openalex.org/W3133237556","doi":"https://doi.org/10.3233/jifs-189714","title":"Multi-scale spatialtemporal information deep fusion network with temporal pyramid mechanism for video action recognition","display_name":"Multi-scale spatialtemporal information deep fusion network with temporal pyramid mechanism for video action recognition","publication_year":2021,"publication_date":"2021-02-16","ids":{"openalex":"https://openalex.org/W3133237556","doi":"https://doi.org/10.3233/jifs-189714","mag":"3133237556"},"language":"en","primary_location":{"id":"doi:10.3233/jifs-189714","is_oa":false,"landing_page_url":"https://doi.org/10.3233/jifs-189714","pdf_url":null,"source":{"id":"https://openalex.org/S179157397","display_name":"Journal of Intelligent & Fuzzy Systems","issn_l":"1064-1246","issn":["1064-1246","1875-8967"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310318577","host_organization_name":"IOS Press","host_organization_lineage":["https://openalex.org/P4310318577"],"host_organization_lineage_names":["IOS Press"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Intelligent &amp; Fuzzy Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5030920466","display_name":"Hongshi Ou","orcid":"https://orcid.org/0000-0002-7669-5959"},"institutions":[{"id":"https://openalex.org/I90610280","display_name":"South China University of Technology","ror":"https://ror.org/0530pts50","country_code":"CN","type":"education","lineage":["https://openalex.org/I90610280"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Hongshi Ou","raw_affiliation_strings":["South China University of Technology, School of Electronic and Information Engineering, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"South China University of Technology, School of Electronic and Information Engineering, Guangzhou, China","institution_ids":["https://openalex.org/I90610280"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100327194","display_name":"Jifeng Sun","orcid":"https://orcid.org/0000-0002-0201-8226"},"institutions":[{"id":"https://openalex.org/I90610280","display_name":"South China University of Technology","ror":"https://ror.org/0530pts50","country_code":"CN","type":"education","lineage":["https://openalex.org/I90610280"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jifeng Sun","raw_affiliation_strings":["South China University of Technology, School of Electronic and Information Engineering, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"South China University of Technology, School of Electronic and Information Engineering, Guangzhou, China","institution_ids":["https://openalex.org/I90610280"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5030920466"],"corresponding_institution_ids":["https://openalex.org/I90610280"],"apc_list":null,"apc_paid":null,"fwci":0.3843,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.58694444,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":"41","issue":"3","first_page":"4533","last_page":"4545"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9943000078201294,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8037418127059937},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6704146265983582},{"id":"https://openalex.org/keywords/spatial-analysis","display_name":"Spatial analysis","score":0.6224028468132019},{"id":"https://openalex.org/keywords/spatial-contextual-awareness","display_name":"Spatial contextual awareness","score":0.5916709303855896},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.5753620266914368},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5527545213699341},{"id":"https://openalex.org/keywords/pyramid","display_name":"Pyramid (geometry)","score":0.547377347946167},{"id":"https://openalex.org/keywords/recurrent-neural-network","display_name":"Recurrent neural network","score":0.49165016412734985},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.45711469650268555},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.4513850808143616},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.35642915964126587},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.3308424651622772},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.0816778838634491},{"id":"https://openalex.org/keywords/remote-sensing","display_name":"Remote sensing","score":0.07721620798110962}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8037418127059937},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6704146265983582},{"id":"https://openalex.org/C159620131","wikidata":"https://www.wikidata.org/wiki/Q1938983","display_name":"Spatial analysis","level":2,"score":0.6224028468132019},{"id":"https://openalex.org/C64754055","wikidata":"https://www.wikidata.org/wiki/Q7574053","display_name":"Spatial contextual awareness","level":2,"score":0.5916709303855896},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.5753620266914368},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5527545213699341},{"id":"https://openalex.org/C142575187","wikidata":"https://www.wikidata.org/wiki/Q3358290","display_name":"Pyramid (geometry)","level":2,"score":0.547377347946167},{"id":"https://openalex.org/C147168706","wikidata":"https://www.wikidata.org/wiki/Q1457734","display_name":"Recurrent neural network","level":3,"score":0.49165016412734985},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.45711469650268555},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.4513850808143616},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.35642915964126587},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.3308424651622772},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0816778838634491},{"id":"https://openalex.org/C62649853","wikidata":"https://www.wikidata.org/wiki/Q199687","display_name":"Remote sensing","level":1,"score":0.07721620798110962},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.3233/jifs-189714","is_oa":false,"landing_page_url":"https://doi.org/10.3233/jifs-189714","pdf_url":null,"source":{"id":"https://openalex.org/S179157397","display_name":"Journal of Intelligent & Fuzzy Systems","issn_l":"1064-1246","issn":["1064-1246","1875-8967"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310318577","host_organization_name":"IOS Press","host_organization_lineage":["https://openalex.org/P4310318577"],"host_organization_lineage_names":["IOS Press"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Intelligent &amp; Fuzzy Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":17,"referenced_works":["https://openalex.org/W147001025","https://openalex.org/W1522734439","https://openalex.org/W1797109199","https://openalex.org/W1947481528","https://openalex.org/W2016053056","https://openalex.org/W2049209908","https://openalex.org/W2142194269","https://openalex.org/W2341234201","https://openalex.org/W2342662179","https://openalex.org/W2345314779","https://openalex.org/W2466991859","https://openalex.org/W2490266937","https://openalex.org/W2558383949","https://openalex.org/W2613635555","https://openalex.org/W2962852931","https://openalex.org/W2964191259","https://openalex.org/W6680835844"],"related_works":["https://openalex.org/W3148227991","https://openalex.org/W1486593826","https://openalex.org/W2771174107","https://openalex.org/W1536965844","https://openalex.org/W2344941099","https://openalex.org/W4322212724","https://openalex.org/W2106788855","https://openalex.org/W3081561710","https://openalex.org/W2477413883","https://openalex.org/W2463773089"],"abstract_inverted_index":{"In":[0],"the":[1,7,10,21,25,86,96,105,119,137,147,151,154,159,168,171,183,200],"deep":[2,49,186],"learning-based":[3],"video":[4,43,162,173,203],"action":[5,174,204],"recognitio,":[6],"function":[8],"of":[9,24,29,51,85,100,108,123,140,153,202],"neural":[11],"network":[12,41,56,131,160,188],"is":[13,132],"to":[14,73,94,117,134,145],"acquire":[15,146],"spatial":[16,75],"information,":[17,19],"motion":[18,78,83],"and":[20,63,77,82],"associated":[22],"information":[23,30,46,76,81,84,99,107,122,139,149,164,185],"above":[26],"two":[27],"kinds":[28],"over":[31],"an":[32],"uneven":[33],"time":[34,88,125],"span.":[35],"This":[36],"paper":[37,192],"puts":[38],"forward":[39],"a":[40,101,194],"extracting":[42],"sequence":[44],"semantic":[45],"based":[47],"on":[48,136,170],"integration":[50,93],"local":[52,120],"Spatial-Temporal":[53,65,98,106,121,138,184],"information.":[54,79],"The":[55],"uses":[57],"2D":[58],"Convolutional":[59,68],"Neural":[60,69],"Network":[61,70],"(2DCNN)":[62],"Multi":[64],"scale":[66],"3D":[67,91],"(MST_3DCNN)":[71],"respectively":[72],"extract":[74],"Spatial":[80],"same":[87],"quantum":[89],"receive":[90],"convolutional":[92],"generate":[95,118],"temporary":[97],"certain":[102],"moment.":[103],"Then,":[104],"multiple":[109,124],"single":[110],"moments":[111],"enters":[112],"Temporal":[113],"Pyramid":[114],"Net":[115],"(TPN)":[116],"scales.":[126],"Finally,":[127],"bidirectional":[128],"recurrent":[129],"neutral":[130],"used":[133],"act":[135],"all":[141],"parts":[142],"so":[143],"as":[144],"context":[148,163],"spanning":[150],"length":[152],"entire":[155],"video,":[156],"which":[157],"endows":[158],"with":[161],"extraction":[165],"capability.":[166],"Through":[167],"experiments":[169],"three":[172],"recognitio":[175],"common":[176],"experimental":[177],"data":[178],"sets":[179],"UCF101,":[180],"UCF11,":[181],"UCFSports,":[182],"fusion":[187],"proposed":[189],"in":[190,199],"this":[191],"has":[193],"high":[195],"correct":[196],"recognition":[197],"rate":[198],"task":[201],"recognitio.":[205]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
