{"id":"https://openalex.org/W2943070176","doi":"https://doi.org/10.1109/tcsvt.2018.2830102","title":"Semantic Cues Enhanced Multimodality Multistream CNN for Action Recognition","display_name":"Semantic Cues Enhanced Multimodality Multistream CNN for Action Recognition","publication_year":2018,"publication_date":"2018-04-25","ids":{"openalex":"https://openalex.org/W2943070176","doi":"https://doi.org/10.1109/tcsvt.2018.2830102","mag":"2943070176"},"language":"en","primary_location":{"id":"doi:10.1109/tcsvt.2018.2830102","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2018.2830102","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5074405661","display_name":"Zhigang Tu","orcid":"https://orcid.org/0000-0001-5003-2260"},"institutions":[{"id":"https://openalex.org/I4210118728","display_name":"State Key Laboratory of Information Engineering in Surveying Mapping and Remote Sensing","ror":"https://ror.org/02bpap860","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210118728"]},{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhigang Tu","raw_affiliation_strings":["State Key Laboratory of Information Engineering in Surveying, Mapping and Remote Sensing, Wuhan University, Wuhan, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Information Engineering in Surveying, Mapping and Remote Sensing, Wuhan University, Wuhan, China","institution_ids":["https://openalex.org/I4210118728","https://openalex.org/I37461747"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100678496","display_name":"Wei Xie","orcid":"https://orcid.org/0000-0002-7840-5652"},"institutions":[{"id":"https://openalex.org/I40963666","display_name":"Central China Normal University","ror":"https://ror.org/03x1jna21","country_code":"CN","type":"education","lineage":["https://openalex.org/I40963666"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Xie","raw_affiliation_strings":["School of Computer, Central China Normal University, Wuhan, China"],"affiliations":[{"raw_affiliation_string":"School of Computer, Central China Normal University, Wuhan, China","institution_ids":["https://openalex.org/I40963666"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082613025","display_name":"Justin Dauwels","orcid":"https://orcid.org/0000-0002-4390-1568"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Justin Dauwels","raw_affiliation_strings":["School of Electrical and Electronic Engineering, Nanyang Technological University, Singapore"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Electronic Engineering, Nanyang Technological University, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032615847","display_name":"Baoxin Li","orcid":"https://orcid.org/0000-0002-9294-4572"},"institutions":[{"id":"https://openalex.org/I55732556","display_name":"Arizona State University","ror":"https://ror.org/03efmqc40","country_code":"US","type":"education","lineage":["https://openalex.org/I55732556"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Baoxin Li","raw_affiliation_strings":["School of Computing, Informatics, Decision System Engineering, Arizona State University, Tempe, AZ, USA"],"affiliations":[{"raw_affiliation_string":"School of Computing, Informatics, Decision System Engineering, Arizona State University, Tempe, AZ, USA","institution_ids":["https://openalex.org/I55732556"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5085245110","display_name":"Junsong Yuan","orcid":"https://orcid.org/0000-0002-7901-8793"},"institutions":[{"id":"https://openalex.org/I63190737","display_name":"University at Buffalo, State University of New York","ror":"https://ror.org/01y64my43","country_code":"US","type":"education","lineage":["https://openalex.org/I63190737"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Junsong Yuan","raw_affiliation_strings":["Computer Science and Engineering Department, State University of New York at Buffalo, Buffalo, NY, USA"],"affiliations":[{"raw_affiliation_string":"Computer Science and Engineering Department, State University of New York at Buffalo, Buffalo, NY, USA","institution_ids":["https://openalex.org/I63190737"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5074405661"],"corresponding_institution_ids":["https://openalex.org/I37461747","https://openalex.org/I4210118728"],"apc_list":null,"apc_paid":null,"fwci":5.099,"has_fulltext":false,"cited_by_count":117,"citation_normalized_percentile":{"value":0.96703947,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":100},"biblio":{"volume":"29","issue":"5","first_page":"1423","last_page":"1437"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9972000122070312,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8729588985443115},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.7115522623062134},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.6886913180351257},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6762971878051758},{"id":"https://openalex.org/keywords/action-recognition","display_name":"Action recognition","score":0.567982017993927},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.5298043489456177},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.5099998712539673},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5046275854110718},{"id":"https://openalex.org/keywords/cognitive-neuroscience-of-visual-object-recognition","display_name":"Cognitive neuroscience of visual object recognition","score":0.4839966297149658},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.42958149313926697},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.37188684940338135},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.07899010181427002}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8729588985443115},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.7115522623062134},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.6886913180351257},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6762971878051758},{"id":"https://openalex.org/C2987834672","wikidata":"https://www.wikidata.org/wiki/Q4677630","display_name":"Action recognition","level":3,"score":0.567982017993927},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.5298043489456177},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.5099998712539673},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5046275854110718},{"id":"https://openalex.org/C64876066","wikidata":"https://www.wikidata.org/wiki/Q5141226","display_name":"Cognitive neuroscience of visual object recognition","level":3,"score":0.4839966297149658},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.42958149313926697},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.37188684940338135},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.07899010181427002},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tcsvt.2018.2830102","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2018.2830102","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"},{"id":"pmh:oai:dr.ntu.edu.sg:10356/142212","is_oa":false,"landing_page_url":"https://hdl.handle.net/10356/142212","pdf_url":null,"source":{"id":"https://openalex.org/S4306402609","display_name":"DR-NTU (Nanyang Technological University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I172675005","host_organization_name":"Nanyang Technological University","host_organization_lineage":["https://openalex.org/I172675005"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Journal Article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Affordable and clean energy","score":0.5299999713897705,"id":"https://metadata.un.org/sdg/7"}],"awards":[{"id":"https://openalex.org/G474122932","display_name":null,"funder_award_id":"2014CFB461","funder_id":"https://openalex.org/F4320322186","funder_display_name":"Natural Science Foundation of Hubei Province"},{"id":"https://openalex.org/G855221287","display_name":null,"funder_award_id":"61501198","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320322186","display_name":"Natural Science Foundation of Hubei Province","ror":null},{"id":"https://openalex.org/F4320332641","display_name":"University at Buffalo","ror":"https://ror.org/01y64my43"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":89,"referenced_works":["https://openalex.org/W24089286","https://openalex.org/W181493107","https://openalex.org/W639708223","https://openalex.org/W1522734439","https://openalex.org/W1686810756","https://openalex.org/W1744759976","https://openalex.org/W1836465849","https://openalex.org/W1871385855","https://openalex.org/W1909538523","https://openalex.org/W1920196880","https://openalex.org/W1923332106","https://openalex.org/W1932624639","https://openalex.org/W1944615693","https://openalex.org/W1954128991","https://openalex.org/W1965301399","https://openalex.org/W1982075130","https://openalex.org/W2010181071","https://openalex.org/W2012592962","https://openalex.org/W2016053056","https://openalex.org/W2034014085","https://openalex.org/W2047670868","https://openalex.org/W2050398567","https://openalex.org/W2052530028","https://openalex.org/W2062563118","https://openalex.org/W2064675550","https://openalex.org/W2073280062","https://openalex.org/W2079241389","https://openalex.org/W2087461551","https://openalex.org/W2088049833","https://openalex.org/W2097117768","https://openalex.org/W2101194540","https://openalex.org/W2102605133","https://openalex.org/W2105101328","https://openalex.org/W2113708607","https://openalex.org/W2118246710","https://openalex.org/W2118490033","https://openalex.org/W2122076510","https://openalex.org/W2126579184","https://openalex.org/W2133059825","https://openalex.org/W2138682569","https://openalex.org/W2156303437","https://openalex.org/W2163588226","https://openalex.org/W2163605009","https://openalex.org/W2163665255","https://openalex.org/W2193384753","https://openalex.org/W2194775991","https://openalex.org/W2212903133","https://openalex.org/W2214352687","https://openalex.org/W2235034809","https://openalex.org/W2295598507","https://openalex.org/W2308045930","https://openalex.org/W2342662179","https://openalex.org/W2417131217","https://openalex.org/W2460260369","https://openalex.org/W2461621749","https://openalex.org/W2507009361","https://openalex.org/W2519080876","https://openalex.org/W2526449353","https://openalex.org/W2526479943","https://openalex.org/W2534890794","https://openalex.org/W2553594924","https://openalex.org/W2560474170","https://openalex.org/W2563717578","https://openalex.org/W2608229591","https://openalex.org/W2608988379","https://openalex.org/W2613635555","https://openalex.org/W2739980858","https://openalex.org/W2962835968","https://openalex.org/W2963173190","https://openalex.org/W2963524571","https://openalex.org/W2963753350","https://openalex.org/W2964072322","https://openalex.org/W2964222622","https://openalex.org/W6600983433","https://openalex.org/W6607209805","https://openalex.org/W6620707391","https://openalex.org/W6637373629","https://openalex.org/W6638667902","https://openalex.org/W6640153615","https://openalex.org/W6682864246","https://openalex.org/W6684191040","https://openalex.org/W6689710714","https://openalex.org/W6697075695","https://openalex.org/W6724944384","https://openalex.org/W6727074247","https://openalex.org/W6727508588","https://openalex.org/W6729814214","https://openalex.org/W6736855692","https://openalex.org/W6737535144"],"related_works":["https://openalex.org/W4321487865","https://openalex.org/W4313906399","https://openalex.org/W4239306820","https://openalex.org/W4391266461","https://openalex.org/W2590798552","https://openalex.org/W2811106690","https://openalex.org/W2947043951","https://openalex.org/W4399188509","https://openalex.org/W2318112981","https://openalex.org/W2507540959"],"abstract_inverted_index":{"This":[0],"paper":[1],"addresses":[2],"the":[3,33,36,50,109,118,132,140,145,148,165,183,193,210,214],"issue":[4],"of":[5,35,56,91,139,147,159,177,185],"video-based":[6],"action":[7,38,186],"recognition":[8,39,187],"by":[9],"exploiting":[10],"an":[11,122],"advanced":[12],"multistream":[13,155],"convolutional":[14],"neural":[15],"network":[16,51,150,156],"(CNN)":[17],"to":[18,43,61,88,127,152,164,171],"fully":[19],"use":[20,172],"semantics-derived":[21],"multiple":[22],"modalities":[23],"in":[24,108,179],"both":[25],"spatial":[26],"(appearance)":[27],"and":[28,49,134,207],"temporal":[29],"(motion)":[30],"domains,":[31],"since":[32],"performance":[34,184],"CNN-based":[37],"methods":[40],"heavily":[41],"relates":[42],"two":[44,57,129],"factors:":[45],"semantic":[46,130],"visual":[47,175],"cues":[48],"architecture.":[52],"Our":[53],"work":[54],"consists":[55,158],"major":[58],"parts.":[59],"First,":[60],"extract":[62],"useful":[63],"human-related":[64,195],"semantics":[65,196],"accurately,":[66],"we":[67,143],"propose":[68],"a":[69,96,154],"novel":[70],"spatiotemporal":[71],"saliency-based":[72],"video":[73,111],"object":[74,89,93],"segmentation":[75],"(STS)":[76],"model.":[77],"By":[78],"fusing":[79],"different":[80],"distinctive":[81,136],"saliency":[82,120],"maps,":[83,121],"which":[84,168],"are":[85],"computed":[86],"according":[87],"signatures":[90],"complementary":[92],"detection":[94],"approaches,":[95],"refined":[97],"STS":[98],"maps":[99],"can":[100,112],"be":[101,113],"obtained.":[102],"In":[103],"this":[104],"way,":[105],"various":[106],"challenges":[107],"realistic":[110],"handled":[114],"jointly.":[115],"Based":[116],"on":[117,201],"estimated":[119],"energy":[123],"function":[124],"is":[125,169,188],"constructed":[126],"segment":[128],"cues:":[131],"actor":[133],"one":[135],"acting":[137],"part":[138],"actor.":[141],"Second,":[142],"modify":[144],"architecture":[146],"two-stream":[149],"(TS-Net)":[151],"design":[153],"that":[157,209],"three":[160],"TS-Nets":[161],"with":[162],"respect":[163],"extracted":[166],"semantics,":[167],"able":[170],"deeper":[173],"abstract":[174],"features":[176],"multimodalities":[178],"multi-scale":[180],"spatiotemporally.":[181],"Importantly,":[182],"significantly":[189],"boosted":[190],"when":[191],"integrating":[192],"captured":[194],"into":[197],"our":[198],"framework.":[199],"Experiments":[200],"four":[202],"public":[203],"benchmarks-JHMDB,":[204],"HMDB51,":[205],"UCF-Sports,":[206],"UCF101-demonstrate":[208],"proposed":[211],"method":[212],"outperforms":[213],"state-of-the-art":[215],"algorithms.":[216]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":5},{"year":2024,"cited_by_count":16},{"year":2023,"cited_by_count":24},{"year":2022,"cited_by_count":23},{"year":2021,"cited_by_count":24},{"year":2020,"cited_by_count":11},{"year":2019,"cited_by_count":9},{"year":2018,"cited_by_count":4}],"updated_date":"2026-03-18T14:38:29.013473","created_date":"2025-10-10T00:00:00"}
