{"id":"https://openalex.org/W4200426370","doi":"https://doi.org/10.1109/cisp-bmei53629.2021.9624415","title":"Skimming and Scanning for Efficient Action Recognition in Untrimmed Videos","display_name":"Skimming and Scanning for Efficient Action Recognition in Untrimmed Videos","publication_year":2021,"publication_date":"2021-10-23","ids":{"openalex":"https://openalex.org/W4200426370","doi":"https://doi.org/10.1109/cisp-bmei53629.2021.9624415"},"language":"en","primary_location":{"id":"doi:10.1109/cisp-bmei53629.2021.9624415","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cisp-bmei53629.2021.9624415","pdf_url":null,"source":{"id":"https://openalex.org/S4363605805","display_name":"2021 14th International Congress on Image and Signal Processing, BioMedical Engineering and Informatics (CISP-BMEI)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 14th International Congress on Image and Signal Processing, BioMedical Engineering and Informatics (CISP-BMEI)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Yunyan Hong","orcid":null},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yunyan Hong","raw_affiliation_strings":["Shanghai Jiao Tong University"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075207922","display_name":"Ailing Zeng","orcid":"https://orcid.org/0000-0002-3783-0679"},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"HK","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Ailing Zeng","raw_affiliation_strings":["The Chinese University of Hong Kong"],"affiliations":[{"raw_affiliation_string":"The Chinese University of Hong Kong","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100719011","display_name":"Min Li","orcid":"https://orcid.org/0000-0001-8140-934X"},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"HK","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Min Li","raw_affiliation_strings":["The Chinese University of Hong Kong"],"affiliations":[{"raw_affiliation_string":"The Chinese University of Hong Kong","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010726528","display_name":"Cewu Lu","orcid":"https://orcid.org/0000-0002-4023-9257"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Cewu Lu","raw_affiliation_strings":["Shanghai Jiao Tong University"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100392353","display_name":"Li Jiang","orcid":"https://orcid.org/0000-0001-7058-6957"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Li Jiang","raw_affiliation_strings":["Shanghai Jiao Tong University"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5088556682","display_name":"Qiang Xu","orcid":"https://orcid.org/0000-0001-6747-126X"},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"HK","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Qiang Xu","raw_affiliation_strings":["The Chinese University of Hong Kong"],"affiliations":[{"raw_affiliation_string":"The Chinese University of Hong Kong","institution_ids":["https://openalex.org/I177725633"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I183067930"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.14340974,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"32","issue":null,"first_page":"1","last_page":"10"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.991100013256073,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9868000149726868,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/clips","display_name":"CLIPS","score":0.9127129912376404},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.793116569519043},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5333212614059448},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.5251088738441467},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.5060068964958191},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5012693405151367},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.38519465923309326},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3203555941581726}],"concepts":[{"id":"https://openalex.org/C2778739407","wikidata":"https://www.wikidata.org/wiki/Q165372","display_name":"CLIPS","level":2,"score":0.9127129912376404},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.793116569519043},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5333212614059448},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.5251088738441467},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.5060068964958191},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5012693405151367},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.38519465923309326},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3203555941581726},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cisp-bmei53629.2021.9624415","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cisp-bmei53629.2021.9624415","pdf_url":null,"source":{"id":"https://openalex.org/S4363605805","display_name":"2021 14th International Congress on Image and Signal Processing, BioMedical Engineering and Informatics (CISP-BMEI)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 14th International Congress on Image and Signal Processing, BioMedical Engineering and Informatics (CISP-BMEI)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":42,"referenced_works":["https://openalex.org/W1522734439","https://openalex.org/W1777628566","https://openalex.org/W1821462560","https://openalex.org/W1927052826","https://openalex.org/W1965555277","https://openalex.org/W1983364832","https://openalex.org/W2016053056","https://openalex.org/W2037497826","https://openalex.org/W2151388695","https://openalex.org/W2194775991","https://openalex.org/W2550143307","https://openalex.org/W2619947201","https://openalex.org/W2788945907","https://openalex.org/W2799176631","https://openalex.org/W2807968599","https://openalex.org/W2955425717","https://openalex.org/W2962934715","https://openalex.org/W2963155035","https://openalex.org/W2963526497","https://openalex.org/W2963616706","https://openalex.org/W2963820951","https://openalex.org/W2978725006","https://openalex.org/W2981548405","https://openalex.org/W2984287396","https://openalex.org/W2990503944","https://openalex.org/W2992059788","https://openalex.org/W3004505825","https://openalex.org/W3010010212","https://openalex.org/W3015793166","https://openalex.org/W3034658206","https://openalex.org/W3037046522","https://openalex.org/W3082925502","https://openalex.org/W3103366418","https://openalex.org/W3107849462","https://openalex.org/W6638523607","https://openalex.org/W6687483927","https://openalex.org/W6743149407","https://openalex.org/W6748831540","https://openalex.org/W6762718338","https://openalex.org/W6767318615","https://openalex.org/W6776290648","https://openalex.org/W6955071965"],"related_works":["https://openalex.org/W2417253731","https://openalex.org/W2350469024","https://openalex.org/W2395860100","https://openalex.org/W2036154621","https://openalex.org/W795077857","https://openalex.org/W2074513378","https://openalex.org/W2376416463","https://openalex.org/W2007338512","https://openalex.org/W2057384895","https://openalex.org/W2360858150"],"abstract_inverted_index":{"Video":[0],"action":[1],"recognition":[2],"(VAR)":[3],"aims":[4],"to":[5,60,65,78,106,173,191,200,223],"classify":[6],"videos":[7,30,36,41,88],"into":[8],"a":[9,16,62,90,135],"predefined":[10],"set":[11],"of":[12,19,28,100,110,194,221,252],"classes,":[13],"which":[14],"is":[15,54,76,103],"primary":[17],"task":[18],"video":[20,154],"understanding.":[21],"We":[22],"mainly":[23],"focus":[24],"on":[25,142,235],"the":[26,52,67,80,98,129,146,152,163,187,192,195,207,219,226,247],"VAR":[27],"untrimmed":[29,125],"because":[31],"they":[32],"are":[33,233],"most":[34,71],"common":[35],"in":[37,124,250],"real-life":[38],"scenes.":[39],"Untrimmed":[40],"have":[42],"redundant":[43,175],"and":[44,86,93,97,117,155,159,213,229,237,240,254],"diverse":[45,170],"clips":[46,53,85,168,176,189],"containing":[47],"contextual":[48],"information,":[49],"so":[50],"sampling":[51],"essential.":[55],"Recently,":[56],"some":[57],"works":[58],"attempt":[59],"train":[61],"generic":[63],"model":[64,79,92],"select":[66,186],"<tex":[68],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[69],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$N$</tex>":[70],"representative":[72],"clips.":[73,161],"However,":[74],"it":[75,166],"difficult":[77],"complex":[81],"relations":[82,102],"from":[83],"intra-class":[84],"inter-class":[87],"within":[89],"single":[91],"fixed":[94],"selected":[95],"number,":[96],"entanglement":[99],"multiple":[101],"also":[104],"hard":[105],"explain.":[107],"Thus,":[108,216],"instead":[109],"\u201conly":[111],"look":[112],"once\u201d,":[113],"we":[114,133,205,217],"argue":[115],"\u201cdivide":[116],"conquer\u201d":[118],"strategy":[119],"will":[120],"be":[121],"more":[122],"suitable":[123],"VAR.":[126],"Inspired":[127],"by":[128],"speed":[130],"reading":[131],"mechanism,":[132],"propose":[134],"simple":[136],"yet":[137],"effective":[138],"clip-level":[139],"solution":[140,245],"based":[141],"skim-scan":[143],"techniques.":[144],"Specifically,":[145],"proposed":[147],"Skim-Scan":[148],"framework":[149],"first":[150],"skims":[151],"entire":[153],"drops":[156],"those":[157],"uninformative":[158],"misleading":[160],"For":[162],"remaining":[164],"clips,":[165],"scans":[167],"with":[169],"features":[171],"gradually":[172],"drop":[174],"but":[177],"cover":[178],"essential":[179],"content.":[180],"The":[181],"above":[182],"strategies":[183],"can":[184],"adaptively":[185],"necessary":[188],"according":[190],"difficulty":[193],"different":[196],"videos.":[197],"In":[198],"order":[199],"further":[201],"cut":[202],"computational":[203,227],"overhead,":[204],"observe":[206],"similar":[208],"statistical":[209],"expression":[210],"between":[211],"lightweight":[212],"heavy":[214],"networks.":[215],"explore":[218],"combination":[220],"them":[222],"trade":[224],"off":[225],"complexity":[228],"performance.":[230],"Comprehensive":[231],"experiments":[232],"performed":[234],"ActivityNet":[236],"mini-FCVID":[238],"datasets,":[239],"results":[241],"demonstrate":[242],"that":[243],"our":[244],"surpasses":[246],"state-of-the-art":[248],"performance":[249],"terms":[251],"accuracy":[253],"efficiency.":[255]},"counts_by_year":[],"updated_date":"2026-04-17T18:11:37.981687","created_date":"2025-10-10T00:00:00"}
