{"id":"https://openalex.org/W3207340843","doi":"https://doi.org/10.1145/3474085.3475344","title":"DSANet: Dynamic Segment Aggregation Network for Video-Level Representation Learning","display_name":"DSANet: Dynamic Segment Aggregation Network for Video-Level Representation Learning","publication_year":2021,"publication_date":"2021-10-17","ids":{"openalex":"https://openalex.org/W3207340843","doi":"https://doi.org/10.1145/3474085.3475344","mag":"3207340843"},"language":"en","primary_location":{"id":"doi:10.1145/3474085.3475344","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3474085.3475344","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 29th ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5015819673","display_name":"Wenhao Wu","orcid":"https://orcid.org/0000-0002-8511-743X"},"institutions":[{"id":"https://openalex.org/I98301712","display_name":"Baidu (China)","ror":"https://ror.org/03vs3wt56","country_code":"CN","type":"company","lineage":["https://openalex.org/I98301712"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Wenhao Wu","raw_affiliation_strings":["Baidu Inc., Beijing, China"],"affiliations":[{"raw_affiliation_string":"Baidu Inc., Beijing, China","institution_ids":["https://openalex.org/I98301712"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101633987","display_name":"Yu\u2010Xiang Zhao","orcid":"https://orcid.org/0009-0004-3102-0730"},"institutions":[{"id":"https://openalex.org/I98301712","display_name":"Baidu (China)","ror":"https://ror.org/03vs3wt56","country_code":"CN","type":"company","lineage":["https://openalex.org/I98301712"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuxiang Zhao","raw_affiliation_strings":["Baidu Inc. &amp; Shenzhen Institute of Advanced Technology, CAS, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Baidu Inc. &amp; Shenzhen Institute of Advanced Technology, CAS, Beijing, China","institution_ids":["https://openalex.org/I98301712"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010906829","display_name":"Yanwu Xu","orcid":"https://orcid.org/0000-0002-1779-931X"},"institutions":[{"id":"https://openalex.org/I170201317","display_name":"University of Pittsburgh","ror":"https://ror.org/01an3r305","country_code":"US","type":"education","lineage":["https://openalex.org/I170201317"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yanwu Xu","raw_affiliation_strings":["University of Pittsburgh, Pittsburgh, PA, USA"],"affiliations":[{"raw_affiliation_string":"University of Pittsburgh, Pittsburgh, PA, USA","institution_ids":["https://openalex.org/I170201317"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001865165","display_name":"Xiao Tan","orcid":"https://orcid.org/0000-0001-9162-8570"},"institutions":[{"id":"https://openalex.org/I98301712","display_name":"Baidu (China)","ror":"https://ror.org/03vs3wt56","country_code":"CN","type":"company","lineage":["https://openalex.org/I98301712"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiao Tan","raw_affiliation_strings":["Baidu Inc., Beijing, China"],"affiliations":[{"raw_affiliation_string":"Baidu Inc., Beijing, China","institution_ids":["https://openalex.org/I98301712"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018276259","display_name":"Dongliang He","orcid":"https://orcid.org/0000-0002-1129-8610"},"institutions":[{"id":"https://openalex.org/I98301712","display_name":"Baidu (China)","ror":"https://ror.org/03vs3wt56","country_code":"CN","type":"company","lineage":["https://openalex.org/I98301712"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dongliang He","raw_affiliation_strings":["Baidu Inc., Beijing, China"],"affiliations":[{"raw_affiliation_string":"Baidu Inc., Beijing, China","institution_ids":["https://openalex.org/I98301712"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023883607","display_name":"Zhikang Zou","orcid":"https://orcid.org/0000-0003-3524-2942"},"institutions":[{"id":"https://openalex.org/I98301712","display_name":"Baidu (China)","ror":"https://ror.org/03vs3wt56","country_code":"CN","type":"company","lineage":["https://openalex.org/I98301712"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhikang Zou","raw_affiliation_strings":["Baidu Inc., Beijing, China"],"affiliations":[{"raw_affiliation_string":"Baidu Inc., Beijing, China","institution_ids":["https://openalex.org/I98301712"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100447783","display_name":"Jin Ye","orcid":"https://orcid.org/0000-0002-5842-3968"},"institutions":[{"id":"https://openalex.org/I98301712","display_name":"Baidu (China)","ror":"https://ror.org/03vs3wt56","country_code":"CN","type":"company","lineage":["https://openalex.org/I98301712"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jin Ye","raw_affiliation_strings":["Baidu Inc., Beijing, China"],"affiliations":[{"raw_affiliation_string":"Baidu Inc., Beijing, China","institution_ids":["https://openalex.org/I98301712"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100444776","display_name":"Yingying Li","orcid":"https://orcid.org/0000-0002-3999-2647"},"institutions":[{"id":"https://openalex.org/I98301712","display_name":"Baidu (China)","ror":"https://ror.org/03vs3wt56","country_code":"CN","type":"company","lineage":["https://openalex.org/I98301712"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yingying Li","raw_affiliation_strings":["Baidu Inc., Beijing, China"],"affiliations":[{"raw_affiliation_string":"Baidu Inc., Beijing, China","institution_ids":["https://openalex.org/I98301712"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002617843","display_name":"Mingde Yao","orcid":"https://orcid.org/0000-0001-5994-6288"},"institutions":[{"id":"https://openalex.org/I98301712","display_name":"Baidu (China)","ror":"https://ror.org/03vs3wt56","country_code":"CN","type":"company","lineage":["https://openalex.org/I98301712"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mingde Yao","raw_affiliation_strings":["Baidu Inc, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Baidu Inc, Beijing, China","institution_ids":["https://openalex.org/I98301712"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049159057","display_name":"Zichao Dong","orcid":null},"institutions":[{"id":"https://openalex.org/I98301712","display_name":"Baidu (China)","ror":"https://ror.org/03vs3wt56","country_code":"CN","type":"company","lineage":["https://openalex.org/I98301712"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zichao Dong","raw_affiliation_strings":["Baidu, Inc., Beijing, China"],"affiliations":[{"raw_affiliation_string":"Baidu, Inc., Beijing, China","institution_ids":["https://openalex.org/I98301712"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5031669433","display_name":"Yifeng Shi","orcid":null},"institutions":[{"id":"https://openalex.org/I98301712","display_name":"Baidu (China)","ror":"https://ror.org/03vs3wt56","country_code":"CN","type":"company","lineage":["https://openalex.org/I98301712"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yifeng Shi","raw_affiliation_strings":["Baidu, Inc., Beijing, China"],"affiliations":[{"raw_affiliation_string":"Baidu, Inc., Beijing, China","institution_ids":["https://openalex.org/I98301712"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":11,"corresponding_author_ids":["https://openalex.org/A5015819673"],"corresponding_institution_ids":["https://openalex.org/I98301712"],"apc_list":null,"apc_paid":null,"fwci":2.0174,"has_fulltext":false,"cited_by_count":29,"citation_normalized_percentile":{"value":0.88803922,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1903","last_page":"1911"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9969000220298767,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8677951097488403},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.5619659423828125},{"id":"https://openalex.org/keywords/kernel","display_name":"Kernel (algebra)","score":0.4798833429813385},{"id":"https://openalex.org/keywords/range","display_name":"Range (aeronautics)","score":0.4761219620704651},{"id":"https://openalex.org/keywords/dimension","display_name":"Dimension (graph theory)","score":0.44904789328575134},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.43678322434425354},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4342239499092102},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.4339308738708496},{"id":"https://openalex.org/keywords/pruning","display_name":"Pruning","score":0.42496609687805176},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.35972321033477783}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8677951097488403},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.5619659423828125},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.4798833429813385},{"id":"https://openalex.org/C204323151","wikidata":"https://www.wikidata.org/wiki/Q905424","display_name":"Range (aeronautics)","level":2,"score":0.4761219620704651},{"id":"https://openalex.org/C33676613","wikidata":"https://www.wikidata.org/wiki/Q13415176","display_name":"Dimension (graph theory)","level":2,"score":0.44904789328575134},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.43678322434425354},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4342239499092102},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.4339308738708496},{"id":"https://openalex.org/C108010975","wikidata":"https://www.wikidata.org/wiki/Q500094","display_name":"Pruning","level":2,"score":0.42496609687805176},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.35972321033477783},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.0},{"id":"https://openalex.org/C6557445","wikidata":"https://www.wikidata.org/wiki/Q173113","display_name":"Agronomy","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C159985019","wikidata":"https://www.wikidata.org/wiki/Q181790","display_name":"Composite material","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3474085.3475344","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3474085.3475344","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 29th ACM International Conference on Multimedia","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":32,"referenced_works":["https://openalex.org/W1522734439","https://openalex.org/W1927052826","https://openalex.org/W1947481528","https://openalex.org/W2108598243","https://openalex.org/W2507009361","https://openalex.org/W2608988379","https://openalex.org/W2625366777","https://openalex.org/W2752782242","https://openalex.org/W2770804203","https://openalex.org/W2799176631","https://openalex.org/W2806331055","https://openalex.org/W2883429621","https://openalex.org/W2951019013","https://openalex.org/W2952186347","https://openalex.org/W2962744348","https://openalex.org/W2962899219","https://openalex.org/W2963091558","https://openalex.org/W2963155035","https://openalex.org/W2963524571","https://openalex.org/W2963820951","https://openalex.org/W2981385151","https://openalex.org/W2984287396","https://openalex.org/W2990152177","https://openalex.org/W2990503944","https://openalex.org/W2996901793","https://openalex.org/W3004505825","https://openalex.org/W3006408808","https://openalex.org/W3010010212","https://openalex.org/W3034572008","https://openalex.org/W3034768625","https://openalex.org/W3035141718","https://openalex.org/W3035303837"],"related_works":["https://openalex.org/W4293226380","https://openalex.org/W2373300491","https://openalex.org/W2395294869","https://openalex.org/W2378744544","https://openalex.org/W2594301978","https://openalex.org/W2379704676","https://openalex.org/W1998810860","https://openalex.org/W4206442282","https://openalex.org/W2384505857","https://openalex.org/W2355171581"],"abstract_inverted_index":{"Long-range":[0],"and":[1,8,23,101,142],"short-range":[2,20],"temporal":[3,50,87],"modeling":[4,22,117],"are":[5,182],"two":[6],"complementary":[7],"crucial":[9],"aspects":[10],"of":[11,15,44,170],"video":[12,46,123,134,157],"recognition.":[13],"Most":[14],"the":[16,31,49,106,167],"state-of-the-arts":[17],"focus":[18],"on":[19,132,179],"spatio-temporal":[21,42],"then":[24],"average":[25],"multiple":[26],"snippet-level":[27],"predictions":[28],"to":[29,64,75,84,113,144,154,177],"yield":[30],"final":[32,122],"video-level":[33,37],"prediction.":[34],"Thus,":[35],"their":[36],"prediction":[38],"does":[39],"not":[40],"consider":[41],"features":[43],"how":[45],"evolves":[47],"along":[48],"dimension.":[51],"In":[52],"this":[53],"paper,":[54],"we":[55,73],"introduce":[56],"a":[57,77,81],"novel":[58],"Dynamic":[59],"Segment":[60],"Aggregation":[61],"(DSA)":[62],"module":[63,95,100,151],"capture":[65],"relationship":[66],"among":[67,89],"snippets.":[68],"To":[69],"be":[70,103],"more":[71],"specific,":[72],"attempt":[74],"generate":[76],"dynamic":[78],"kernel":[79],"for":[80],"convolutional":[82],"operation":[83],"aggregate":[85],"long-range":[86,116],"information":[88],"adjacent":[90],"snippets":[91],"adaptively.":[92],"The":[93,121],"DSA":[94,150,165],"is":[96,152,173],"an":[97],"efficient":[98],"plug-and-play":[99],"can":[102],"combined":[104],"with":[105,118,164],"off-the-shelf":[107],"clip-based":[108],"models":[109,159],"(i.e.,":[110,137],"TSM,":[111],"I3D)":[112],"perform":[114],"powerful":[115],"minimal":[119],"overhead.":[120],"architecture,":[124],"coined":[125],"as":[126],"DSANet.":[127],"We":[128],"conduct":[129],"extensive":[130],"experiments":[131],"several":[133],"recognition":[135,158],"benchmarks":[136],"Mini-Kinetics-200,":[138],"Kinetics-400,":[139],"Something-Something":[140],"V1":[141],"ActivityNet)":[143],"show":[145],"its":[146],"superiority.":[147],"Our":[148],"proposed":[149],"shown":[153],"benefit":[155],"various":[156],"significantly.":[160],"For":[161],"example,":[162],"equipped":[163],"modules,":[166],"top-1":[168],"accuracy":[169],"I3D":[171],"ResNet-50":[172],"improved":[174],"from":[175],"74.9%":[176],"78.2%":[178],"Kinetics-400.":[180],"Codes":[181],"available":[183],"at":[184],"https://github.com/whwu95/DSANet.":[185]},"counts_by_year":[{"year":2025,"cited_by_count":8},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":9},{"year":2022,"cited_by_count":6},{"year":2021,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
