{"id":"https://openalex.org/W4393191810","doi":"https://doi.org/10.1145/3654671","title":"Discriminative Segment Focus Network for Fine-grained Video Action Recognition","display_name":"Discriminative Segment Focus Network for Fine-grained Video Action Recognition","publication_year":2024,"publication_date":"2024-03-26","ids":{"openalex":"https://openalex.org/W4393191810","doi":"https://doi.org/10.1145/3654671"},"language":"en","primary_location":{"id":"doi:10.1145/3654671","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3654671","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3654671","source":{"id":"https://openalex.org/S19610489","display_name":"ACM Transactions on Multimedia Computing Communications and Applications","issn_l":"1551-6857","issn":["1551-6857","1551-6865"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Multimedia Computing, Communications, and Applications","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3654671","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5020149992","display_name":"Baoli Sun","orcid":"https://orcid.org/0000-0002-2861-4288"},"institutions":[{"id":"https://openalex.org/I27357992","display_name":"Dalian University of Technology","ror":"https://ror.org/023hj5876","country_code":"CN","type":"education","lineage":["https://openalex.org/I27357992"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Baoli Sun","raw_affiliation_strings":["Dalian University of Technology, Dalian, China"],"affiliations":[{"raw_affiliation_string":"Dalian University of Technology, Dalian, China","institution_ids":["https://openalex.org/I27357992"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055580414","display_name":"Xinchen Ye","orcid":"https://orcid.org/0000-0001-5328-3911"},"institutions":[{"id":"https://openalex.org/I27357992","display_name":"Dalian University of Technology","ror":"https://ror.org/023hj5876","country_code":"CN","type":"education","lineage":["https://openalex.org/I27357992"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xinchen Ye","raw_affiliation_strings":["Dalian University of Technology, Dalian, China"],"affiliations":[{"raw_affiliation_string":"Dalian University of Technology, Dalian, China","institution_ids":["https://openalex.org/I27357992"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060794007","display_name":"Tiantian Yan","orcid":"https://orcid.org/0000-0002-0811-9706"},"institutions":[{"id":"https://openalex.org/I4210092944","display_name":"Dalian University","ror":"https://ror.org/00g2ypp58","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210092944"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tiantian Yan","raw_affiliation_strings":["Dalian University, Dalian, China"],"affiliations":[{"raw_affiliation_string":"Dalian University, Dalian, China","institution_ids":["https://openalex.org/I4210092944"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100438119","display_name":"Zhihui Wang","orcid":"https://orcid.org/0000-0002-5011-9726"},"institutions":[{"id":"https://openalex.org/I129604602","display_name":"University of Sydney","ror":"https://ror.org/0384j8v12","country_code":"AU","type":"education","lineage":["https://openalex.org/I129604602"]},{"id":"https://openalex.org/I27357992","display_name":"Dalian University of Technology","ror":"https://ror.org/023hj5876","country_code":"CN","type":"education","lineage":["https://openalex.org/I27357992"]}],"countries":["AU","CN"],"is_corresponding":false,"raw_author_name":"Zhihui Wang","raw_affiliation_strings":["Dalian University of Technology, Dalian, China","The University of Sydney, Sydney, Australia"],"affiliations":[{"raw_affiliation_string":"Dalian University of Technology, Dalian, China","institution_ids":["https://openalex.org/I27357992"]},{"raw_affiliation_string":"The University of Sydney, Sydney, Australia","institution_ids":["https://openalex.org/I129604602"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100616471","display_name":"Haojie Li","orcid":"https://orcid.org/0000-0003-3882-2205"},"institutions":[{"id":"https://openalex.org/I80143920","display_name":"Shandong University of Science and Technology","ror":"https://ror.org/04gtjhw98","country_code":"CN","type":"education","lineage":["https://openalex.org/I80143920"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haojie Li","raw_affiliation_strings":["Shandong University of Science and Technology, Qingdao, China"],"affiliations":[{"raw_affiliation_string":"Shandong University of Science and Technology, Qingdao, China","institution_ids":["https://openalex.org/I80143920"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100443935","display_name":"Zhiyong Wang","orcid":"https://orcid.org/0000-0002-8043-0312"},"institutions":[{"id":"https://openalex.org/I27357992","display_name":"Dalian University of Technology","ror":"https://ror.org/023hj5876","country_code":"CN","type":"education","lineage":["https://openalex.org/I27357992"]},{"id":"https://openalex.org/I129604602","display_name":"University of Sydney","ror":"https://ror.org/0384j8v12","country_code":"AU","type":"education","lineage":["https://openalex.org/I129604602"]}],"countries":["AU","CN"],"is_corresponding":false,"raw_author_name":"Zhiyong Wang","raw_affiliation_strings":["Dalian University of Technology, Dalian, China","The University of Sydney, Sydney, Australia"],"affiliations":[{"raw_affiliation_string":"Dalian University of Technology, Dalian, China","institution_ids":["https://openalex.org/I27357992"]},{"raw_affiliation_string":"The University of Sydney, Sydney, Australia","institution_ids":["https://openalex.org/I129604602"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5020149992"],"corresponding_institution_ids":["https://openalex.org/I27357992"],"apc_list":null,"apc_paid":null,"fwci":1.2999,"has_fulltext":true,"cited_by_count":5,"citation_normalized_percentile":{"value":0.80071027,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":"20","issue":"7","first_page":"1","last_page":"20"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9941999912261963,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.8113111257553101},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.6761268377304077},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6658053398132324},{"id":"https://openalex.org/keywords/action-recognition","display_name":"Action recognition","score":0.5444572567939758},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5325763821601868},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4459196925163269},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.4423050284385681}],"concepts":[{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.8113111257553101},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.6761268377304077},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6658053398132324},{"id":"https://openalex.org/C2987834672","wikidata":"https://www.wikidata.org/wiki/Q4677630","display_name":"Action recognition","level":3,"score":0.5444572567939758},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5325763821601868},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4459196925163269},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.4423050284385681},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3654671","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3654671","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3654671","source":{"id":"https://openalex.org/S19610489","display_name":"ACM Transactions on Multimedia Computing Communications and Applications","issn_l":"1551-6857","issn":["1551-6857","1551-6865"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Multimedia Computing, Communications, and Applications","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1145/3654671","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3654671","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3654671","source":{"id":"https://openalex.org/S19610489","display_name":"ACM Transactions on Multimedia Computing Communications and Applications","issn_l":"1551-6857","issn":["1551-6857","1551-6865"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Multimedia Computing, Communications, and Applications","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10","score":0.7300000190734863}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4393191810.pdf","grobid_xml":"https://content.openalex.org/works/W4393191810.grobid-xml"},"referenced_works_count":28,"referenced_works":["https://openalex.org/W2116341502","https://openalex.org/W2296703396","https://openalex.org/W2464235600","https://openalex.org/W2604314403","https://openalex.org/W2795043468","https://openalex.org/W2963246338","https://openalex.org/W2972743300","https://openalex.org/W3099204742","https://openalex.org/W3110854813","https://openalex.org/W3159051440","https://openalex.org/W3185943380","https://openalex.org/W3189670121","https://openalex.org/W3212852649","https://openalex.org/W3212953023","https://openalex.org/W4214612132","https://openalex.org/W4247950230","https://openalex.org/W4281666112","https://openalex.org/W4281749424","https://openalex.org/W4296913481","https://openalex.org/W4306319959","https://openalex.org/W4321770538","https://openalex.org/W4324394311","https://openalex.org/W4377096805","https://openalex.org/W4379986307","https://openalex.org/W4386091161","https://openalex.org/W4386195714","https://openalex.org/W6757634740","https://openalex.org/W6855451908"],"related_works":["https://openalex.org/W4389116644","https://openalex.org/W2153315159","https://openalex.org/W3103844505","https://openalex.org/W259157601","https://openalex.org/W2404514746","https://openalex.org/W1652783584","https://openalex.org/W2082783427","https://openalex.org/W1576128429","https://openalex.org/W2182357018","https://openalex.org/W2269464716"],"abstract_inverted_index":{"Fine-grained":[0],"video":[1,81,170],"action":[2,19,82,165,181,190],"recognition":[3,20,182,191],"aims":[4],"at":[5,100],"identifying":[6],"minor":[7],"and":[8,43,74,104,143,186,188,195],"discriminative":[9,36,76,117],"variations":[10,45],"among":[11,35],"fine":[12],"categories":[13],"of":[14,71,134,147,167,200],"actions.":[15,55],"While":[16],"many":[17],"recent":[18],"methods":[21],"have":[22],"been":[23,47],"proposed":[24],"to":[25,31,39,67,124],"better":[26],"model":[27,32],"spatio-temporal":[28],"representations,":[29],"how":[30],"the":[33,69,110,126,131,138,141,144,163,168,198,205],"interactions":[34],"atomic":[37],"actions":[38],"effectively":[40],"characterize":[41],"inter-class":[42],"intra-class":[44],"has":[46],"neglected,":[48],"which":[49,93],"is":[50,122],"vital":[51],"for":[52,79,171],"understanding":[53],"fine-grained":[54,80,180],"In":[56],"this":[57],"work,":[58],"we":[59,85],"devise":[60],"a":[61,87,116,148,152],"Discriminative":[62],"Segment":[63],"Focus":[64],"Network":[65],"(DSFNet)":[66],"mine":[68],"discriminability":[70,142],"segment":[72,107,118,150,158],"correlations":[73,96,111],"localize":[75,125],"action-relevant":[77,128],"segments":[78,99,129],"recognition.":[83,174],"Firstly,":[84],"propose":[86],"hierarchic":[88],"correlation":[89],"reasoning":[90],"(HCR)":[91],"module":[92,121],"explicitly":[94],"establishes":[95],"between":[97,140],"different":[98],"multiple":[101],"temporal":[102],"scales":[103],"enhances":[105],"each":[106],"by":[108,136],"exploiting":[109],"with":[112,151,162,204],"other":[113],"segments.":[114],"Secondly,":[115],"focus":[119],"(DSF)":[120],"devised":[123],"most":[127],"from":[130],"enhanced":[132],"representations":[133,159],"HCR":[135],"enforcing":[137],"consistency":[139,153],"classification":[145],"confidence":[146],"given":[149],"constraint.":[154],"Finally,":[155],"these":[156],"localized":[157],"are":[160],"combined":[161],"global":[164],"representation":[166],"whole":[169],"boosting":[172],"final":[173],"Extensive":[175],"experimental":[176],"results":[177],"on":[178],"two":[179,189],"datasets,":[183,192],"i.e.,":[184,193],"FineGym":[185],"Diving48,":[187],"Kinetics400":[194],"Something-Something,":[196],"demonstrate":[197],"effectiveness":[199],"our":[201],"approach":[202],"compared":[203],"state-of-the-art":[206],"methods.":[207]},"counts_by_year":[{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":1}],"updated_date":"2026-03-09T08:58:05.943551","created_date":"2025-10-10T00:00:00"}
