{"id":"https://openalex.org/W4414166015","doi":"https://doi.org/10.1109/avss65446.2025.11149978","title":"Are Attention Maps Richer than we Imagined for Action Recognition?","display_name":"Are Attention Maps Richer than we Imagined for Action Recognition?","publication_year":2025,"publication_date":"2025-08-11","ids":{"openalex":"https://openalex.org/W4414166015","doi":"https://doi.org/10.1109/avss65446.2025.11149978"},"language":"en","primary_location":{"id":"doi:10.1109/avss65446.2025.11149978","is_oa":false,"landing_page_url":"https://doi.org/10.1109/avss65446.2025.11149978","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Advanced Visual and Signal-Based Systems (AVSS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://hal.science/hal-05458820","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5057455578","display_name":"Tanay Agrawal","orcid":null},"institutions":[{"id":"https://openalex.org/I1326498283","display_name":"Institut national de recherche en informatique et en automatique","ror":"https://ror.org/02kvxyf05","country_code":"FR","type":"funder","lineage":["https://openalex.org/I1326498283"]}],"countries":["FR"],"is_corresponding":true,"raw_author_name":"Tanay Agrawal","raw_affiliation_strings":["INRIA Sophia Antipolis &#x2013; M&#x00E9;diterran&#x00E9;e,France"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"INRIA Sophia Antipolis &#x2013; M&#x00E9;diterran&#x00E9;e,France","institution_ids":["https://openalex.org/I1326498283"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111100684","display_name":"Abid Ali","orcid":null},"institutions":[{"id":"https://openalex.org/I1326498283","display_name":"Institut national de recherche en informatique et en automatique","ror":"https://ror.org/02kvxyf05","country_code":"FR","type":"funder","lineage":["https://openalex.org/I1326498283"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Abid Ali","raw_affiliation_strings":["INRIA Sophia Antipolis &#x2013; M&#x00E9;diterran&#x00E9;e,France"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"INRIA Sophia Antipolis &#x2013; M&#x00E9;diterran&#x00E9;e,France","institution_ids":["https://openalex.org/I1326498283"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113080270","display_name":"Antitza Dantcheva","orcid":null},"institutions":[{"id":"https://openalex.org/I1326498283","display_name":"Institut national de recherche en informatique et en automatique","ror":"https://ror.org/02kvxyf05","country_code":"FR","type":"funder","lineage":["https://openalex.org/I1326498283"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Antitza Dantcheva","raw_affiliation_strings":["INRIA Sophia Antipolis &#x2013; M&#x00E9;diterran&#x00E9;e,France"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"INRIA Sophia Antipolis &#x2013; M&#x00E9;diterran&#x00E9;e,France","institution_ids":["https://openalex.org/I1326498283"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5109863960","display_name":"Fran\u00e7ois Br\u00e9mond","orcid":null},"institutions":[{"id":"https://openalex.org/I1326498283","display_name":"Institut national de recherche en informatique et en automatique","ror":"https://ror.org/02kvxyf05","country_code":"FR","type":"funder","lineage":["https://openalex.org/I1326498283"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Francois Bremond","raw_affiliation_strings":["INRIA Sophia Antipolis &#x2013; M&#x00E9;diterran&#x00E9;e,France"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"INRIA Sophia Antipolis &#x2013; M&#x00E9;diterran&#x00E9;e,France","institution_ids":["https://openalex.org/I1326498283"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5057455578"],"corresponding_institution_ids":["https://openalex.org/I1326498283"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.21493348,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"9"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.972100019454956,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.7479000091552734},{"id":"https://openalex.org/keywords/popularity","display_name":"Popularity","score":0.6837999820709229},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.5259000062942505},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.4772000014781952},{"id":"https://openalex.org/keywords/transfer-of-learning","display_name":"Transfer of learning","score":0.3847000002861023},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.3749000132083893}],"concepts":[{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.7479000091552734},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7357000112533569},{"id":"https://openalex.org/C2780586970","wikidata":"https://www.wikidata.org/wiki/Q1357284","display_name":"Popularity","level":2,"score":0.6837999820709229},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.67330002784729},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.5259000062942505},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.4772000014781952},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4438999891281128},{"id":"https://openalex.org/C150899416","wikidata":"https://www.wikidata.org/wiki/Q1820378","display_name":"Transfer of learning","level":2,"score":0.3847000002861023},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.3749000132083893},{"id":"https://openalex.org/C2987834672","wikidata":"https://www.wikidata.org/wiki/Q4677630","display_name":"Action recognition","level":3,"score":0.3686000108718872},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.35280001163482666},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.3418000042438507},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.2565000057220459},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.2513999938964844}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/avss65446.2025.11149978","is_oa":false,"landing_page_url":"https://doi.org/10.1109/avss65446.2025.11149978","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Advanced Visual and Signal-Based Systems (AVSS)","raw_type":"proceedings-article"},{"id":"pmh:oai:HAL:hal-05458820v1","is_oa":true,"landing_page_url":"https://hal.science/hal-05458820","pdf_url":null,"source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"AVSS 2025 - IEEE International Conference on Advanced Video and Signal based Surveillance, IEEE, Aug 2025, Tainan, Taiwan","raw_type":"Conference papers"}],"best_oa_location":{"id":"pmh:oai:HAL:hal-05458820v1","is_oa":true,"landing_page_url":"https://hal.science/hal-05458820","pdf_url":null,"source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"AVSS 2025 - IEEE International Conference on Advanced Video and Signal based Surveillance, IEEE, Aug 2025, Tainan, Taiwan","raw_type":"Conference papers"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":67,"referenced_works":["https://openalex.org/W1522734439","https://openalex.org/W1903029394","https://openalex.org/W1984219317","https://openalex.org/W2016053056","https://openalex.org/W2102605133","https://openalex.org/W2156303437","https://openalex.org/W2625366777","https://openalex.org/W2883429621","https://openalex.org/W2948058585","https://openalex.org/W2963015194","https://openalex.org/W2963076818","https://openalex.org/W2963315828","https://openalex.org/W2963524571","https://openalex.org/W2963703197","https://openalex.org/W2981923053","https://openalex.org/W2990152177","https://openalex.org/W2990503944","https://openalex.org/W3034572008","https://openalex.org/W3035180180","https://openalex.org/W3035225512","https://openalex.org/W3094502228","https://openalex.org/W3109392981","https://openalex.org/W3110266941","https://openalex.org/W3126721948","https://openalex.org/W3127463479","https://openalex.org/W3153675281","https://openalex.org/W3172942063","https://openalex.org/W3173407577","https://openalex.org/W3173788106","https://openalex.org/W3195577433","https://openalex.org/W3213518743","https://openalex.org/W3215626407","https://openalex.org/W3217059257","https://openalex.org/W4214612132","https://openalex.org/W4214614183","https://openalex.org/W4214727094","https://openalex.org/W4221167396","https://openalex.org/W4225755514","https://openalex.org/W4226079235","https://openalex.org/W4229042118","https://openalex.org/W4282005462","https://openalex.org/W4282943820","https://openalex.org/W4287122891","https://openalex.org/W4295990387","https://openalex.org/W4296151206","https://openalex.org/W4306294758","https://openalex.org/W4310921506","https://openalex.org/W4312349930","https://openalex.org/W4312480274","https://openalex.org/W4312558481","https://openalex.org/W4312560592","https://openalex.org/W4312614039","https://openalex.org/W4312651322","https://openalex.org/W4312658081","https://openalex.org/W4312769131","https://openalex.org/W4312884055","https://openalex.org/W4312915422","https://openalex.org/W4366208220","https://openalex.org/W4379261327","https://openalex.org/W4379382445","https://openalex.org/W4385245566","https://openalex.org/W4386072015","https://openalex.org/W4386076661","https://openalex.org/W4386083024","https://openalex.org/W4390874610","https://openalex.org/W4403488721","https://openalex.org/W4411245363"],"related_works":[],"abstract_inverted_index":{"Deep":[0],"learning":[1],"models":[2,15,202],"are":[3],"becoming":[4],"more":[5],"general":[6],"and":[7,124,147,159,173,187,191,210],"robust":[8],"by":[9],"the":[10,33,69,97,115,154,160,168],"day.":[11],"Specifically,":[12],"image":[13,112,129],"foundation":[14],"have":[16,46,91],"recently":[17],"shown":[18],"exponential":[19],"growth.":[20],"In":[21],"this":[22,30,157,171,179],"work,":[23],"we":[24,45,52,166],"introduce":[25,60],"a":[26,47,65,78,110,211],"way":[27,66],"to":[28,67,133,177],"exploit":[29],"growth":[31],"in":[32,77,94,96,109],"field":[34,98],"of":[35,50,71,99,117,170],"video":[36,201],"classification.":[37],"The":[38],"basic":[39],"idea":[40,158],"here":[41],"is":[42,131],"that":[43,200],"if":[44],"good":[48],"understanding":[49],"space,":[51],"should":[53],"not":[54],"require":[55],"complicated":[56],"spatio-temporal":[57],"processing.":[58],"We":[59,87,182,197],"Attention":[61],"Map":[62],"(AM)":[63],"flow,":[64],"identify":[68],"location":[70],"local":[72],"changes":[73,123],"between":[74],"two":[75],"frames":[76],"video,":[79],"without":[80,114],"adding":[81],"additional":[82],"parameters":[83],"specifically":[84],"for":[85],"it.":[86,119],"utilise":[88],"adapters,":[89],"which":[90],"been":[92],"growing":[93],"popularity":[95],"parameterefficient":[100],"transfer":[101],"learning.":[102],"These":[103],"help":[104],"us":[105],"incorporate":[106],"AM":[107],"flow":[108],"pretrained":[111],"model":[113,130],"need":[116],"finetuning":[118],"With":[120],"just":[121],"these":[122,219],"minimal":[125,149],"temporal":[126],"processing,":[127],"an":[128],"able":[132],"achieve":[134,192],"state-of-the-":[135],"art":[136],"results":[137],"on":[138,207],"popular":[139],"action":[140],"recognition":[141],"datasets":[142,190,209],"with":[143],"low":[144],"training":[145,213],"time":[146],"requiring":[148],"pretraining.":[150],"This":[151],"work":[152,180,217],"explores":[153],"theory":[155],"behind":[156],"intricacies":[161],"involved.":[162],"Through":[163],"relevant":[164],"experiments,":[165],"show":[167,199],"efficacy":[169],"method":[172],"discuss":[174],"various":[175],"ideas":[176],"take":[178],"forward.":[181],"use":[183],"kinetics-400,":[184],"something-something":[185],"v2":[186],"Toyota":[188],"smarthome":[189],"state-of-the-art":[193],"or":[194],"comparable":[195],"results.":[196],"also":[198],"suffer":[203],"from":[204],"extensive":[205],"pretraining":[206],"multiple":[208],"large":[212],"time,":[214],"but":[215],"our":[216],"answers":[218],"problems.":[220],"actionrecognition":[221],"transformers":[222],"image-to-video-models":[223]},"counts_by_year":[],"updated_date":"2026-05-07T13:39:58.223016","created_date":"2025-10-10T00:00:00"}
