{"id":"https://openalex.org/W4404787826","doi":"https://doi.org/10.1109/tetci.2024.3499995","title":"LoCATe-GAT: Modeling Multi-Scale Local Context and Action Relationships for Zero-Shot Action Recognition","display_name":"LoCATe-GAT: Modeling Multi-Scale Local Context and Action Relationships for Zero-Shot Action Recognition","publication_year":2024,"publication_date":"2024-11-27","ids":{"openalex":"https://openalex.org/W4404787826","doi":"https://doi.org/10.1109/tetci.2024.3499995"},"language":"en","primary_location":{"id":"doi:10.1109/tetci.2024.3499995","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tetci.2024.3499995","pdf_url":null,"source":{"id":"https://openalex.org/S4210210251","display_name":"IEEE Transactions on Emerging Topics in Computational Intelligence","issn_l":"2471-285X","issn":["2471-285X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Emerging Topics in Computational Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5017150634","display_name":"Sandipan Sarma","orcid":"https://orcid.org/0000-0003-4619-3058"},"institutions":[{"id":"https://openalex.org/I1317621060","display_name":"Indian Institute of Technology Guwahati","ror":"https://ror.org/0022nd079","country_code":"IN","type":"education","lineage":["https://openalex.org/I1317621060"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"Sandipan Sarma","raw_affiliation_strings":["Department of Computer Science and Engineering, Indian Institute of Technology Guwahati, Guwahati, India"],"raw_orcid":"https://orcid.org/0000-0003-4619-3058","affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Indian Institute of Technology Guwahati, Guwahati, India","institution_ids":["https://openalex.org/I1317621060"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5093417652","display_name":"Divyam Singal","orcid":null},"institutions":[{"id":"https://openalex.org/I1317621060","display_name":"Indian Institute of Technology Guwahati","ror":"https://ror.org/0022nd079","country_code":"IN","type":"education","lineage":["https://openalex.org/I1317621060"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Divyam Singal","raw_affiliation_strings":["Department of Computer Science and Engineering, Indian Institute of Technology Guwahati, Guwahati, India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Indian Institute of Technology Guwahati, Guwahati, India","institution_ids":["https://openalex.org/I1317621060"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5090992514","display_name":"Arijit Sur","orcid":"https://orcid.org/0000-0002-9038-8138"},"institutions":[{"id":"https://openalex.org/I1317621060","display_name":"Indian Institute of Technology Guwahati","ror":"https://ror.org/0022nd079","country_code":"IN","type":"education","lineage":["https://openalex.org/I1317621060"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Arijit Sur","raw_affiliation_strings":["Department of Computer Science and Engineering, Indian Institute of Technology Guwahati, Guwahati, India"],"raw_orcid":"https://orcid.org/0000-0002-9038-8138","affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Indian Institute of Technology Guwahati, Guwahati, India","institution_ids":["https://openalex.org/I1317621060"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5017150634"],"corresponding_institution_ids":["https://openalex.org/I1317621060"],"apc_list":null,"apc_paid":null,"fwci":0.4762,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.65925293,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":96},"biblio":{"volume":"9","issue":"4","first_page":"2793","last_page":"2805"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12740","display_name":"Gait Recognition and Analysis","score":0.9864000082015991,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/zero","display_name":"Zero (linguistics)","score":0.6508925557136536},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.6072219610214233},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.6043353080749512},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.5336378812789917},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.47100749611854553},{"id":"https://openalex.org/keywords/action-recognition","display_name":"Action recognition","score":0.4653765559196472},{"id":"https://openalex.org/keywords/shot","display_name":"Shot (pellet)","score":0.44205591082572937},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3842860162258148},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.37804508209228516},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.18283909559249878},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.16644373536109924},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.13339900970458984},{"id":"https://openalex.org/keywords/cartography","display_name":"Cartography","score":0.07990732789039612},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.07593134045600891}],"concepts":[{"id":"https://openalex.org/C2780813799","wikidata":"https://www.wikidata.org/wiki/Q3274237","display_name":"Zero (linguistics)","level":2,"score":0.6508925557136536},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.6072219610214233},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.6043353080749512},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.5336378812789917},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.47100749611854553},{"id":"https://openalex.org/C2987834672","wikidata":"https://www.wikidata.org/wiki/Q4677630","display_name":"Action recognition","level":3,"score":0.4653765559196472},{"id":"https://openalex.org/C2778344882","wikidata":"https://www.wikidata.org/wiki/Q278938","display_name":"Shot (pellet)","level":2,"score":0.44205591082572937},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3842860162258148},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.37804508209228516},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.18283909559249878},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.16644373536109924},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.13339900970458984},{"id":"https://openalex.org/C58640448","wikidata":"https://www.wikidata.org/wiki/Q42515","display_name":"Cartography","level":1,"score":0.07990732789039612},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.07593134045600891},{"id":"https://openalex.org/C178790620","wikidata":"https://www.wikidata.org/wiki/Q11351","display_name":"Organic chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tetci.2024.3499995","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tetci.2024.3499995","pdf_url":null,"source":{"id":"https://openalex.org/S4210210251","display_name":"IEEE Transactions on Emerging Topics in Computational Intelligence","issn_l":"2471-285X","issn":["2471-285X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Emerging Topics in Computational Intelligence","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.41999998688697815,"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":82,"referenced_works":["https://openalex.org/W24089286","https://openalex.org/W1927052826","https://openalex.org/W2044913453","https://openalex.org/W2064851185","https://openalex.org/W2100771357","https://openalex.org/W2126579184","https://openalex.org/W2250539671","https://openalex.org/W2289084343","https://openalex.org/W2334493732","https://openalex.org/W2463762378","https://openalex.org/W2507611421","https://openalex.org/W2520613337","https://openalex.org/W2605035112","https://openalex.org/W2619947201","https://openalex.org/W2724511873","https://openalex.org/W2810685774","https://openalex.org/W2887051120","https://openalex.org/W2904378456","https://openalex.org/W2928165649","https://openalex.org/W2928966231","https://openalex.org/W2962858109","https://openalex.org/W2963152432","https://openalex.org/W2963499153","https://openalex.org/W2963689837","https://openalex.org/W2963783448","https://openalex.org/W2965373098","https://openalex.org/W3004319625","https://openalex.org/W3016459781","https://openalex.org/W3035254087","https://openalex.org/W3035524453","https://openalex.org/W3080358492","https://openalex.org/W3080742155","https://openalex.org/W3081704724","https://openalex.org/W3092828241","https://openalex.org/W3113141731","https://openalex.org/W3118716190","https://openalex.org/W3126721948","https://openalex.org/W3153979265","https://openalex.org/W3164335275","https://openalex.org/W3175334845","https://openalex.org/W3175528717","https://openalex.org/W3185605671","https://openalex.org/W3200114289","https://openalex.org/W3210609762","https://openalex.org/W3215626407","https://openalex.org/W4205460703","https://openalex.org/W4214746887","https://openalex.org/W4220910168","https://openalex.org/W4221152513","https://openalex.org/W4289752563","https://openalex.org/W4292974679","https://openalex.org/W4294170691","https://openalex.org/W4312254032","https://openalex.org/W4312480274","https://openalex.org/W4312584871","https://openalex.org/W4312614039","https://openalex.org/W4312769131","https://openalex.org/W4313159427","https://openalex.org/W4315606144","https://openalex.org/W4322706798","https://openalex.org/W4361802074","https://openalex.org/W4362653498","https://openalex.org/W4368232702","https://openalex.org/W4380032301","https://openalex.org/W4381198761","https://openalex.org/W4385800770","https://openalex.org/W4386377770","https://openalex.org/W4386973921","https://openalex.org/W4390523490","https://openalex.org/W4390872437","https://openalex.org/W4394698946","https://openalex.org/W6600983433","https://openalex.org/W6726873649","https://openalex.org/W6736160952","https://openalex.org/W6754337694","https://openalex.org/W6766578407","https://openalex.org/W6782388713","https://openalex.org/W6790019176","https://openalex.org/W6791353385","https://openalex.org/W6801567822","https://openalex.org/W6803872405","https://openalex.org/W6955071965"],"related_works":["https://openalex.org/W2074502265","https://openalex.org/W4214877189","https://openalex.org/W2773965352","https://openalex.org/W2381179799","https://openalex.org/W4411535265","https://openalex.org/W2980279061","https://openalex.org/W2334685461","https://openalex.org/W2366718574","https://openalex.org/W1576128429","https://openalex.org/W2269464716"],"abstract_inverted_index":{"The":[0],"increasing":[1],"number":[2],"of":[3,55,61,184,213],"actions":[4],"in":[5,191],"the":[6,53,57,113,141,155,219,234],"real":[7],"world":[8],"makes":[9],"it":[10],"difficult":[11],"for":[12,30,47,109],"traditional":[13],"deep-learning":[14],"models":[15,26,37,144],"to":[16,40],"recognize":[17],"unseen":[18],"actions.":[19],"Recently,":[20],"pretrained":[21,102],"contrastive":[22],"image-based":[23],"visual-language":[24],"(I-VL)":[25],"have":[27],"been":[28,45],"adapted":[29],"efficient":[31],"\u201czero-shot\u201d":[32],"scene":[33],"understanding.":[34],"Pairing":[35],"such":[36],"with":[38,154],"transformers":[39],"implement":[41],"temporal":[42,138],"modeling":[43,56],"has":[44],"rewarding":[46],"zero-shot":[48],"action":[49,64],"recognition":[50],"(ZSAR).":[51],"However,":[52],"significance":[54],"local":[58,131],"spatial":[59],"context":[60,132],"objects":[62],"and":[63,88,96,117,123,149,171,186,193,205,215,226,230],"environments":[65],"remains":[66],"unexplored.":[67],"In":[68],"this":[69],"work,":[70],"we":[71,175,180,223],"propose":[72],"a":[73,81,89,101,151,210],"ZSAR":[74,198],"framework":[75],"called":[76],"<italic":[77],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[78],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">LoCATe-GAT</i>,":[79],"comprising":[80],"novel":[82],"Local":[83],"Context-Aggregating":[84],"Temporal":[85],"transformer":[86],"(LoCATe)":[87],"Graph":[90],"Attention":[91],"Network":[92],"(GAT).":[93],"Specifically,":[94,179],"image":[95],"text":[97],"encodings":[98],"extracted":[99],"from":[100],"I-VL":[103],"model":[104],"are":[105],"used":[106],"as":[107,232],"inputs":[108],"LoCATe-GAT.":[110],"Motivated":[111],"by":[112,159],"observation":[114],"that":[115],"object-centric":[116],"environmental":[118],"contexts":[119],"drive":[120],"both":[121],"distinguishability":[122],"functional":[124],"similarity":[125],"between":[126,147],"actions,":[127],"LoCATe":[128],"captures":[129],"multi-scale":[130],"using":[133],"dilated":[134],"convolutional":[135],"layers":[136],"during":[137],"modeling.":[139],"Furthermore,":[140],"proposed":[142],"GAT":[143],"semantic":[145],"relationships":[146],"classes":[148],"achieves":[150,209],"strong":[152],"synergy":[153],"video":[156],"embeddings":[157],"produced":[158],"LoCATe.":[160],"Extensive":[161],"experiments":[162],"on":[163,188,195,228],"four":[164],"widely-used":[165],"benchmarks":[166],"\u2013":[167,173],"UCF101,":[168],"HMDB51,":[169],"ActivityNet,":[170],"Kinetics":[172],"show":[174],"achieve":[176],"state-of-the-art":[177],"results.":[178],"obtain":[181],"relative":[182,211],"gains":[183],"3.8%":[185],"4.8%":[187],"these":[189],"datasets":[190,202],"conventional":[192],"16.6%":[194],"UCF101in":[196],"generalized":[197],"settings.":[199],"For":[200],"large-scale":[201],"like":[203],"ActivityNet":[204],"Kinetics,":[206],"our":[207],"method":[208],"gain":[212,224],"31.8%":[214],"27.9%,":[216],"respectively,":[217],"over":[218],"previous":[220],"methods.":[221],"Additionally,":[222],"25.3%":[225],"18.4%":[227],"UCF101":[229],"HMDB51":[231],"per":[233],"recent":[235],"\u201cTruZe\u201d":[236],"evaluation":[237],"protocol.":[238]},"counts_by_year":[{"year":2025,"cited_by_count":2}],"updated_date":"2025-12-22T23:10:17.713674","created_date":"2025-10-10T00:00:00"}
