{"id":"https://openalex.org/W4390871670","doi":"https://doi.org/10.1109/iccv51070.2023.00937","title":"Few-Shot Common Action Localization via Cross-Attentional Fusion of Context and Temporal Dynamics","display_name":"Few-Shot Common Action Localization via Cross-Attentional Fusion of Context and Temporal Dynamics","publication_year":2023,"publication_date":"2023-10-01","ids":{"openalex":"https://openalex.org/W4390871670","doi":"https://doi.org/10.1109/iccv51070.2023.00937"},"language":"en","primary_location":{"id":"doi:10.1109/iccv51070.2023.00937","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccv51070.2023.00937","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE/CVF International Conference on Computer Vision (ICCV)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5056497425","display_name":"Juntae Lee","orcid":null},"institutions":[{"id":"https://openalex.org/I19268510","display_name":"Qualcomm (United Kingdom)","ror":"https://ror.org/04d3djg48","country_code":"GB","type":"company","lineage":["https://openalex.org/I19268510","https://openalex.org/I4210087596"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Juntae Lee","raw_affiliation_strings":["Qualcomm AI Research"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Qualcomm AI Research","institution_ids":["https://openalex.org/I19268510"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019095310","display_name":"Mihir Jain","orcid":"https://orcid.org/0000-0001-8929-3847"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mihir Jain","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5091430620","display_name":"Sungrack Yun","orcid":"https://orcid.org/0000-0003-2462-3854"},"institutions":[{"id":"https://openalex.org/I19268510","display_name":"Qualcomm (United Kingdom)","ror":"https://ror.org/04d3djg48","country_code":"GB","type":"company","lineage":["https://openalex.org/I19268510","https://openalex.org/I4210087596"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Sungrack Yun","raw_affiliation_strings":["Qualcomm AI Research"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Qualcomm AI Research","institution_ids":["https://openalex.org/I19268510"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.4491,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.65531798,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"10180","last_page":"10189"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.996999979019165,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/dynamics","display_name":"Dynamics (music)","score":0.6723858714103699},{"id":"https://openalex.org/keywords/shot","display_name":"Shot (pellet)","score":0.6617815494537354},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.6368241310119629},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6096090078353882},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.5876697301864624},{"id":"https://openalex.org/keywords/fusion","display_name":"Fusion","score":0.5231745839118958},{"id":"https://openalex.org/keywords/one-shot","display_name":"One shot","score":0.46495258808135986},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.42381593585014343},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.15288707613945007},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.08564251661300659},{"id":"https://openalex.org/keywords/geology","display_name":"Geology","score":0.07070636749267578},{"id":"https://openalex.org/keywords/materials-science","display_name":"Materials science","score":0.06796634197235107}],"concepts":[{"id":"https://openalex.org/C145912823","wikidata":"https://www.wikidata.org/wiki/Q113558","display_name":"Dynamics (music)","level":2,"score":0.6723858714103699},{"id":"https://openalex.org/C2778344882","wikidata":"https://www.wikidata.org/wiki/Q278938","display_name":"Shot (pellet)","level":2,"score":0.6617815494537354},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.6368241310119629},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6096090078353882},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.5876697301864624},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.5231745839118958},{"id":"https://openalex.org/C2992734406","wikidata":"https://www.wikidata.org/wiki/Q413267","display_name":"One shot","level":2,"score":0.46495258808135986},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.42381593585014343},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.15288707613945007},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.08564251661300659},{"id":"https://openalex.org/C127313418","wikidata":"https://www.wikidata.org/wiki/Q1069","display_name":"Geology","level":0,"score":0.07070636749267578},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.06796634197235107},{"id":"https://openalex.org/C191897082","wikidata":"https://www.wikidata.org/wiki/Q11467","display_name":"Metallurgy","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C24890656","wikidata":"https://www.wikidata.org/wiki/Q82811","display_name":"Acoustics","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C78519656","wikidata":"https://www.wikidata.org/wiki/Q101333","display_name":"Mechanical engineering","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iccv51070.2023.00937","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccv51070.2023.00937","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE/CVF International Conference on Computer Vision (ICCV)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":48,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W1522734439","https://openalex.org/W1927052826","https://openalex.org/W1945129080","https://openalex.org/W2336403884","https://openalex.org/W2471143248","https://openalex.org/W2519328139","https://openalex.org/W2593722617","https://openalex.org/W2597958930","https://openalex.org/W2604113307","https://openalex.org/W2798292345","https://openalex.org/W2884293275","https://openalex.org/W2887928923","https://openalex.org/W2962677524","https://openalex.org/W2962709777","https://openalex.org/W2962723986","https://openalex.org/W2962964995","https://openalex.org/W2963045696","https://openalex.org/W2963247196","https://openalex.org/W2963321993","https://openalex.org/W2964214371","https://openalex.org/W2980347982","https://openalex.org/W3009353929","https://openalex.org/W3014205599","https://openalex.org/W3034263732","https://openalex.org/W3034623254","https://openalex.org/W3034912730","https://openalex.org/W3035585099","https://openalex.org/W3035588244","https://openalex.org/W3097664769","https://openalex.org/W3106690272","https://openalex.org/W3171500338","https://openalex.org/W3173698268","https://openalex.org/W3174421047","https://openalex.org/W3175580044","https://openalex.org/W3202076256","https://openalex.org/W3203903323","https://openalex.org/W4213188130","https://openalex.org/W4214562728","https://openalex.org/W4221139382","https://openalex.org/W4283796707","https://openalex.org/W4319300476","https://openalex.org/W6728881024","https://openalex.org/W6751281049","https://openalex.org/W6767471572","https://openalex.org/W6775646717","https://openalex.org/W6790875704","https://openalex.org/W6802611020"],"related_works":["https://openalex.org/W2497720472","https://openalex.org/W4292659306","https://openalex.org/W3044321615","https://openalex.org/W2806221744","https://openalex.org/W2326937258","https://openalex.org/W394267150","https://openalex.org/W2773965352","https://openalex.org/W4294892107","https://openalex.org/W2357748469","https://openalex.org/W2392917037"],"abstract_inverted_index":{"The":[0],"goal":[1],"of":[2,89,134,179],"this":[3,33,63],"paper":[4],"is":[5,29,36,102],"to":[6,38,75,93,105,121,129],"localize":[7],"action":[8,25,46],"instances":[9,142],"in":[10,97,125,143,187],"a":[11,23,44,163],"long":[12],"untrimmed":[13],"query":[14,72,145,170],"video":[15,91,109,124,146,154,173],"using":[16,59],"just":[17],"meager":[18],"trimmed":[19],"support":[20,49,69,90,108,123,136,153,172],"videos":[21,70],"representing":[22,43],"common":[24,45],"whose":[26],"class":[27],"information":[28],"not":[30],"given.":[31],"In":[32,51,114,138,158],"task,":[34],"it":[35],"crucial":[37],"mine":[39],"reliable":[40],"temporal":[41,95,99],"cues":[42],"from":[47],"handful":[48],"videos.":[50,137],"our":[52,180],"work,":[53],"we":[54,65,86,160],"develop":[55,162],"an":[56],"attention":[57],"mechanism":[58],"cross-correlation.":[60],"Based":[61],"on":[62,168],"cross-attention,":[64],"first":[66],"transform":[67],"the":[68,106,112,117,126,135,140,144,151,169,177,183],"into":[71],"video\u2019s":[73],"context":[74],"emphasize":[76],"query-relevant":[77],"important":[78],"frames,":[79],"and":[80,132,171,191,193],"suppress":[81],"less":[82],"relevant":[83],"ones.":[84],"Next,":[85],"summarize":[87],"sub-sequences":[88],"frames":[92],"represent":[94],"dynamics":[96],"coarse":[98],"granularity,":[100],"which":[101],"then":[103],"propagated":[104],"fine-grained":[107],"features":[110],"through":[111],"cross-attention.":[113],"each":[115,122,195],"case,":[116],"cross-attentions":[118],"are":[119,147],"applied":[120],"individual-to-all":[127],"strategy":[128],"balance":[130],"heterogeneity":[131],"compatibility":[133],"contrast,":[139],"candidate":[141],"lastly":[148],"attended":[149],"by":[150],"resulting":[152],"features,":[155],"at":[156],"once.":[157],"addition,":[159],"also":[161],"relational":[164],"classifier":[165],"head":[166],"based":[167],"representations.":[174],"We":[175],"show":[176],"effectiveness":[178],"work":[181],"with":[182],"state-of-the-art":[184],"(SOTA)":[185],"performance":[186],"benchmark":[188],"datasets":[189],"(ActivityNet1.3":[190],"THUMOS14),":[192],"analyze":[194],"component":[196],"extensively.":[197]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":2}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
