{"id":"https://openalex.org/W7106827576","doi":"https://doi.org/10.48550/arxiv.2511.19928","title":"Context-Aware Token Pruning and Discriminative Selective Attention for Transformer Tracking","display_name":"Context-Aware Token Pruning and Discriminative Selective Attention for Transformer Tracking","publication_year":2025,"publication_date":"2025-11-25","ids":{"openalex":"https://openalex.org/W7106827576","doi":"https://doi.org/10.48550/arxiv.2511.19928"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2511.19928","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2511.19928","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2511.19928","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Kugarajeevan, Janani","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Kugarajeevan, Janani","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Kokul, Thanikasalam","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kokul, Thanikasalam","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Ramanan, Amirthalingam","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ramanan, Amirthalingam","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Fernando, Subha","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fernando, Subha","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9758999943733215,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9758999943733215,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11707","display_name":"Gaze Tracking and Assistive Technology","score":0.003800000064074993,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.002899999963119626,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.8489000201225281},{"id":"https://openalex.org/keywords/security-token","display_name":"Security token","score":0.817799985408783},{"id":"https://openalex.org/keywords/bittorrent-tracker","display_name":"BitTorrent tracker","score":0.5724999904632568},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.5687999725341797},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.48809999227523804},{"id":"https://openalex.org/keywords/pruning","display_name":"Pruning","score":0.4456999897956848},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.4018000066280365}],"concepts":[{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.8489000201225281},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.817799985408783},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7642999887466431},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5874000191688538},{"id":"https://openalex.org/C57501372","wikidata":"https://www.wikidata.org/wiki/Q2021268","display_name":"BitTorrent tracker","level":3,"score":0.5724999904632568},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.5687999725341797},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.48809999227523804},{"id":"https://openalex.org/C108010975","wikidata":"https://www.wikidata.org/wiki/Q500094","display_name":"Pruning","level":2,"score":0.4456999897956848},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.4018000066280365},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.38749998807907104},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.3366999924182892},{"id":"https://openalex.org/C56461940","wikidata":"https://www.wikidata.org/wiki/Q970687","display_name":"Eye tracking","level":2,"score":0.3301999866962433},{"id":"https://openalex.org/C2775936607","wikidata":"https://www.wikidata.org/wiki/Q466845","display_name":"Tracking (education)","level":2,"score":0.3260999917984009},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.2782999873161316},{"id":"https://openalex.org/C97854310","wikidata":"https://www.wikidata.org/wiki/Q19541","display_name":"Search engine","level":2,"score":0.2597000002861023},{"id":"https://openalex.org/C28855332","wikidata":"https://www.wikidata.org/wiki/Q198099","display_name":"Quantization (signal processing)","level":2,"score":0.25690001249313354},{"id":"https://openalex.org/C46686674","wikidata":"https://www.wikidata.org/wiki/Q466303","display_name":"Boosting (machine learning)","level":2,"score":0.2513999938964844}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2511.19928","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2511.19928","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2511.19928","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2511.19928","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10","score":0.7897699475288391}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"One-stream":[0],"Transformer-based":[1],"trackers":[2],"have":[3,46],"demonstrated":[4],"remarkable":[5],"performance":[6,217],"by":[7],"concatenating":[8],"template":[9,35,201],"and":[10,69,109,209],"search":[11,28,80,133,151],"region":[12,152,196],"tokens,":[13,202],"thereby":[14,203],"enabling":[15,22],"joint":[16],"attention":[17,169,177],"across":[18,218],"all":[19],"tokens.":[20,211],"However,":[21],"an":[23,227],"excessive":[24],"proportion":[25],"of":[26,65,76,131,207,230],"background":[27,51,108,145,164,208],"tokens":[29,36,57,81,111,146,189],"to":[30,32,49,62,87,104,127,197,199],"attend":[31,198],"the":[33,38,59,63,74,79,84,90,129,138,150,155,159,179,183,200,205],"target":[34,188],"weakens":[37],"tracker's":[39,85],"discriminative":[40,167],"capability.":[41],"Several":[42],"token":[43,134],"pruning":[44],"methods":[45],"been":[47],"proposed":[48,213],"mitigate":[50],"interference;":[52],"however,":[53],"they":[54],"often":[55],"remove":[56],"near":[58],"target,":[60],"leading":[61],"loss":[64],"essential":[66],"contextual":[67,156],"information":[68],"degraded":[70],"tracking":[71,101],"performance.":[72],"Moreover,":[73],"presence":[75],"distractors":[77],"within":[78],"further":[82,162],"reduces":[83],"ability":[86],"accurately":[88],"identify":[89],"target.":[91,139,160],"To":[92,161],"address":[93],"these":[94,142],"limitations,":[95],"we":[96],"propose":[97],"CPDATrack,":[98],"a":[99,117,166,194],"novel":[100],"framework":[102],"designed":[103],"suppress":[105,163],"interference":[106],"from":[107,149,193],"distractor":[110,210],"while":[112,153],"enhancing":[113],"computational":[114],"efficiency.":[115],"First,":[116],"learnable":[118],"module":[119],"is":[120,171],"integrated":[121],"between":[122],"two":[123],"designated":[124],"encoder":[125,185],"layers":[126],"estimate":[128],"probability":[130],"each":[132],"being":[135],"associated":[136],"with":[137],"Based":[140],"on":[141,222],"estimates,":[143],"less-informative":[144],"are":[147,190],"pruned":[148],"preserving":[154],"cues":[157],"surrounding":[158],"interference,":[165],"selective":[168],"mechanism":[170],"employed":[172],"that":[173],"fully":[174],"blocks":[175],"search-to-template":[176],"in":[178],"early":[180],"layers.":[181],"In":[182],"subsequent":[184],"layers,":[186],"high-probability":[187],"selectively":[191],"extracted":[192],"localized":[195],"reducing":[204],"influence":[206],"The":[212],"CPDATrack":[214],"achieves":[215],"state-of-the-art":[216],"multiple":[219],"benchmarks,":[220],"particularly":[221],"GOT-10k,":[223],"where":[224],"it":[225],"attains":[226],"average":[228],"overlap":[229],"75.1":[231],"percent.":[232]},"counts_by_year":[],"updated_date":"2025-11-28T02:12:24.556248","created_date":"2025-11-28T00:00:00"}
