{"id":"https://openalex.org/W7141726817","doi":"https://doi.org/10.48550/arxiv.2603.25072","title":"GIFT: Global Irreplaceability Frame Targeting for Efficient Video Understanding","display_name":"GIFT: Global Irreplaceability Frame Targeting for Efficient Video Understanding","publication_year":2026,"publication_date":"2026-03-26","ids":{"openalex":"https://openalex.org/W7141726817","doi":"https://doi.org/10.48550/arxiv.2603.25072"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.25072","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.25072","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.25072","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5130797111","display_name":"Junpeng Ma","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Ma, Junpeng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130809457","display_name":"Sashuai Zhou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Sashuai","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130776926","display_name":"Guanghao Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Guanghao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130731737","display_name":"Xin Gao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gao, Xin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130805222","display_name":"Yue Cao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cao, Yue","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130758226","display_name":"Hengyu Zeng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zeng, Hengyu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130746340","display_name":"Yuxiang Yan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yan, Yuxiang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130775160","display_name":"Zhibin Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Zhibin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130726031","display_name":"Jun Song","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Song, Jun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130785335","display_name":"Bo Zheng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zheng, Bo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130799635","display_name":"Shanghang Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Shanghang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5130796536","display_name":"Jian Pu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pu, Jian","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":12,"corresponding_author_ids":["https://openalex.org/A5130797111"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.8285999894142151,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.8285999894142151,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.0649000033736229,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.03060000017285347,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.6521000266075134},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.6442999839782715},{"id":"https://openalex.org/keywords/frame","display_name":"Frame (networking)","score":0.6349999904632568},{"id":"https://openalex.org/keywords/uniqueness","display_name":"Uniqueness","score":0.46959999203681946},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.46560001373291016},{"id":"https://openalex.org/keywords/core","display_name":"Core (optical fiber)","score":0.4262999892234802}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7954999804496765},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.6521000266075134},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.6442999839782715},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.6349999904632568},{"id":"https://openalex.org/C2777021972","wikidata":"https://www.wikidata.org/wiki/Q22976830","display_name":"Uniqueness","level":2,"score":0.46959999203681946},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.46560001373291016},{"id":"https://openalex.org/C2164484","wikidata":"https://www.wikidata.org/wiki/Q5170150","display_name":"Core (optical fiber)","level":2,"score":0.4262999892234802},{"id":"https://openalex.org/C51823790","wikidata":"https://www.wikidata.org/wiki/Q504353","display_name":"Greedy algorithm","level":2,"score":0.4260999858379364},{"id":"https://openalex.org/C158154518","wikidata":"https://www.wikidata.org/wiki/Q7310970","display_name":"Relevance (law)","level":2,"score":0.41110000014305115},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3379000127315521},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.3149999976158142},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3010999858379364},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.2948000133037567},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.28679999709129333},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.263700008392334},{"id":"https://openalex.org/C114289077","wikidata":"https://www.wikidata.org/wiki/Q3284399","display_name":"Statistical model","level":2,"score":0.26080000400543213}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.25072","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.25072","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.25072","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.25072","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","score":0.7400804162025452,"display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Video":[0],"Large":[1],"Language":[2],"Models":[3],"(VLMs)":[4],"have":[5],"achieved":[6],"remarkable":[7],"success":[8],"in":[9,53],"video":[10,158],"understanding,":[11],"but":[12,33],"the":[13,124,141],"significant":[14],"computational":[15],"cost":[16],"from":[17],"processing":[18],"dense":[19],"frames":[20,76,122],"severely":[21],"limits":[22],"their":[23,34,79],"practical":[24],"application.":[25],"Existing":[26],"methods":[27],"alleviate":[28],"this":[29],"by":[30,77],"selecting":[31,55],"keyframes,":[32],"greedy":[35],"decision-making,":[36],"combined":[37],"with":[38,123],"a":[39,70,90,101,111,118,150],"decoupled":[40],"evaluation":[41],"of":[42,121,154],"relevance":[43],"and":[44,51,127],"diversity,":[45],"often":[46],"falls":[47],"into":[48],"local":[49],"optima":[50],"results":[52],"erroneously":[54],"irrelevant":[56],"noise":[57],"frames.":[58],"To":[59],"address":[60],"these":[61,138],"challenges,":[62],"we":[63,83],"propose":[64],"GIFT:":[65],"Global":[66],"Irreplaceability":[67],"Frame":[68],"Targeting,":[69],"novel":[71],"training-free":[72],"framework":[73],"that":[74,115,147],"selects":[75],"assessing":[78],"intrinsic":[80],"irreplaceability.":[81],"Specifically,":[82],"first":[84,116],"introduce":[85],"Directed":[86],"Diversity":[87],"to":[88,99,132,163],"quantify":[89],"frame's":[91],"uniqueness":[92],"conditioned":[93],"on":[94,160],"relevance,":[95],"which":[96],"allows":[97],"us":[98],"formulate":[100],"unified":[102],"irreplaceability":[103],"score.":[104],"Subsequently,":[105],"our":[106],"Budget-Aware":[107],"Refinement":[108],"strategy":[109],"employs":[110],"adaptive":[112],"iterative":[113],"process":[114],"secures":[117],"core":[119],"set":[120],"highest":[125],"irreplaceability,":[126],"then":[128],"shifts":[129],"its":[130],"priority":[131],"building":[133],"crucial":[134],"temporal":[135],"context":[136],"around":[137],"selections":[139],"as":[140],"budget":[142],"expands.":[143],"Extensive":[144],"experiments":[145],"demonstrate":[146],"GIFT":[148],"achieves":[149],"maximum":[151],"average":[152],"improvement":[153],"12.5%":[155],"across":[156],"long-form":[157],"benchmarks":[159],"LLaVA-Video-7B":[161],"compared":[162],"uniform":[164],"sampling.":[165]},"counts_by_year":[],"updated_date":"2026-03-28T06:16:51.555046","created_date":"2026-03-28T00:00:00"}
