{"id":"https://openalex.org/W7154983911","doi":"https://doi.org/10.48550/arxiv.2604.15583","title":"SAGE: Selective Attention-Guided Extraction for Token-Efficient Document Indexing","display_name":"SAGE: Selective Attention-Guided Extraction for Token-Efficient Document Indexing","publication_year":2026,"publication_date":"2026-04-16","ids":{"openalex":"https://openalex.org/W7154983911","doi":"https://doi.org/10.48550/arxiv.2604.15583"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.15583","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.15583","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.15583","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5134054637","display_name":"Xinzhi Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Xinzhi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134052386","display_name":"Peter Baile Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Peter Baile","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134076237","display_name":"Gerardo Vitagliano","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Vitagliano, Gerardo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113228367","display_name":"Matthew Russo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Russo, Matthew","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134071236","display_name":"Jun Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Jun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039133265","display_name":"Michael Cafarella","orcid":"https://orcid.org/0000-0001-6122-0590"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cafarella, Michael","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037742794","display_name":"Samuel Madden","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Madden, Samuel","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5134060484","display_name":"Chunwei Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Chunwei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.8633000254631042,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.8633000254631042,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.03720000013709068,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.010400000028312206,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reduction","display_name":"Reduction (mathematics)","score":0.7106000185012817},{"id":"https://openalex.org/keywords/security-token","display_name":"Security token","score":0.6643000245094299},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.6590999960899353},{"id":"https://openalex.org/keywords/heuristics","display_name":"Heuristics","score":0.6353999972343445},{"id":"https://openalex.org/keywords/relevance","display_name":"Relevance (law)","score":0.5935999751091003},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.49720001220703125},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.47049999237060547},{"id":"https://openalex.org/keywords/rank","display_name":"Rank (graph theory)","score":0.40610000491142273},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.3944999873638153}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8012999892234802},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.7106000185012817},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.6643000245094299},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.6590999960899353},{"id":"https://openalex.org/C127705205","wikidata":"https://www.wikidata.org/wiki/Q5748245","display_name":"Heuristics","level":2,"score":0.6353999972343445},{"id":"https://openalex.org/C158154518","wikidata":"https://www.wikidata.org/wiki/Q7310970","display_name":"Relevance (law)","level":2,"score":0.5935999751091003},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.49720001220703125},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.47049999237060547},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.44339999556541443},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.41429999470710754},{"id":"https://openalex.org/C164226766","wikidata":"https://www.wikidata.org/wiki/Q7293202","display_name":"Rank (graph theory)","level":2,"score":0.40610000491142273},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.3944999873638153},{"id":"https://openalex.org/C189430467","wikidata":"https://www.wikidata.org/wiki/Q7293293","display_name":"Ranking (information retrieval)","level":2,"score":0.36910000443458557},{"id":"https://openalex.org/C2777466982","wikidata":"https://www.wikidata.org/wiki/Q5227287","display_name":"Data extraction","level":3,"score":0.3668000102043152},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.35440000891685486},{"id":"https://openalex.org/C183322885","wikidata":"https://www.wikidata.org/wiki/Q17007702","display_name":"Context model","level":3,"score":0.3409999907016754},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3359000086784363},{"id":"https://openalex.org/C198082294","wikidata":"https://www.wikidata.org/wiki/Q3399648","display_name":"Position (finance)","level":2,"score":0.3165000081062317},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.30550000071525574},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3034999966621399},{"id":"https://openalex.org/C2776207758","wikidata":"https://www.wikidata.org/wiki/Q5303302","display_name":"Downstream (manufacturing)","level":2,"score":0.30320000648498535},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.29750001430511475},{"id":"https://openalex.org/C153914771","wikidata":"https://www.wikidata.org/wiki/Q5227343","display_name":"Data reduction","level":2,"score":0.2946000099182129},{"id":"https://openalex.org/C195807954","wikidata":"https://www.wikidata.org/wiki/Q1662562","display_name":"Information extraction","level":2,"score":0.2777999937534332},{"id":"https://openalex.org/C44291984","wikidata":"https://www.wikidata.org/wiki/Q1074173","display_name":"Question answering","level":2,"score":0.27070000767707825},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.2694999873638153},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.26820001006126404},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.26260000467300415},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.2529999911785126}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.15583","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.15583","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.15583","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.15583","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"language":[1,111],"models":[2],"with":[3,188],"long":[4,52],"context":[5,94,149,179],"windows":[6],"can":[7,28,63],"answer":[8,30,155],"complex":[9,198],"questions":[10,50],"directly":[11],"from":[12],"full-length":[13],"academic,":[14],"technical,":[15],"and":[16,27,58,70,79,109,144],"policy":[17],"documents,":[18],"but":[19],"passing":[20],"entire":[21],"documents":[22],"is":[23],"often":[24,76],"costly,":[25],"slow,":[26],"degrade":[29],"quality":[31],"while":[32,174],"increasing":[33],"the":[34,43,136,192],"risk":[35],"of":[36,46,82],"unnecessary":[37],"data":[38],"leakage.":[39],"This":[40,181],"paper":[41],"targets":[42],"common":[44],"setting":[45],"answering":[47],"many":[48],"heterogeneous":[49],"over":[51],"document(s),":[53],"where":[54],"fixed":[55],"position":[56],"heuristics":[57],"standard":[59],"retrieval-augmented":[60],"generation":[61],"(RAG)":[62],"fail":[64],"due":[65],"to":[66,103,129,150,176],"document":[67],"structure":[68],"variability":[69],"weak":[71],"query-chunk":[72],"semantic":[73],"similarity,":[74],"which":[75],"requires":[77],"task-":[78],"domain-specific":[80],"tuning":[81],"embedding":[83],"retrievers.":[84],"We":[85],"propose":[86],"{Selective":[87],"Attention-Guided":[88],"Extraction}":[89],"(\\ourmethod),":[90],"a":[91,99,105,116,140,151,169,177,183],"training-free,":[92],"plug-and-play":[93],"reduction":[95,160,185],"framework":[96],"that":[97],"uses":[98],"lightweight":[100],"local":[101],"LLM":[102,153],"perform":[104],"single":[106],"prefilling":[107],"pass":[108],"convert":[110],"model":[112,195],"attention":[113],"signals":[114],"into":[115],"query-specific":[117],"relevance":[118],"heatmap":[119],"at":[120],"configurable":[121],"granularities.":[122],"\\ourmethod\\":[123,157],"further":[124],"introduces":[125],"\\emph{differential":[126],"attention}":[127],"strategies":[128],"better":[130],"isolate":[131],"question-relevant":[132],"evidence,":[133],"then":[134],"selects":[135],"top-scoring":[137],"units":[138],"under":[139],"user-defined":[141],"token":[142],"budget":[143],"forwards":[145],"only":[146],"this":[147],"reduced":[148],"downstream":[152],"for":[154,194],"generation.":[156],"surpasses":[158],"traditional":[159],"techniques":[161],"across":[162],"multiple":[163],"long-document":[164],"QA":[165],"benchmarks,":[166],"notably":[167],"securing":[168],"top-4":[170],"rank":[171],"on":[172],"QuALITY-hard":[173],"constrained":[175],"10\\%":[178],"budget.":[180],"enables":[182],"90\\%":[184],"in":[186],"tokens":[187],"competitive":[189],"accuracy,":[190],"without":[191],"need":[193],"fine-tuning":[196],"or":[197],"calibration.":[199]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-21T00:00:00"}
