{"id":"https://openalex.org/W4415378696","doi":"https://doi.org/10.5753/sbbd.2025.247245","title":"KV-RAPTOR: Scalable Tree-Structured Retrieval with KV Cache Compression for Question-Answering Systems","display_name":"KV-RAPTOR: Scalable Tree-Structured Retrieval with KV Cache Compression for Question-Answering Systems","publication_year":2025,"publication_date":"2025-09-29","ids":{"openalex":"https://openalex.org/W4415378696","doi":"https://doi.org/10.5753/sbbd.2025.247245"},"language":null,"primary_location":{"id":"doi:10.5753/sbbd.2025.247245","is_oa":true,"landing_page_url":"https://doi.org/10.5753/sbbd.2025.247245","pdf_url":"https://sol.sbc.org.br/index.php/sbbd/article/download/37247/37030","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Anais do XL Simp\u00f3sio Brasileiro de Banco de Dados (SBBD 2025)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://sol.sbc.org.br/index.php/sbbd/article/download/37247/37030","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Jo\u00e3o Gabriel J. da Silva","orcid":"https://orcid.org/0009-0009-7801-7463"},"institutions":[{"id":"https://openalex.org/I68106152","display_name":"Universidade Federal de Goi\u00e1s","ror":"https://ror.org/0039d5757","country_code":"BR","type":"education","lineage":["https://openalex.org/I68106152"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"Jo\u00e3o Gabriel J. da Silva","raw_affiliation_strings":["Federal University of Goi\u00e1s (UFG)"],"raw_orcid":"https://orcid.org/0009-0009-7801-7463","affiliations":[{"raw_affiliation_string":"Federal University of Goi\u00e1s (UFG)","institution_ids":["https://openalex.org/I68106152"]}]},{"author_position":"middle","author":{"id":null,"display_name":"S\u00e1vio S. T. de Oliveira","orcid":null},"institutions":[{"id":"https://openalex.org/I68106152","display_name":"Universidade Federal de Goi\u00e1s","ror":"https://ror.org/0039d5757","country_code":"BR","type":"education","lineage":["https://openalex.org/I68106152"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"S\u00e1vio S. T. de Oliveira","raw_affiliation_strings":["Federal University of Goi\u00e1s (UFG)"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Federal University of Goi\u00e1s (UFG)","institution_ids":["https://openalex.org/I68106152"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053920470","display_name":"Lucas Alexandria Alves","orcid":null},"institutions":[{"id":"https://openalex.org/I68106152","display_name":"Universidade Federal de Goi\u00e1s","ror":"https://ror.org/0039d5757","country_code":"BR","type":"education","lineage":["https://openalex.org/I68106152"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"Lucas Alexandria Alves","raw_affiliation_strings":["Federal University of Goi\u00e1s (UFG)"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Federal University of Goi\u00e1s (UFG)","institution_ids":["https://openalex.org/I68106152"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5120077044","display_name":"Nicol\u00e1s Eiris","orcid":null},"institutions":[{"id":"https://openalex.org/I4210160924","display_name":"Universidad Panamericana","ror":"https://ror.org/05pd6sh18","country_code":"GT","type":"education","lineage":["https://openalex.org/I4210160924"]}],"countries":["GT"],"is_corresponding":false,"raw_author_name":"Nicol\u00e1s Eiris","raw_affiliation_strings":["Panoplai"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Panoplai","institution_ids":["https://openalex.org/I4210160924"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5080739504","display_name":"Arlindo Rodrigues Galv\u00e3o Filho","orcid":"https://orcid.org/0000-0003-2151-8039"},"institutions":[{"id":"https://openalex.org/I68106152","display_name":"Universidade Federal de Goi\u00e1s","ror":"https://ror.org/0039d5757","country_code":"BR","type":"education","lineage":["https://openalex.org/I68106152"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"Arlindo R. Galv\u00e3o Filho","raw_affiliation_strings":["Federal University of Goi\u00e1s (UFG)"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Federal University of Goi\u00e1s (UFG)","institution_ids":["https://openalex.org/I68106152"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.14024673,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"316","last_page":"329"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9794999957084656,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cache","display_name":"Cache","score":0.6363999843597412},{"id":"https://openalex.org/keywords/reuse","display_name":"Reuse","score":0.5497000217437744},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.5422999858856201},{"id":"https://openalex.org/keywords/latency","display_name":"Latency (audio)","score":0.5019999742507935},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.48019999265670776},{"id":"https://openalex.org/keywords/data-compression","display_name":"Data compression","score":0.43939998745918274}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.836899995803833},{"id":"https://openalex.org/C115537543","wikidata":"https://www.wikidata.org/wiki/Q165596","display_name":"Cache","level":2,"score":0.6363999843597412},{"id":"https://openalex.org/C206588197","wikidata":"https://www.wikidata.org/wiki/Q846574","display_name":"Reuse","level":2,"score":0.5497000217437744},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.5422999858856201},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.5019999742507935},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.48019999265670776},{"id":"https://openalex.org/C78548338","wikidata":"https://www.wikidata.org/wiki/Q2493","display_name":"Data compression","level":2,"score":0.43939998745918274},{"id":"https://openalex.org/C180016635","wikidata":"https://www.wikidata.org/wiki/Q2712821","display_name":"Compression (physics)","level":2,"score":0.31929999589920044},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.31779998540878296},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.3098999857902527},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.2946999967098236},{"id":"https://openalex.org/C104267543","wikidata":"https://www.wikidata.org/wiki/Q208163","display_name":"Signal processing","level":3,"score":0.2818000018596649},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.27559998631477356},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.2745000123977661},{"id":"https://openalex.org/C189783530","wikidata":"https://www.wikidata.org/wiki/Q352090","display_name":"CPU cache","level":3,"score":0.2728999853134155},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.25200000405311584},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.2515999972820282}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.5753/sbbd.2025.247245","is_oa":true,"landing_page_url":"https://doi.org/10.5753/sbbd.2025.247245","pdf_url":"https://sol.sbc.org.br/index.php/sbbd/article/download/37247/37030","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Anais do XL Simp\u00f3sio Brasileiro de Banco de Dados (SBBD 2025)","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.5753/sbbd.2025.247245","is_oa":true,"landing_page_url":"https://doi.org/10.5753/sbbd.2025.247245","pdf_url":"https://sol.sbc.org.br/index.php/sbbd/article/download/37247/37030","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Anais do XL Simp\u00f3sio Brasileiro de Banco de Dados (SBBD 2025)","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321992","display_name":"Minist\u00e9rio da Ci\u00eancia, Tecnologia e Inova\u00e7\u00e3o","ror":"https://ror.org/050zdnc69"},{"id":"https://openalex.org/F4320323732","display_name":"Companhia Energ\u00e9tica de Minas Gerais","ror":"https://ror.org/02kbrsj34"},{"id":"https://openalex.org/F4320324178","display_name":"Ag\u00eancia Nacional de Energia El\u00e9trica","ror":"https://ror.org/049sgh675"},{"id":"https://openalex.org/F4320330107","display_name":"Empresa Brasileira de Pesquisa e Inova\u00e7\u00e3o Industrial","ror":null}],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4415378696.pdf"},"referenced_works_count":14,"referenced_works":["https://openalex.org/W2101105183","https://openalex.org/W2133512280","https://openalex.org/W2963963993","https://openalex.org/W2970641574","https://openalex.org/W3046522182","https://openalex.org/W3096266342","https://openalex.org/W3210652142","https://openalex.org/W4401176373","https://openalex.org/W4403396872","https://openalex.org/W4403816579","https://openalex.org/W4406771321","https://openalex.org/W4408848702","https://openalex.org/W4409131852","https://openalex.org/W4412887830"],"related_works":[],"abstract_inverted_index":{"This":[0],"paper":[1],"introduces":[2],"KV-RAPTOR,":[3],"a":[4,24],"latency-optimized":[5],"variant":[6],"of":[7],"the":[8],"RAPTOR":[9],"(Recursive":[10],"Abstractive":[11],"Processing":[12],"for":[13,17],"Tree-Organized":[14],"Retrieval)":[15],"pipeline":[16],"Retrieval-Augmented":[18],"Generation":[19],"(RAG).":[20],"By":[21],"integrating":[22],"CacheGen,":[23],"compressed":[25],"key-value":[26],"(KV)":[27],"cache":[28],"reuse":[29],"mechanism,":[30],"into":[31],"RAPTOR\u2019s":[32],"tree-based":[33],"index,":[34],"we":[35],"demonstrate":[36],"that":[37],"it":[38],"is":[39],"possible":[40],"to":[41],"reduce":[42],"generation":[43],"latency":[44,66],"without":[45],"sacrificing":[46],"answer":[47],"quality.":[48],"We":[49],"evaluate":[50],"our":[51],"method":[52],"on":[53],"both":[54],"English":[55],"and":[56,64,73],"Portuguese":[57],"datasets,":[58],"showing":[59],"consistent":[60],"reductions":[61],"in":[62],"time-to-first-token":[63],"end-to-end":[65],"while":[67],"preserving":[68],"performance":[69],"across":[70],"diverse":[71],"linguistic":[72],"retrieval":[74],"contexts.":[75]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-21T00:00:00"}
