{"id":"https://openalex.org/W7127422451","doi":"https://doi.org/10.48550/arxiv.2602.02057","title":"QVCache: A Query-Aware Vector Cache","display_name":"QVCache: A Query-Aware Vector Cache","publication_year":2026,"publication_date":"2026-02-02","ids":{"openalex":"https://openalex.org/W7127422451","doi":"https://doi.org/10.48550/arxiv.2602.02057"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.02057","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5124943751","display_name":"An\u0131l Eren G\u00f6\u00e7er","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"G\u00f6\u00e7er, An\u0131l Eren","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5095848478","display_name":"Ioanna Tsakalidou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tsakalidou, Ioanna","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024169695","display_name":"Hamish Nicholson","orcid":"https://orcid.org/0000-0003-0306-3253"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nicholson, Hamish","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055332840","display_name":"Kyoungmin Kim","orcid":"https://orcid.org/0009-0000-0224-2570"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kim, Kyoungmin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5070907021","display_name":"Anastasia Ailamaki","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ailamaki, Anastasia","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10286","display_name":"Information Retrieval and Search Behavior","score":0.5184999704360962,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10286","display_name":"Information Retrieval and Search Behavior","score":0.5184999704360962,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11478","display_name":"Caching and Content Delivery","score":0.21150000393390656,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.12210000306367874,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/latency","display_name":"Latency (audio)","score":0.6654999852180481},{"id":"https://openalex.org/keywords/cache","display_name":"Cache","score":0.6283000111579895},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.5597000122070312},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.415800005197525},{"id":"https://openalex.org/keywords/cpu-cache","display_name":"CPU cache","score":0.4059000015258789},{"id":"https://openalex.org/keywords/bounding-overwatch","display_name":"Bounding overwatch","score":0.40529999136924744},{"id":"https://openalex.org/keywords/cas-latency","display_name":"CAS latency","score":0.35190001130104065},{"id":"https://openalex.org/keywords/hash-function","display_name":"Hash function","score":0.3456000089645386}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8489999771118164},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.6654999852180481},{"id":"https://openalex.org/C115537543","wikidata":"https://www.wikidata.org/wiki/Q165596","display_name":"Cache","level":2,"score":0.6283000111579895},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.5597000122070312},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.415800005197525},{"id":"https://openalex.org/C189783530","wikidata":"https://www.wikidata.org/wiki/Q352090","display_name":"CPU cache","level":3,"score":0.4059000015258789},{"id":"https://openalex.org/C63584917","wikidata":"https://www.wikidata.org/wiki/Q333286","display_name":"Bounding overwatch","level":2,"score":0.40529999136924744},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.35760000348091125},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.3547999858856201},{"id":"https://openalex.org/C189930140","wikidata":"https://www.wikidata.org/wiki/Q1112878","display_name":"CAS latency","level":4,"score":0.35190001130104065},{"id":"https://openalex.org/C99138194","wikidata":"https://www.wikidata.org/wiki/Q183427","display_name":"Hash function","level":2,"score":0.3456000089645386},{"id":"https://openalex.org/C5165142","wikidata":"https://www.wikidata.org/wiki/Q5432732","display_name":"False sharing","level":5,"score":0.34040001034736633},{"id":"https://openalex.org/C74912251","wikidata":"https://www.wikidata.org/wiki/Q6815727","display_name":"Memory footprint","level":2,"score":0.33309999108314514},{"id":"https://openalex.org/C141917322","wikidata":"https://www.wikidata.org/wiki/Q1025017","display_name":"Cache coherence","level":5,"score":0.31119999289512634},{"id":"https://openalex.org/C136085584","wikidata":"https://www.wikidata.org/wiki/Q910289","display_name":"Overlay","level":2,"score":0.30570000410079956},{"id":"https://openalex.org/C38556500","wikidata":"https://www.wikidata.org/wiki/Q13404475","display_name":"Cache algorithms","level":4,"score":0.305400013923645},{"id":"https://openalex.org/C99016210","wikidata":"https://www.wikidata.org/wiki/Q5488129","display_name":"Query expansion","level":2,"score":0.274399995803833},{"id":"https://openalex.org/C2777851325","wikidata":"https://www.wikidata.org/wiki/Q7094102","display_name":"Online model","level":2,"score":0.2671000063419342},{"id":"https://openalex.org/C162319229","wikidata":"https://www.wikidata.org/wiki/Q175263","display_name":"Data structure","level":2,"score":0.2556999921798706},{"id":"https://openalex.org/C133588205","wikidata":"https://www.wikidata.org/wiki/Q28455645","display_name":"Instruction prefetch","level":3,"score":0.2524999976158142},{"id":"https://openalex.org/C100660578","wikidata":"https://www.wikidata.org/wiki/Q18733","display_name":"Recall","level":2,"score":0.25130000710487366},{"id":"https://openalex.org/C47487241","wikidata":"https://www.wikidata.org/wiki/Q5227230","display_name":"Data access","level":2,"score":0.25119999051094055},{"id":"https://openalex.org/C67388219","wikidata":"https://www.wikidata.org/wiki/Q207440","display_name":"Hash table","level":3,"score":0.25110000371932983}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.02057","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.02057","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.02057","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.02057","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Vector":[0],"databases":[1],"have":[2],"become":[3],"a":[4,76,145,154,198],"cornerstone":[5],"of":[6,68,82,139],"modern":[7],"information":[8],"retrieval,":[9],"powering":[10],"applications":[11],"in":[12,70],"recommendation,":[13],"search,":[14],"and":[15,40,135,158],"retrieval-augmented":[16],"generation":[17],"(RAG)":[18],"pipelines.":[19],"However,":[20],"scaling":[21],"approximate":[22],"nearest":[23],"neighbor":[24],"(ANN)":[25],"search":[26,45,74,98],"to":[27,169,190],"high":[28,52],"recall":[29,188],"under":[30],"strict":[31],"latency":[32,49,134,166,185],"SLOs":[33],"remains":[34],"fundamentally":[35],"constrained":[36],"by":[37,108,167],"memory":[38,60,101,136,156],"capacity":[39],"I/O":[41],"bandwidth.":[42],"Disk-based":[43],"vector":[44,73,150,206],"systems":[46],"suffer":[47],"severe":[48],"degradation":[50],"at":[51,62],"accuracy,":[53],"while":[54,131,186],"fully":[55],"in-memory":[56],"solutions":[57],"incur":[58],"prohibitive":[59],"costs":[61],"billion-scale.":[63],"Despite":[64],"the":[65,90,191],"central":[66],"role":[67],"caching":[69,79,94,111,202],"traditional":[71],"databases,":[72],"lacks":[75],"general":[77],"query-level":[78,93],"layer":[80,147,203],"capable":[81],"amortizing":[83],"repeated":[84],"query":[85,106,165],"work.":[86],"We":[87],"present":[88],"QVCache,":[89],"first":[91],"backend-agnostic,":[92],"system":[95],"for":[96,148,204],"ANN":[97,175,193],"with":[99,173],"bounded":[100],"footprint.":[102],"QVCache":[103,142,182],"exploits":[104],"semantic":[105],"repetition":[107],"performing":[109],"similarity-aware":[110],"rather":[112],"than":[113],"exact-match":[114],"lookup.":[115],"It":[116,152],"dynamically":[117],"learns":[118],"region-specific":[119],"distance":[120],"thresholds":[121],"using":[122],"an":[123],"online":[124],"learning":[125],"algorithm,":[126],"enabling":[127],"recall-preserving":[128],"cache":[129],"hits":[130],"bounding":[132],"lookup":[133],"usage":[137],"independently":[138],"dataset":[140],"size.":[141],"operates":[143],"as":[144,197],"drop-in":[146],"existing":[149,174],"databases.":[151],"maintains":[153],"megabyte-scale":[155],"footprint":[157],"achieves":[159],"sub-millisecond":[160],"cache-hit":[161],"latency,":[162],"reducing":[163],"end-to-end":[164],"up":[168],"40-1000x":[170],"when":[171],"integrated":[172],"systems.":[176],"For":[177],"workloads":[178],"exhibiting":[179],"temporal-semantic":[180],"locality,":[181],"substantially":[183],"reduces":[184],"preserving":[187],"comparable":[189],"underlying":[192],"backend,":[194],"establishing":[195],"it":[196],"missing":[199],"but":[200],"essential":[201],"scalable":[205],"search.":[207]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-02-04T00:00:00"}
