{"id":"https://openalex.org/W7140807770","doi":"https://doi.org/10.48550/arxiv.2603.23710","title":"An In-Depth Study of Filter-Agnostic Vector Search on a PostgreSQL Database System: [Experiments and Analysis]","display_name":"An In-Depth Study of Filter-Agnostic Vector Search on a PostgreSQL Database System: [Experiments and Analysis]","publication_year":2026,"publication_date":"2026-03-24","ids":{"openalex":"https://openalex.org/W7140807770","doi":"https://doi.org/10.48550/arxiv.2603.23710"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.23710","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.23710","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.23710","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102305858","display_name":"Duo Lu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lu, Duo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010142123","display_name":"Helena Caminal","orcid":"https://orcid.org/0000-0002-2052-8107"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Caminal, Helena","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010978109","display_name":"Manos Chatzakis","orcid":"https://orcid.org/0000-0002-9616-6210"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chatzakis, Manos","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059167302","display_name":"Yannis Papakonstantinou","orcid":"https://orcid.org/0009-0007-6360-9496"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Papakonstantinou, Yannis","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035128721","display_name":"Yannis Chronis","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chronis, Yannis","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085553761","display_name":"Vaibhav Jain","orcid":"https://orcid.org/0000-0003-3515-1477"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jain, Vaibhav","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5130675113","display_name":"Fatma \u00d6zcan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"\u00d6zcan, Fatma","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.7455999851226807,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.7455999851226807,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.042399998754262924,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12292","display_name":"Graph Theory and Algorithms","score":0.0348999984562397,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/filter","display_name":"Filter (signal processing)","score":0.524399995803833},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.5142999887466431},{"id":"https://openalex.org/keywords/database-theory","display_name":"Database theory","score":0.48019999265670776},{"id":"https://openalex.org/keywords/workload","display_name":"Workload","score":0.4724999964237213},{"id":"https://openalex.org/keywords/range","display_name":"Range (aeronautics)","score":0.4722000062465668},{"id":"https://openalex.org/keywords/database-design","display_name":"Database design","score":0.4165000021457672},{"id":"https://openalex.org/keywords/premise","display_name":"Premise","score":0.38449999690055847},{"id":"https://openalex.org/keywords/distributed-database","display_name":"Distributed database","score":0.37619999051094055}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7767999768257141},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.6902999877929688},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.524399995803833},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.5142999887466431},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.48240000009536743},{"id":"https://openalex.org/C12439846","wikidata":"https://www.wikidata.org/wiki/Q4809258","display_name":"Database theory","level":3,"score":0.48019999265670776},{"id":"https://openalex.org/C2778476105","wikidata":"https://www.wikidata.org/wiki/Q628539","display_name":"Workload","level":2,"score":0.4724999964237213},{"id":"https://openalex.org/C204323151","wikidata":"https://www.wikidata.org/wiki/Q905424","display_name":"Range (aeronautics)","level":2,"score":0.4722000062465668},{"id":"https://openalex.org/C148840519","wikidata":"https://www.wikidata.org/wiki/Q1049878","display_name":"Database design","level":2,"score":0.4165000021457672},{"id":"https://openalex.org/C2778023277","wikidata":"https://www.wikidata.org/wiki/Q321703","display_name":"Premise","level":2,"score":0.38449999690055847},{"id":"https://openalex.org/C70061542","wikidata":"https://www.wikidata.org/wiki/Q989016","display_name":"Distributed database","level":2,"score":0.37619999051094055},{"id":"https://openalex.org/C78161392","wikidata":"https://www.wikidata.org/wiki/Q5227414","display_name":"Database testing","level":4,"score":0.35420000553131104},{"id":"https://openalex.org/C125583679","wikidata":"https://www.wikidata.org/wiki/Q755673","display_name":"Search algorithm","level":2,"score":0.34869998693466187},{"id":"https://openalex.org/C107535962","wikidata":"https://www.wikidata.org/wiki/Q2459880","display_name":"Database tuning","level":4,"score":0.34549999237060547},{"id":"https://openalex.org/C54239708","wikidata":"https://www.wikidata.org/wiki/Q1329910","display_name":"View","level":3,"score":0.32850000262260437},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.3091000020503998},{"id":"https://openalex.org/C5655090","wikidata":"https://www.wikidata.org/wiki/Q192588","display_name":"Relational database","level":2,"score":0.2919999957084656},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.2833999991416931},{"id":"https://openalex.org/C5968703","wikidata":"https://www.wikidata.org/wiki/Q267136","display_name":"Database model","level":3,"score":0.27889999747276306},{"id":"https://openalex.org/C59276292","wikidata":"https://www.wikidata.org/wiki/Q580427","display_name":"Database index","level":3,"score":0.2745000123977661},{"id":"https://openalex.org/C162319229","wikidata":"https://www.wikidata.org/wiki/Q175263","display_name":"Data structure","level":2,"score":0.25609999895095825},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.2533999979496002},{"id":"https://openalex.org/C2778348673","wikidata":"https://www.wikidata.org/wiki/Q739302","display_name":"Production (economics)","level":2,"score":0.25029999017715454}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.23710","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.23710","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.23710","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.23710","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Filtered":[0],"Vector":[1],"Search":[2],"(FVS)":[3],"is":[4,109,114,205],"critical":[5],"for":[6,200],"supporting":[7],"semantic":[8],"search":[9],"and":[10,61,95,104,134,140,162,192,220],"GenAI":[11],"applications":[12],"in":[13,24,46,71,178,227],"modern":[14],"database":[15,36,49,180,187,230],"systems.":[16,37],"However,":[17],"existing":[18],"research":[19],"most":[20],"often":[21,172],"evaluates":[22],"algorithms":[23,85],"specialized":[25],"libraries,":[26],"making":[27],"optimistic":[28],"assumptions":[29,53],"that":[30,45,64,110,125,128,149,196],"do":[31,54],"not":[32,55,115,206],"align":[33],"with":[34,166,189],"enterprise-grade":[35],"Our":[38,106],"work":[39],"challenges":[40],"this":[41],"premise":[42],"by":[43,117],"demonstrating":[44,195],"a":[47,87,99,144,201,210,228],"production-grade":[48],"system,":[50],"commonly":[51],"made":[52],"hold,":[56],"leading":[57],"to":[58],"performance":[59],"characteristics":[60,219],"algorithmic":[62],"trade-offs":[63],"are":[65],"fundamentally":[66],"different":[67],"from":[68,130],"those":[69],"observed":[70],"isolated":[72],"library":[73],"settings.":[74],"This":[75],"paper":[76],"presents":[77],"the":[78,111,118,186,197,215,221],"first":[79],"in-depth":[80],"analysis":[81],"of":[82,102,120,159,224],"filter-agnostic":[83,202],"FVS":[84,203],"within":[86],"production":[88],"PostgreSQL-compatible":[89],"system.":[90],"We":[91,147],"systematically":[92],"evaluate":[93],"post-filtering":[94],"inline-filtering":[96],"strategies":[97],"across":[98],"wide":[100],"range":[101],"selectivities":[103],"correlations.":[105],"central":[107],"finding":[108],"optimal":[112,198],"algorithm":[113,204],"dictated":[116],"cost":[119],"distance":[121,132],"computations":[122,133],"alone,":[123],"but":[124,208],"system-level":[126,163],"overheads":[127],"come":[129],"both":[131],"filter":[135,160],"operations":[136],"(like":[137],"page":[138],"accesses":[139],"data":[141,225],"retrieval)":[142],"play":[143],"significant":[145],"role.":[146],"demonstrate":[148],"graph-based":[150],"approaches":[151],"(such":[152],"as":[153,170],"NaviX/ACORN)":[154],"can":[155],"incur":[156],"prohibitive":[157],"numbers":[158],"checks":[161],"overheads,":[164],"compared":[165],"clustering-based":[167],"indexes":[168],"such":[169],"ScaNN,":[171],"canceling":[173],"out":[174],"their":[175],"theoretical":[176],"benefits":[177],"real-world":[179,229],"environments.":[181],"Ultimately,":[182],"our":[183],"findings":[184],"provide":[185],"community":[188],"crucial":[190],"insights":[191],"practical":[193],"guidelines,":[194],"choice":[199],"absolute,":[207],"rather":[209],"system-aware":[211],"decision":[212],"contingent":[213],"on":[214],"interplay":[216],"between":[217],"workload":[218],"underlying":[222],"costs":[223],"access":[226],"architecture.":[231]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-27T00:00:00"}
