{"id":"https://openalex.org/W7131895607","doi":"https://doi.org/10.48550/arxiv.2602.22805","title":"Optimizing SSD-Resident Graph Indexing for High-Throughput Vector Search","display_name":"Optimizing SSD-Resident Graph Indexing for High-Throughput Vector Search","publication_year":2026,"publication_date":"2026-02-26","ids":{"openalex":"https://openalex.org/W7131895607","doi":"https://doi.org/10.48550/arxiv.2602.22805"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2602.22805","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.22805","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2602.22805","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5127360936","display_name":"Weichen Zhao","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Zhao, Weichen","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036989019","display_name":"Yuncheng Lu","orcid":"https://orcid.org/0000-0003-0465-942X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lu, Yuncheng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5122168527","display_name":"Yao Tian","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tian, Yao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127030073","display_name":"Hao Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Hao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127188230","display_name":"Jiehui Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Jiehui","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126983463","display_name":"Minghao Zhao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Minghao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127351838","display_name":"Yakun Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Yakun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5127425822","display_name":"Weining Qian","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qian, Weining","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5127360936"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9128999710083008,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9128999710083008,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.021900000050663948,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12326","display_name":"Network Packet Processing and Optimization","score":0.012900000438094139,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cache","display_name":"Cache","score":0.5503000020980835},{"id":"https://openalex.org/keywords/asynchronous-communication","display_name":"Asynchronous communication","score":0.5486999750137329},{"id":"https://openalex.org/keywords/search-engine-indexing","display_name":"Search engine indexing","score":0.5138000249862671},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.5029000043869019},{"id":"https://openalex.org/keywords/locality","display_name":"Locality","score":0.44530001282691956},{"id":"https://openalex.org/keywords/scheduling","display_name":"Scheduling (production processes)","score":0.44429999589920044},{"id":"https://openalex.org/keywords/auxiliary-memory","display_name":"Auxiliary memory","score":0.36579999327659607},{"id":"https://openalex.org/keywords/latency","display_name":"Latency (audio)","score":0.35260000824928284},{"id":"https://openalex.org/keywords/computer-data-storage","display_name":"Computer data storage","score":0.33869999647140503}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8517000079154968},{"id":"https://openalex.org/C115537543","wikidata":"https://www.wikidata.org/wiki/Q165596","display_name":"Cache","level":2,"score":0.5503000020980835},{"id":"https://openalex.org/C151319957","wikidata":"https://www.wikidata.org/wiki/Q752739","display_name":"Asynchronous communication","level":2,"score":0.5486999750137329},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.5302000045776367},{"id":"https://openalex.org/C75165309","wikidata":"https://www.wikidata.org/wiki/Q2258979","display_name":"Search engine indexing","level":2,"score":0.5138000249862671},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.5029000043869019},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.4510999917984009},{"id":"https://openalex.org/C2779808786","wikidata":"https://www.wikidata.org/wiki/Q6664603","display_name":"Locality","level":2,"score":0.44530001282691956},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.44429999589920044},{"id":"https://openalex.org/C82687282","wikidata":"https://www.wikidata.org/wiki/Q66221","display_name":"Auxiliary memory","level":2,"score":0.36579999327659607},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.35260000824928284},{"id":"https://openalex.org/C194739806","wikidata":"https://www.wikidata.org/wiki/Q66221","display_name":"Computer data storage","level":2,"score":0.33869999647140503},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.3382999897003174},{"id":"https://openalex.org/C47487241","wikidata":"https://www.wikidata.org/wiki/Q5227230","display_name":"Data access","level":2,"score":0.3366999924182892},{"id":"https://openalex.org/C32587265","wikidata":"https://www.wikidata.org/wiki/Q1182260","display_name":"Data deduplication","level":2,"score":0.32519999146461487},{"id":"https://openalex.org/C189783530","wikidata":"https://www.wikidata.org/wiki/Q352090","display_name":"CPU cache","level":3,"score":0.31209999322891235},{"id":"https://openalex.org/C157764524","wikidata":"https://www.wikidata.org/wiki/Q1383412","display_name":"Throughput","level":3,"score":0.311599999666214},{"id":"https://openalex.org/C162319229","wikidata":"https://www.wikidata.org/wiki/Q175263","display_name":"Data structure","level":2,"score":0.3027999997138977},{"id":"https://openalex.org/C28034677","wikidata":"https://www.wikidata.org/wiki/Q17092530","display_name":"Interleaving","level":2,"score":0.2924000024795532},{"id":"https://openalex.org/C116738811","wikidata":"https://www.wikidata.org/wiki/Q608751","display_name":"Nearest neighbor search","level":2,"score":0.28790000081062317},{"id":"https://openalex.org/C97854310","wikidata":"https://www.wikidata.org/wiki/Q19541","display_name":"Search engine","level":2,"score":0.27799999713897705},{"id":"https://openalex.org/C19012869","wikidata":"https://www.wikidata.org/wiki/Q578372","display_name":"Response time","level":2,"score":0.27549999952316284},{"id":"https://openalex.org/C24885549","wikidata":"https://www.wikidata.org/wiki/Q339678","display_name":"Distributed data store","level":2,"score":0.2736999988555908},{"id":"https://openalex.org/C189930140","wikidata":"https://www.wikidata.org/wiki/Q1112878","display_name":"CAS latency","level":4,"score":0.26809999346733093},{"id":"https://openalex.org/C78766204","wikidata":"https://www.wikidata.org/wiki/Q555032","display_name":"Multi-core processor","level":2,"score":0.26579999923706055},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.2531000077724457}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2602.22805","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.22805","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2602.22805","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.22805","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Graph-based":[0],"approximate":[1],"nearest":[2],"neighbor":[3],"search":[4,164,173],"(ANNS)":[5],"methods":[6],"(e.g.,":[7],"HNSW)":[8],"have":[9],"become":[10],"the":[11,16,94,113,199],"de":[12],"facto":[13],"state":[14],"of":[15,115,155,201,207],"art":[17],"for":[18,149],"their":[19,208],"high":[20],"precision":[21],"and":[22,49,75,84,100,161,191],"low":[23],"latency.":[24],"To":[25,134],"scale":[26],"beyond":[27],"main":[28],"memory,":[29,124],"recent":[30],"out-of-memory":[31],"ANNS":[32],"systems":[33,184,203],"leverage":[34],"SSDs":[35],"to":[36,89,166,187],"store":[37],"large":[38],"vector":[39],"indexes.":[40],"However,":[41],"they":[42],"still":[43],"suffer":[44],"from":[45],"severe":[46],"CPU":[47,136],"underutilization":[48],"read":[50],"amplification":[51],"(i.e.,":[52],"storage":[53,68],"stalls)":[54],"caused":[55],"by":[56,118,185],"limited":[57],"access":[58],"locality":[59],"during":[60,139],"graph":[61],"traversal.":[62],"We":[63,102],"present":[64],"VeloANN,":[65],"which":[66],"mitigates":[67],"stalls":[69],"through":[70],"a":[71,76,105,116,145,162],"locality-aware":[72],"data":[73,86],"layout":[74],"coroutine-based":[77,146],"asynchronous":[78,147,159],"runtime.":[79],"VeloANN":[80,143,179],"utilizes":[81],"hierarchical":[82],"compression":[83],"affinity-based":[85],"placement":[87],"scheme":[88],"co-locate":[90],"related":[91],"vectors":[92],"within":[93],"same":[95],"page,":[96],"effectively":[97],"reducing":[98],"fragmentation":[99],"over-fetching.":[101],"further":[103],"design":[104],"record-level":[106],"buffer":[107],"pool,":[108],"where":[109],"each":[110],"record":[111],"groups":[112],"neighbors":[114],"vector;":[117],"persistently":[119],"retaining":[120],"hot":[121],"records":[122],"in":[123,189,193],"it":[125,157],"eliminates":[126],"excessive":[127],"page":[128],"swapping":[129],"under":[130],"constrained":[131],"memory":[132,209],"budgets.":[133],"minimize":[135],"scheduling":[137],"overheads":[138],"disk":[140],"I/O":[141],"interruptions,":[142],"employs":[144],"runtime":[148],"lightweight":[150],"task":[151],"scheduling.":[152],"On":[153],"top":[154],"this,":[156],"incorporates":[158],"prefetching":[160],"beam-aware":[163],"strategy":[165],"prioritize":[167],"cached":[168],"data,":[169],"ultimately":[170],"improving":[171],"overall":[172],"efficiency.":[174],"Extensive":[175],"experiments":[176],"show":[177],"that":[178],"outperforms":[180],"state-of-the-art":[181],"disk-based":[182],"ANN":[183],"up":[186],"5.8x":[188],"throughput":[190,200],"3.25x":[192],"latency":[194],"reduction,":[195],"while":[196],"achieving":[197],"0.92x":[198],"in-memory":[202],"using":[204],"only":[205],"10%":[206],"footprint.":[210]},"counts_by_year":[],"updated_date":"2026-02-28T06:18:59.386488","created_date":"2026-02-28T00:00:00"}
