{"id":"https://openalex.org/W7082978957","doi":"https://doi.org/10.1145/3749167","title":"HARMONY: A Scalable Distributed Vector Database for High-Throughput Approximate Nearest Neighbor Search","display_name":"HARMONY: A Scalable Distributed Vector Database for High-Throughput Approximate Nearest Neighbor Search","publication_year":2025,"publication_date":"2025-09-22","ids":{"openalex":"https://openalex.org/W7082978957","doi":"https://doi.org/10.1145/3749167"},"language":"en","primary_location":{"id":"doi:10.1145/3749167","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3749167","pdf_url":null,"source":{"id":"https://openalex.org/S4387289859","display_name":"Proceedings of the ACM on Management of Data","issn_l":"2836-6573","issn":["2836-6573"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM on Management of Data","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Qian Xu","orcid":"https://orcid.org/0009-0000-3276-3262"},"institutions":[{"id":"https://openalex.org/I78988378","display_name":"Renmin University of China","ror":"https://ror.org/041pakw92","country_code":"CN","type":"education","lineage":["https://openalex.org/I78988378"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Qian Xu","raw_affiliation_strings":["Renmin University of China, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0000-3276-3262","affiliations":[{"raw_affiliation_string":"Renmin University of China, Beijing, China","institution_ids":["https://openalex.org/I78988378"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Feng Zhang","orcid":"https://orcid.org/0000-0003-1983-7321"},"institutions":[{"id":"https://openalex.org/I78988378","display_name":"Renmin University of China","ror":"https://ror.org/041pakw92","country_code":"CN","type":"education","lineage":["https://openalex.org/I78988378"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Feng Zhang","raw_affiliation_strings":["Renmin University of China, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0003-1983-7321","affiliations":[{"raw_affiliation_string":"Renmin University of China, Beijing, China","institution_ids":["https://openalex.org/I78988378"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Chengxi Li","orcid":"https://orcid.org/0009-0002-8493-6238"},"institutions":[{"id":"https://openalex.org/I78988378","display_name":"Renmin University of China","ror":"https://ror.org/041pakw92","country_code":"CN","type":"education","lineage":["https://openalex.org/I78988378"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chengxi Li","raw_affiliation_strings":["Renmin University of China, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0002-8493-6238","affiliations":[{"raw_affiliation_string":"Renmin University of China, Beijing, China","institution_ids":["https://openalex.org/I78988378"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Lei Cao","orcid":"https://orcid.org/0000-0001-9909-8607"},"institutions":[{"id":"https://openalex.org/I4210139712","display_name":"American Samoa Government","ror":"https://ror.org/03t879f74","country_code":"AS","type":"government","lineage":["https://openalex.org/I4210139712"]},{"id":"https://openalex.org/I63966007","display_name":"Massachusetts Institute of Technology","ror":"https://ror.org/042nb2s44","country_code":"US","type":"education","lineage":["https://openalex.org/I63966007"]}],"countries":["AS","US"],"is_corresponding":false,"raw_author_name":"Lei Cao","raw_affiliation_strings":["Massachusetts Institute of Technology, Cambridge, American Samoa"],"raw_orcid":"https://orcid.org/0000-0001-9909-8607","affiliations":[{"raw_affiliation_string":"Massachusetts Institute of Technology, Cambridge, American Samoa","institution_ids":["https://openalex.org/I63966007","https://openalex.org/I4210139712"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Zheng Chen","orcid":"https://orcid.org/0009-0000-8342-9504"},"institutions":[{"id":"https://openalex.org/I78988378","display_name":"Renmin University of China","ror":"https://ror.org/041pakw92","country_code":"CN","type":"education","lineage":["https://openalex.org/I78988378"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zheng Chen","raw_affiliation_strings":["Renmin University of China, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0000-8342-9504","affiliations":[{"raw_affiliation_string":"Renmin University of China, Beijing, China","institution_ids":["https://openalex.org/I78988378"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Jidong Zhai","orcid":"https://orcid.org/0000-0002-7656-6428"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jidong Zhai","raw_affiliation_strings":["Tsinghua University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-7656-6428","affiliations":[{"raw_affiliation_string":"Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":null,"display_name":"Xiaoyong Du","orcid":"https://orcid.org/0000-0002-5757-9135"},"institutions":[{"id":"https://openalex.org/I78988378","display_name":"Renmin University of China","ror":"https://ror.org/041pakw92","country_code":"CN","type":"education","lineage":["https://openalex.org/I78988378"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaoyong Du","raw_affiliation_strings":["Renmin University of China, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-5757-9135","affiliations":[{"raw_affiliation_string":"Renmin University of China, Beijing, China","institution_ids":["https://openalex.org/I78988378"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I78988378"],"apc_list":null,"apc_paid":null,"fwci":6.5198,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.96786051,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":95,"max":98},"biblio":{"volume":"3","issue":"4","first_page":"1","last_page":"28"},"is_retracted":false,"is_paratext":false,"is_xpac":true,"primary_topic":{"id":"https://openalex.org/T12157","display_name":"Geochemistry and Geologic Mapping","score":0.6625999808311462,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12157","display_name":"Geochemistry and Geologic Mapping","score":0.6625999808311462,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13067","display_name":"Geological Modeling and Analysis","score":0.03180000185966492,"subfield":{"id":"https://openalex.org/subfields/1906","display_name":"Geochemistry and Petrology"},"field":{"id":"https://openalex.org/fields/19","display_name":"Earth and Planetary Sciences"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14311","display_name":"Electrical and Electromagnetic Research","score":0.019500000402331352,"subfield":{"id":"https://openalex.org/subfields/3107","display_name":"Atomic and Molecular Physics, and Optics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6747999787330627},{"id":"https://openalex.org/keywords/partition","display_name":"Partition (number theory)","score":0.5461000204086304},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.4555000066757202},{"id":"https://openalex.org/keywords/k-nearest-neighbors-algorithm","display_name":"k-nearest neighbors algorithm","score":0.4496999979019165},{"id":"https://openalex.org/keywords/nearest-neighbor-search","display_name":"Nearest neighbor search","score":0.44670000672340393},{"id":"https://openalex.org/keywords/distributed-database","display_name":"Distributed database","score":0.42179998755455017},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.4007999897003174},{"id":"https://openalex.org/keywords/pruning","display_name":"Pruning","score":0.36890000104904175}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7885000109672546},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6747999787330627},{"id":"https://openalex.org/C42812","wikidata":"https://www.wikidata.org/wiki/Q1082910","display_name":"Partition (number theory)","level":2,"score":0.5461000204086304},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.4555000066757202},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.45179998874664307},{"id":"https://openalex.org/C113238511","wikidata":"https://www.wikidata.org/wiki/Q1071612","display_name":"k-nearest neighbors algorithm","level":2,"score":0.4496999979019165},{"id":"https://openalex.org/C116738811","wikidata":"https://www.wikidata.org/wiki/Q608751","display_name":"Nearest neighbor search","level":2,"score":0.44670000672340393},{"id":"https://openalex.org/C70061542","wikidata":"https://www.wikidata.org/wiki/Q989016","display_name":"Distributed database","level":2,"score":0.42179998755455017},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.4007999897003174},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3896999955177307},{"id":"https://openalex.org/C108010975","wikidata":"https://www.wikidata.org/wiki/Q500094","display_name":"Pruning","level":2,"score":0.36890000104904175},{"id":"https://openalex.org/C33099171","wikidata":"https://www.wikidata.org/wiki/Q26208718","display_name":"Harmony search","level":2,"score":0.3628999888896942},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.35429999232292175},{"id":"https://openalex.org/C138959212","wikidata":"https://www.wikidata.org/wiki/Q1806783","display_name":"Load balancing (electrical power)","level":3,"score":0.3492000102996826},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.3285999894142151},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.2888000011444092},{"id":"https://openalex.org/C99844830","wikidata":"https://www.wikidata.org/wiki/Q102441924","display_name":"Scaling","level":2,"score":0.27300000190734863},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.27149999141693115},{"id":"https://openalex.org/C124304363","wikidata":"https://www.wikidata.org/wiki/Q673661","display_name":"Abstraction","level":2,"score":0.2678999900817871},{"id":"https://openalex.org/C125583679","wikidata":"https://www.wikidata.org/wiki/Q755673","display_name":"Search algorithm","level":2,"score":0.258899986743927},{"id":"https://openalex.org/C91481028","wikidata":"https://www.wikidata.org/wiki/Q1054686","display_name":"Distributed memory","level":3,"score":0.25589999556541443}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3749167","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3749167","pdf_url":null,"source":{"id":"https://openalex.org/S4387289859","display_name":"Proceedings of the ACM on Management of Data","issn_l":"2836-6573","issn":["2836-6573"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM on Management of Data","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":38,"referenced_works":["https://openalex.org/W1970319631","https://openalex.org/W1972115340","https://openalex.org/W1978475816","https://openalex.org/W1980090536","https://openalex.org/W1982063824","https://openalex.org/W2086504823","https://openalex.org/W2110026675","https://openalex.org/W2132234208","https://openalex.org/W2133995768","https://openalex.org/W2165558283","https://openalex.org/W2171572695","https://openalex.org/W2171790913","https://openalex.org/W2173213060","https://openalex.org/W2411707397","https://openalex.org/W2612493630","https://openalex.org/W2963213349","https://openalex.org/W2963284996","https://openalex.org/W3012754345","https://openalex.org/W3031031108","https://openalex.org/W3087592560","https://openalex.org/W3166125679","https://openalex.org/W3174809957","https://openalex.org/W3175777295","https://openalex.org/W4221159373","https://openalex.org/W4235797544","https://openalex.org/W4321446313","https://openalex.org/W4381329139","https://openalex.org/W4387321071","https://openalex.org/W4389491850","https://openalex.org/W4394744600","https://openalex.org/W4399175194","https://openalex.org/W4401352035","https://openalex.org/W4402435501","https://openalex.org/W4407357002","https://openalex.org/W4409310868","https://openalex.org/W4411403229","https://openalex.org/W4411403501","https://openalex.org/W6922057760"],"related_works":[],"abstract_inverted_index":{"Approximate":[0],"Nearest":[1],"Neighbor":[2],"Search":[3],"(ANNS)":[4],"is":[5],"essential":[6],"for":[7,50,180],"various":[8],"data-intensive":[9],"applications,":[10],"including":[11],"recommendation":[12],"systems,":[13],"image":[14],"retrieval,":[15],"and":[16,37,54,66,102,146,173],"machine":[17,30],"learning.":[18],"Scaling":[19],"ANNS":[20,91],"to":[21,72,78],"handle":[22],"billions":[23],"of":[24,56,111,133],"high-dimensional":[25],"vectors":[26],"on":[27,153,168],"a":[28,89,95,108],"single":[29],"presents":[31],"significant":[32,141],"challenges":[33],"in":[34,136,140,143,170],"memory":[35],"capacity":[36],"processing":[38,55],"efficiency.":[39],"To":[40],"address":[41],"these":[42],"challenges,":[43],"distributed":[44,90,162],"vector":[45,163],"databases":[46],"leverage":[47],"multiple":[48],"nodes":[49,116,172],"the":[51,81,131],"parallel":[52],"storage":[53],"vectors.":[57],"However,":[58],"existing":[59],"solutions":[60],"often":[61],"suffer":[62],"from":[63],"load":[64,113],"imbalance":[65],"high":[67],"communication":[68,120,147],"overhead,":[69],"primarily":[70],"due":[71],"traditional":[73,178],"partition":[74,98],"strategies":[75],"that":[76,93,129,158],"fail":[77],"effectively":[79,118],"distribute":[80],"workload.":[82],"In":[83],"this":[84],"paper,":[85],"we":[86],"introduce":[87],"Harmony,":[88],"system":[92],"employs":[94],"novel":[96],"multi-granularity":[97],"strategy,":[99],"combining":[100],"dimension-based":[101,137],"vector-based":[103],"partition.":[104],"This":[105],"strategy":[106],"ensures":[107],"balanced":[109],"distribution":[110,179],"computational":[112,145],"across":[114],"all":[115],"while":[117],"minimizing":[119],"costs.":[121],"Furthermore,":[122],"Harmony":[123,159],"incorporates":[124],"an":[125],"early-stop":[126],"pruning":[127],"mechanism":[128],"leverages":[130],"monotonicity":[132],"distance":[134],"computations":[135],"partition,":[138],"resulting":[139],"reductions":[142],"both":[144],"overhead.":[148],"We":[149],"conducted":[150],"extensive":[151],"experiments":[152],"diverse":[154],"real-world":[155],"datasets,":[156],"demonstrating":[157],"outperforms":[160],"leading":[161],"databases,":[164],"achieving":[165],"4.63\u00d7":[166],"throughput":[167],"average":[169],"four":[171],"58%":[174],"performance":[175],"improvement":[176],"over":[177],"skewed":[181],"workloads.":[182]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
