{"id":"https://openalex.org/W4281387537","doi":"https://doi.org/10.1145/3530800.3534532","title":"Efficient approximate search for sets of lineage vectors","display_name":"Efficient approximate search for sets of lineage vectors","publication_year":2022,"publication_date":"2022-05-23","ids":{"openalex":"https://openalex.org/W4281387537","doi":"https://doi.org/10.1145/3530800.3534532"},"language":"en","primary_location":{"id":"doi:10.1145/3530800.3534532","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3530800.3534532","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 14th International Workshop on the Theory and Practice of Provenance","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5030332092","display_name":"Michael Leybovich","orcid":null},"institutions":[{"id":"https://openalex.org/I174306211","display_name":"Technion \u2013 Israel Institute of Technology","ror":"https://ror.org/03qryx823","country_code":"IL","type":"education","lineage":["https://openalex.org/I174306211"]}],"countries":["IL"],"is_corresponding":true,"raw_author_name":"Michael Leybovich","raw_affiliation_strings":["Technion, Haifa, Israel"],"affiliations":[{"raw_affiliation_string":"Technion, Haifa, Israel","institution_ids":["https://openalex.org/I174306211"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5047193562","display_name":"Oded Shmueli","orcid":"https://orcid.org/0000-0003-4304-310X"},"institutions":[{"id":"https://openalex.org/I174306211","display_name":"Technion \u2013 Israel Institute of Technology","ror":"https://ror.org/03qryx823","country_code":"IL","type":"education","lineage":["https://openalex.org/I174306211"]}],"countries":["IL"],"is_corresponding":false,"raw_author_name":"Oded Shmueli","raw_affiliation_strings":["Technion, Haifa, Israel"],"affiliations":[{"raw_affiliation_string":"Technion, Haifa, Israel","institution_ids":["https://openalex.org/I174306211"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5030332092"],"corresponding_institution_ids":["https://openalex.org/I174306211"],"apc_list":null,"apc_paid":null,"fwci":0.1007,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.35341695,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9745000004768372,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.9674999713897705,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/nearest-neighbor-search","display_name":"Nearest neighbor search","score":0.6391115784645081},{"id":"https://openalex.org/keywords/similarity-measure","display_name":"Similarity measure","score":0.6040568351745605},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.5427366495132446},{"id":"https://openalex.org/keywords/tuple","display_name":"Tuple","score":0.5331677198410034},{"id":"https://openalex.org/keywords/vector-quantization","display_name":"Vector quantization","score":0.5092614889144897},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.47785255312919617},{"id":"https://openalex.org/keywords/measure","display_name":"Measure (data warehouse)","score":0.4667074382305145},{"id":"https://openalex.org/keywords/euclidean-distance","display_name":"Euclidean distance","score":0.4439443349838257},{"id":"https://openalex.org/keywords/cosine-similarity","display_name":"Cosine similarity","score":0.4413510859012604},{"id":"https://openalex.org/keywords/locality-sensitive-hashing","display_name":"Locality-sensitive hashing","score":0.42543643712997437},{"id":"https://openalex.org/keywords/feature-vector","display_name":"Feature vector","score":0.4127046763896942},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.40880194306373596},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.39532679319381714},{"id":"https://openalex.org/keywords/hash-function","display_name":"Hash function","score":0.31409555673599243},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.30713656544685364},{"id":"https://openalex.org/keywords/discrete-mathematics","display_name":"Discrete mathematics","score":0.24362608790397644},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.19685155153274536},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.18683260679244995},{"id":"https://openalex.org/keywords/hash-table","display_name":"Hash table","score":0.163884699344635}],"concepts":[{"id":"https://openalex.org/C116738811","wikidata":"https://www.wikidata.org/wiki/Q608751","display_name":"Nearest neighbor search","level":2,"score":0.6391115784645081},{"id":"https://openalex.org/C2776517306","wikidata":"https://www.wikidata.org/wiki/Q29017317","display_name":"Similarity measure","level":2,"score":0.6040568351745605},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.5427366495132446},{"id":"https://openalex.org/C118930307","wikidata":"https://www.wikidata.org/wiki/Q600590","display_name":"Tuple","level":2,"score":0.5331677198410034},{"id":"https://openalex.org/C199833920","wikidata":"https://www.wikidata.org/wiki/Q612536","display_name":"Vector quantization","level":2,"score":0.5092614889144897},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.47785255312919617},{"id":"https://openalex.org/C2780009758","wikidata":"https://www.wikidata.org/wiki/Q6804172","display_name":"Measure (data warehouse)","level":2,"score":0.4667074382305145},{"id":"https://openalex.org/C120174047","wikidata":"https://www.wikidata.org/wiki/Q847073","display_name":"Euclidean distance","level":2,"score":0.4439443349838257},{"id":"https://openalex.org/C2780762811","wikidata":"https://www.wikidata.org/wiki/Q1784941","display_name":"Cosine similarity","level":3,"score":0.4413510859012604},{"id":"https://openalex.org/C74270461","wikidata":"https://www.wikidata.org/wiki/Q1625299","display_name":"Locality-sensitive hashing","level":4,"score":0.42543643712997437},{"id":"https://openalex.org/C83665646","wikidata":"https://www.wikidata.org/wiki/Q42139305","display_name":"Feature vector","level":2,"score":0.4127046763896942},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.40880194306373596},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.39532679319381714},{"id":"https://openalex.org/C99138194","wikidata":"https://www.wikidata.org/wiki/Q183427","display_name":"Hash function","level":2,"score":0.31409555673599243},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.30713656544685364},{"id":"https://openalex.org/C118615104","wikidata":"https://www.wikidata.org/wiki/Q121416","display_name":"Discrete mathematics","level":1,"score":0.24362608790397644},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.19685155153274536},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.18683260679244995},{"id":"https://openalex.org/C67388219","wikidata":"https://www.wikidata.org/wiki/Q207440","display_name":"Hash table","level":3,"score":0.163884699344635},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3530800.3534532","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3530800.3534532","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 14th International Workshop on the Theory and Practice of Provenance","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":8,"referenced_works":["https://openalex.org/W1997944350","https://openalex.org/W2086504823","https://openalex.org/W2124509324","https://openalex.org/W2151103935","https://openalex.org/W2408388496","https://openalex.org/W2949985202","https://openalex.org/W2963469388","https://openalex.org/W3003257820"],"related_works":["https://openalex.org/W2811335600","https://openalex.org/W1548642819","https://openalex.org/W2118410043","https://openalex.org/W2111242237","https://openalex.org/W2110166424","https://openalex.org/W3049072127","https://openalex.org/W4239902399","https://openalex.org/W3197477509","https://openalex.org/W3183008607","https://openalex.org/W2001439237"],"abstract_inverted_index":{"One":[0],"can":[1],"approximate":[2,101,152,265,279],"the":[3,33,46,65,118,122,130,134,174,178,184,199,203,223,258,263,277],"lineage":[4,21,47],"of":[5,14,30,42,61,73,108,113,158,177,202,228,236,243],"a":[6,11,28,52,106,145,189,211,241],"Database":[7],"(DB)":[8],"tuple":[9],"using":[10,23],"small":[12],"set":[13,29,77,82,107,242],"low":[15],"dimensional":[16],"vectors.":[17,251],"To":[18,93],"identify":[19],"actual":[20],"tuples":[22],"these":[24,237],"vector":[25,165,267,291],"sets,":[26,141],"given":[27,105],"vectors":[31,43,109,114,244],"(of":[32],"target":[34],"tuple),":[35],"one":[36,75,80],"needs":[37],"to":[38,182,256],"locate":[39],"\"close\"":[40],"sets":[41,57,112,124,138,227],"associated":[44],"with":[45,226],"tuples.":[48],"We":[49,172],"first":[50],"consider":[51],"similarity":[53,86,131,204,275],"measure":[54,87,181],"between":[55,71],"two":[56],"A":[58,78,110,245],"and":[59,67,79,90,111,168,273],"B":[60],"vectors,":[62,74],"that":[63,104,128],"balances":[64],"average":[66],"maximum":[68],"cosine":[69,179],"distance":[70,180],"pairs":[72],"from":[76,81],"B.":[83],"The":[84,231],"proposed":[85,278],"is":[88,144,239],"intuitive":[89],"permutation":[91],"invariant.":[92],"practically":[94],"realize":[95],"this":[96,194,207,216],"measure,":[97],"we":[98,209,219,253],"need":[99],"an":[100,286],"search":[102,153,160,186,191,260,268,280,289],"algorithm":[103,119],"B1,":[115],"...,":[116,126],"Bn,":[117],"quickly":[120],"locates":[121],"k-closest":[123],"Bi1":[125],"Bik":[127],"maximize":[129],"measure.":[132,205],"For":[133,206,215,270],"case":[135],"where":[136],"all":[137],"are":[139,149,254],"singleton":[140],"essentially":[142],"each":[143],"single":[146],"vector,":[147],"there":[148],"known":[150],"efficient":[151],"algorithms,":[154,161],"e.g.,":[155],"approximated":[156],"versions":[157],"tree":[159],"locality-sensitive":[162],"hashing":[163],"(LSH),":[164],"quantization":[166],"(VQ)":[167],"proximity":[169],"graph":[170],"algorithms.":[171],"utilize":[173],"mathematical":[175],"properties":[176],"transform":[183,257],"set-set":[185,259],"problem":[187,261],"into":[188,262],"vector-vector":[190],"problem.":[192,269],"However,":[193],"abovementioned":[195],"transformation":[196],"cannot":[197],"handle":[198],"Euclidean-based":[200,274],"version":[201],"version,":[208],"devise":[210],"more":[212],"elaborate":[213],"transformation.":[214],"latter":[217],"transformation,":[218],"present":[220],"algorithms":[221],"for":[222],"general":[224],"case,":[225],"differing":[229],"cardinalities.":[230],"underlying":[232],"idea":[233],"in":[234],"both":[235,271],"transformations":[238],"encoding":[240],"via":[246],"|A|":[247],"\"long\"":[248],"independent":[249],"representative":[250],"Then,":[252],"able":[255],"well-studied":[264],"(ordinary)":[266],"cosine-based":[272],"measures,":[276],"achieves":[281],"significant":[282],"performance":[283],"gains":[284],"over":[285],"optimized,":[287],"exact":[288],"on":[290],"sets.":[292]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
