{"id":"https://openalex.org/W2019336343","doi":"https://doi.org/10.1145/1401890.1401921","title":"Locality sensitive hash functions based on concomitant rank order statistics","display_name":"Locality sensitive hash functions based on concomitant rank order statistics","publication_year":2008,"publication_date":"2008-08-24","ids":{"openalex":"https://openalex.org/W2019336343","doi":"https://doi.org/10.1145/1401890.1401921","mag":"2019336343"},"language":"en","primary_location":{"id":"doi:10.1145/1401890.1401921","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1401890.1401921","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 14th ACM SIGKDD international conference on Knowledge discovery and data mining","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5088426443","display_name":"Kave Eshghi","orcid":"https://orcid.org/0000-0003-3374-3145"},"institutions":[{"id":"https://openalex.org/I1324840837","display_name":"Hewlett-Packard (United States)","ror":"https://ror.org/059rn9488","country_code":"US","type":"company","lineage":["https://openalex.org/I1324840837"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Kave Eshghi","raw_affiliation_strings":["Hewlett Packard Laboratories, Palo Alto, CA, USA"],"affiliations":[{"raw_affiliation_string":"Hewlett Packard Laboratories, Palo Alto, CA, USA","institution_ids":["https://openalex.org/I1324840837"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5103446659","display_name":"Shyamsundar Rajaram","orcid":null},"institutions":[{"id":"https://openalex.org/I1324840837","display_name":"Hewlett-Packard (United States)","ror":"https://ror.org/059rn9488","country_code":"US","type":"company","lineage":["https://openalex.org/I1324840837"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Shyamsundar Rajaram","raw_affiliation_strings":["Hewlett Packard Laboratories, Palo Alto, CA, USA"],"affiliations":[{"raw_affiliation_string":"Hewlett Packard Laboratories, Palo Alto, CA, USA","institution_ids":["https://openalex.org/I1324840837"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5088426443"],"corresponding_institution_ids":["https://openalex.org/I1324840837"],"apc_list":null,"apc_paid":null,"fwci":3.1606,"has_fulltext":false,"cited_by_count":43,"citation_normalized_percentile":{"value":0.92005396,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"221","last_page":"229"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.993399977684021,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10500","display_name":"Sparse and Compressive Sensing Techniques","score":0.991599977016449,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/hash-function","display_name":"Hash function","score":0.7324908971786499},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.6463366150856018},{"id":"https://openalex.org/keywords/rank","display_name":"Rank (graph theory)","score":0.6298630833625793},{"id":"https://openalex.org/keywords/cosine-similarity","display_name":"Cosine similarity","score":0.613955557346344},{"id":"https://openalex.org/keywords/locality-sensitive-hashing","display_name":"Locality-sensitive hashing","score":0.57733154296875},{"id":"https://openalex.org/keywords/locality","display_name":"Locality","score":0.5314615964889526},{"id":"https://openalex.org/keywords/bivariate-analysis","display_name":"Bivariate analysis","score":0.5303545594215393},{"id":"https://openalex.org/keywords/k-independent-hashing","display_name":"K-independent hashing","score":0.5090693831443787},{"id":"https://openalex.org/keywords/measure","display_name":"Measure (data warehouse)","score":0.49911022186279297},{"id":"https://openalex.org/keywords/perfect-hash-function","display_name":"Perfect hash function","score":0.44343143701553345},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.4280017912387848},{"id":"https://openalex.org/keywords/combinatorics","display_name":"Combinatorics","score":0.35776054859161377},{"id":"https://openalex.org/keywords/discrete-mathematics","display_name":"Discrete mathematics","score":0.33455610275268555},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.30348461866378784},{"id":"https://openalex.org/keywords/hash-table","display_name":"Hash table","score":0.2105933129787445},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.2097245454788208},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.10858017206192017},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.07980048656463623}],"concepts":[{"id":"https://openalex.org/C99138194","wikidata":"https://www.wikidata.org/wiki/Q183427","display_name":"Hash function","level":2,"score":0.7324908971786499},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.6463366150856018},{"id":"https://openalex.org/C164226766","wikidata":"https://www.wikidata.org/wiki/Q7293202","display_name":"Rank (graph theory)","level":2,"score":0.6298630833625793},{"id":"https://openalex.org/C2780762811","wikidata":"https://www.wikidata.org/wiki/Q1784941","display_name":"Cosine similarity","level":3,"score":0.613955557346344},{"id":"https://openalex.org/C74270461","wikidata":"https://www.wikidata.org/wiki/Q1625299","display_name":"Locality-sensitive hashing","level":4,"score":0.57733154296875},{"id":"https://openalex.org/C2779808786","wikidata":"https://www.wikidata.org/wiki/Q6664603","display_name":"Locality","level":2,"score":0.5314615964889526},{"id":"https://openalex.org/C64341305","wikidata":"https://www.wikidata.org/wiki/Q4919225","display_name":"Bivariate analysis","level":2,"score":0.5303545594215393},{"id":"https://openalex.org/C187062812","wikidata":"https://www.wikidata.org/wiki/Q6322840","display_name":"K-independent hashing","level":5,"score":0.5090693831443787},{"id":"https://openalex.org/C2780009758","wikidata":"https://www.wikidata.org/wiki/Q6804172","display_name":"Measure (data warehouse)","level":2,"score":0.49911022186279297},{"id":"https://openalex.org/C87431388","wikidata":"https://www.wikidata.org/wiki/Q2070573","display_name":"Perfect hash function","level":4,"score":0.44343143701553345},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.4280017912387848},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.35776054859161377},{"id":"https://openalex.org/C118615104","wikidata":"https://www.wikidata.org/wiki/Q121416","display_name":"Discrete mathematics","level":1,"score":0.33455610275268555},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.30348461866378784},{"id":"https://openalex.org/C67388219","wikidata":"https://www.wikidata.org/wiki/Q207440","display_name":"Hash table","level":3,"score":0.2105933129787445},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.2097245454788208},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.10858017206192017},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.07980048656463623},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/1401890.1401921","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1401890.1401921","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 14th ACM SIGKDD international conference on Knowledge discovery and data mining","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320334763","display_name":"Leibniz-Gemeinschaft","ror":"https://ror.org/01n6r0e97"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":19,"referenced_works":["https://openalex.org/W112162828","https://openalex.org/W1517583229","https://openalex.org/W1577871831","https://openalex.org/W1964201646","https://openalex.org/W2012833704","https://openalex.org/W2041836310","https://openalex.org/W2055289292","https://openalex.org/W2071572981","https://openalex.org/W2122056984","https://openalex.org/W2145065594","https://openalex.org/W2147717514","https://openalex.org/W2151103935","https://openalex.org/W2162006472","https://openalex.org/W2165612380","https://openalex.org/W2172232203","https://openalex.org/W2435338979","https://openalex.org/W3005890292","https://openalex.org/W3119059448","https://openalex.org/W4300092438"],"related_works":["https://openalex.org/W2100189723","https://openalex.org/W2072057882","https://openalex.org/W2962718115","https://openalex.org/W2094127768","https://openalex.org/W2604946233","https://openalex.org/W2772711833","https://openalex.org/W2951390818","https://openalex.org/W2963563740","https://openalex.org/W2257108927","https://openalex.org/W3136593074"],"abstract_inverted_index":{"Locality":[0],"Sensitive":[1],"Hash":[2],"functions":[3,46],"are":[4,20],"invaluable":[5],"tools":[6],"for":[7,47,127],"approximate":[8],"near":[9],"neighbor":[10],"problems":[11],"in":[12,60,97],"high":[13],"dimensional":[14],"spaces.":[15],"In":[16],"this":[17,36],"work,":[18],"we":[19],"focused":[21],"on":[22,53],"LSH":[23],"schemes":[24],"where":[25],"the":[26,30,48,54,87,90,98,111,128],"similarity":[27,50],"metric":[28],"is":[29,38],"cosine":[31,49,129],"measure.":[32,130],"The":[33],"contribution":[34],"of":[35,42,56,93,100,110],"work":[37],"a":[39,79,101,116],"new":[40],"class":[41],"locality":[43,117],"sensitive":[44,118],"hash":[45,119],"measure":[51],"based":[52],"theory":[55,85],"concomitants,":[57],"which":[58],"arises":[59],"order":[61,91],"statistics.":[62],"Consider":[63],"n":[64],"i.i.d":[65],"sample":[66],"pairs,":[67],"{(X1;":[68],"Y1);":[69],"(X2;":[70],"Y2);":[71],":":[72,73,74],";(Xn;":[75],"Yn)}":[76],"obtained":[77],"from":[78],"bivariate":[80],"distribution":[81,103,113],"f(X,":[82],"Y).":[83],"Concomitant":[84],"captures":[86],"relation":[88],"between":[89],"statistics":[92],"X":[94],"and":[95],"Y":[96],"form":[99],"rank":[102,112],"given":[104],"by":[105],"Prob(Rank(Yi)=j-Rank(Xi)=k).":[106],"We":[107],"exploit":[108],"properties":[109,126],"towards":[114],"developing":[115],"family":[120],"that":[121],"has":[122],"excellent":[123],"collision":[124],"rate":[125]},"counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":4},{"year":2019,"cited_by_count":3},{"year":2018,"cited_by_count":3},{"year":2017,"cited_by_count":4},{"year":2016,"cited_by_count":5},{"year":2015,"cited_by_count":1},{"year":2014,"cited_by_count":3},{"year":2013,"cited_by_count":2},{"year":2012,"cited_by_count":4}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
