{"id":"https://openalex.org/W2794739930","doi":"https://doi.org/10.1145/3190645.3190700","title":"Using locality sensitive hashing to improve the KNN algorithm in the mapreduce framework","display_name":"Using locality sensitive hashing to improve the KNN algorithm in the mapreduce framework","publication_year":2018,"publication_date":"2018-03-29","ids":{"openalex":"https://openalex.org/W2794739930","doi":"https://doi.org/10.1145/3190645.3190700","mag":"2794739930"},"language":"en","primary_location":{"id":"doi:10.1145/3190645.3190700","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3190645.3190700","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACMSE 2018 Conference","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5038428882","display_name":"Sikha Bagui","orcid":"https://orcid.org/0000-0002-1886-4582"},"institutions":[{"id":"https://openalex.org/I83683471","display_name":"University of West Florida","ror":"https://ror.org/002w4zy91","country_code":"US","type":"education","lineage":["https://openalex.org/I83683471"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Sikha Bagui","raw_affiliation_strings":["University of West Florida"],"affiliations":[{"raw_affiliation_string":"University of West Florida","institution_ids":["https://openalex.org/I83683471"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082115478","display_name":"Arup Mondal","orcid":"https://orcid.org/0000-0002-8970-3380"},"institutions":[{"id":"https://openalex.org/I83683471","display_name":"University of West Florida","ror":"https://ror.org/002w4zy91","country_code":"US","type":"education","lineage":["https://openalex.org/I83683471"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Arup Kumar Mondal","raw_affiliation_strings":["University of West Florida"],"affiliations":[{"raw_affiliation_string":"University of West Florida","institution_ids":["https://openalex.org/I83683471"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5110966564","display_name":"Subhash Bagui","orcid":null},"institutions":[{"id":"https://openalex.org/I83683471","display_name":"University of West Florida","ror":"https://ror.org/002w4zy91","country_code":"US","type":"education","lineage":["https://openalex.org/I83683471"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Subhash Bagui","raw_affiliation_strings":["University of West Florida"],"affiliations":[{"raw_affiliation_string":"University of West Florida","institution_ids":["https://openalex.org/I83683471"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5038428882"],"corresponding_institution_ids":["https://openalex.org/I83683471"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.02478312,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"1"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9886999726295471,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10057","display_name":"Face and Expression Recognition","score":0.9853000044822693,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/hash-function","display_name":"Hash function","score":0.78546142578125},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7636159658432007},{"id":"https://openalex.org/keywords/locality-sensitive-hashing","display_name":"Locality-sensitive hashing","score":0.7241709232330322},{"id":"https://openalex.org/keywords/k-nearest-neighbors-algorithm","display_name":"k-nearest neighbors algorithm","score":0.5552470684051514},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.4933415949344635},{"id":"https://openalex.org/keywords/jaccard-index","display_name":"Jaccard index","score":0.48635751008987427},{"id":"https://openalex.org/keywords/nearest-neighbor-search","display_name":"Nearest neighbor search","score":0.46981102228164673},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4655761122703552},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4290401339530945},{"id":"https://openalex.org/keywords/sample","display_name":"Sample (material)","score":0.41679179668426514},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3787570595741272},{"id":"https://openalex.org/keywords/hash-table","display_name":"Hash table","score":0.31780868768692017}],"concepts":[{"id":"https://openalex.org/C99138194","wikidata":"https://www.wikidata.org/wiki/Q183427","display_name":"Hash function","level":2,"score":0.78546142578125},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7636159658432007},{"id":"https://openalex.org/C74270461","wikidata":"https://www.wikidata.org/wiki/Q1625299","display_name":"Locality-sensitive hashing","level":4,"score":0.7241709232330322},{"id":"https://openalex.org/C113238511","wikidata":"https://www.wikidata.org/wiki/Q1071612","display_name":"k-nearest neighbors algorithm","level":2,"score":0.5552470684051514},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4933415949344635},{"id":"https://openalex.org/C203519979","wikidata":"https://www.wikidata.org/wiki/Q865360","display_name":"Jaccard index","level":3,"score":0.48635751008987427},{"id":"https://openalex.org/C116738811","wikidata":"https://www.wikidata.org/wiki/Q608751","display_name":"Nearest neighbor search","level":2,"score":0.46981102228164673},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4655761122703552},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4290401339530945},{"id":"https://openalex.org/C198531522","wikidata":"https://www.wikidata.org/wiki/Q485146","display_name":"Sample (material)","level":2,"score":0.41679179668426514},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3787570595741272},{"id":"https://openalex.org/C67388219","wikidata":"https://www.wikidata.org/wiki/Q207440","display_name":"Hash table","level":3,"score":0.31780868768692017},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C43617362","wikidata":"https://www.wikidata.org/wiki/Q170050","display_name":"Chromatography","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3190645.3190700","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3190645.3190700","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACMSE 2018 Conference","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2911483473","https://openalex.org/W2148008870","https://openalex.org/W2381195555","https://openalex.org/W4401133510","https://openalex.org/W2166822184","https://openalex.org/W3096071782","https://openalex.org/W2902799860","https://openalex.org/W4289129280","https://openalex.org/W2754607325","https://openalex.org/W2901290148"],"abstract_inverted_index":{"The":[0,20,38,149,206,278],"K-Nearest":[1],"Neighbor!":[2],"(KNN)":[3],"algorithm":[4,21,41,151],"is":[5,126],"one":[6],"of":[7,46,121,159,175,177,202,228,235,280],"the":[8,48,60,65,69,91,97,105,122,141,162,168,173,194,199,210,214,222,233,236,241,245,281],"most":[9],"widely":[10],"used":[11,29,167],"algorithms":[12],"in":[13,25,33,59,193,252,269,285,287],"data":[14,53,57,80,86,131,179,185,191,216,301],"mining":[15],"for":[16,82,261],"classification":[17],"and":[18,55,63,88,107,137,188,247,273],"prediction.":[19],"has":[22],"several":[23,147],"applications:":[24],"facial":[26],"detection":[27],"when":[28],"with":[30,138,181],"deep":[31],"learning,":[32],"biometric":[34],"security":[35],"applications":[36],"etc.":[37],"traditional":[39],"KNN":[40,150,286,296],"involves":[42],"an":[43,259],"iterative":[44],"process":[45],"computing":[47],"distance":[49],"between":[50],"a":[51,84,130,156,178,266,270,299],"test":[52,85,92,108],"point":[54,58,87],"every":[56],"training":[61,71,79,142,164],"dataset,":[62],"classifying":[64,83],"object":[66],"based":[67,95],"on":[68,96,265],"closest":[70],"sample.":[72],"This":[73,197],"method":[74],"first":[75],"selects":[76],"K":[77],"nearest":[78],"points":[81,186,192],"then":[89,153],"predicts":[90],"sample's":[93],"class":[94,99],"majority":[98],"among":[100],"those":[101],"neighbors.":[102],"If":[103],"both":[104],"train":[106],"datasets":[109,264],"are":[110],"large,":[111],"this":[112,139],"conventional":[113,246,295],"form":[114],"can":[115],"be":[116,219],"considered":[117],"computationally":[118],"expensive.":[119],"Reduction":[120],"massive":[123,276],"calculation":[124],"that":[125],"required":[127],"to":[128,171,231,239,297],"predict":[129],"vector":[132,180],"was":[133,144,152,198,230],"our":[134,203,226],"main":[135],"goal,":[136],"intention,":[140],"dataset":[143],"split":[145],"into":[146],"buckets.":[148],"performed":[154],"inside":[155],"bucket,":[157],"instead":[158],"iterating":[160],"over":[161],"whole":[163],"dataset.":[165],"We":[166],"Jaccard":[169],"Coefficient":[170],"determine":[172],"degree":[174],"similarity":[176],"some":[182],"arbitrarily":[183],"defined":[184],"P":[187],"placed":[189],"similar":[190,215],"same":[195],"bucket.":[196],"core":[200],"functionality":[201],"hash":[204,207,237],"function.":[205],"function":[208],"determines":[209],"bucket":[211],"number":[212],"where":[213],"vectors":[217],"will":[218],"placed.":[220],"Unlike":[221],"standard":[223],"hashing":[224,229,284],"algorithm,":[225],"approach":[227],"maximize":[232],"probability":[234],"collision":[238],"preserve":[240],"locality":[242,282],"sensitiveness.":[243],"Both":[244],"proposed":[248],"methods":[249],"were":[250],"implemented":[251],"Hadoop's":[253,288],"MapReduce":[254,289],"framework.":[255],"Hadoop":[256],"gives":[257,274],"us":[258,275],"architecture":[260],"handling":[262],"large":[263],"computer":[267],"cluster":[268],"distributed":[271],"manner":[272],"scalability.":[277],"use":[279],"sensitive":[283],"environment":[290],"took":[291],"less":[292],"time":[293],"than":[294],"classify":[298],"new":[300],"object.":[302]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
