{"id":"https://openalex.org/W2766364198","doi":"https://doi.org/10.1109/icinfa.2017.8079062","title":"Research on K nearest neighbor join for big data","display_name":"Research on K nearest neighbor join for big data","publication_year":2017,"publication_date":"2017-07-01","ids":{"openalex":"https://openalex.org/W2766364198","doi":"https://doi.org/10.1109/icinfa.2017.8079062","mag":"2766364198"},"language":"en","primary_location":{"id":"doi:10.1109/icinfa.2017.8079062","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icinfa.2017.8079062","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE International Conference on Information and Automation (ICIA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103785417","display_name":"Ji JiaQi","orcid":null},"institutions":[{"id":"https://openalex.org/I77079311","display_name":"Wonkwang University","ror":"https://ror.org/006776986","country_code":"KR","type":"education","lineage":["https://openalex.org/I77079311"]},{"id":"https://openalex.org/I94611258","display_name":"Hebei Normal University","ror":"https://ror.org/004rbbw49","country_code":"CN","type":"education","lineage":["https://openalex.org/I94611258"]}],"countries":["CN","KR"],"is_corresponding":true,"raw_author_name":"Ji Jiaqi","raw_affiliation_strings":["Department of Computer Engineering, Wonkwang University, Iksan","Korean Department of information center, Hebei Normal University for Nationalities, Chengde, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Engineering, Wonkwang University, Iksan","institution_ids":["https://openalex.org/I77079311"]},{"raw_affiliation_string":"Korean Department of information center, Hebei Normal University for Nationalities, Chengde, China","institution_ids":["https://openalex.org/I94611258"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5056075408","display_name":"Yeong-Jee Chung","orcid":null},"institutions":[{"id":"https://openalex.org/I77079311","display_name":"Wonkwang University","ror":"https://ror.org/006776986","country_code":"KR","type":"education","lineage":["https://openalex.org/I77079311"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Yeongjee Chung","raw_affiliation_strings":["Department of Computer Engineering, Wonkwang University, Iksan"],"affiliations":[{"raw_affiliation_string":"Department of Computer Engineering, Wonkwang University, Iksan","institution_ids":["https://openalex.org/I77079311"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5103785417"],"corresponding_institution_ids":["https://openalex.org/I77079311","https://openalex.org/I94611258"],"apc_list":null,"apc_paid":null,"fwci":0.1849,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.47133099,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":"1","issue":null,"first_page":"1077","last_page":"1081"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9894999861717224,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/join","display_name":"Join (topology)","score":0.8346896171569824},{"id":"https://openalex.org/keywords/k-nearest-neighbors-algorithm","display_name":"k-nearest neighbors algorithm","score":0.7320684194564819},{"id":"https://openalex.org/keywords/locality-sensitive-hashing","display_name":"Locality-sensitive hashing","score":0.7173184752464294},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7136668562889099},{"id":"https://openalex.org/keywords/spark","display_name":"SPARK (programming language)","score":0.6888145804405212},{"id":"https://openalex.org/keywords/nearest-neighbor-chain-algorithm","display_name":"Nearest-neighbor chain algorithm","score":0.6682890057563782},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.5910968780517578},{"id":"https://openalex.org/keywords/hash-function","display_name":"Hash function","score":0.5532307028770447},{"id":"https://openalex.org/keywords/nearest-neighbor-search","display_name":"Nearest neighbor search","score":0.52346271276474},{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.46995142102241516},{"id":"https://openalex.org/keywords/dimension","display_name":"Dimension (graph theory)","score":0.4638836979866028},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.46065282821655273},{"id":"https://openalex.org/keywords/volume","display_name":"Volume (thermodynamics)","score":0.44860249757766724},{"id":"https://openalex.org/keywords/locality","display_name":"Locality","score":0.4156954884529114},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3572757840156555},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.3103097379207611},{"id":"https://openalex.org/keywords/hash-table","display_name":"Hash table","score":0.2553362548351288},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.19785264134407043},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.13093024492263794},{"id":"https://openalex.org/keywords/canopy-clustering-algorithm","display_name":"Canopy clustering algorithm","score":0.06779369711875916}],"concepts":[{"id":"https://openalex.org/C2776124973","wikidata":"https://www.wikidata.org/wiki/Q3183033","display_name":"Join (topology)","level":2,"score":0.8346896171569824},{"id":"https://openalex.org/C113238511","wikidata":"https://www.wikidata.org/wiki/Q1071612","display_name":"k-nearest neighbors algorithm","level":2,"score":0.7320684194564819},{"id":"https://openalex.org/C74270461","wikidata":"https://www.wikidata.org/wiki/Q1625299","display_name":"Locality-sensitive hashing","level":4,"score":0.7173184752464294},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7136668562889099},{"id":"https://openalex.org/C2781215313","wikidata":"https://www.wikidata.org/wiki/Q3493345","display_name":"SPARK (programming language)","level":2,"score":0.6888145804405212},{"id":"https://openalex.org/C102164700","wikidata":"https://www.wikidata.org/wiki/Q17162702","display_name":"Nearest-neighbor chain algorithm","level":5,"score":0.6682890057563782},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5910968780517578},{"id":"https://openalex.org/C99138194","wikidata":"https://www.wikidata.org/wiki/Q183427","display_name":"Hash function","level":2,"score":0.5532307028770447},{"id":"https://openalex.org/C116738811","wikidata":"https://www.wikidata.org/wiki/Q608751","display_name":"Nearest neighbor search","level":2,"score":0.52346271276474},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.46995142102241516},{"id":"https://openalex.org/C33676613","wikidata":"https://www.wikidata.org/wiki/Q13415176","display_name":"Dimension (graph theory)","level":2,"score":0.4638836979866028},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.46065282821655273},{"id":"https://openalex.org/C20556612","wikidata":"https://www.wikidata.org/wiki/Q4469374","display_name":"Volume (thermodynamics)","level":2,"score":0.44860249757766724},{"id":"https://openalex.org/C2779808786","wikidata":"https://www.wikidata.org/wiki/Q6664603","display_name":"Locality","level":2,"score":0.4156954884529114},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3572757840156555},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.3103097379207611},{"id":"https://openalex.org/C67388219","wikidata":"https://www.wikidata.org/wiki/Q207440","display_name":"Hash table","level":3,"score":0.2553362548351288},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.19785264134407043},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.13093024492263794},{"id":"https://openalex.org/C104047586","wikidata":"https://www.wikidata.org/wiki/Q5033439","display_name":"Canopy clustering algorithm","level":4,"score":0.06779369711875916},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C94641424","wikidata":"https://www.wikidata.org/wiki/Q5172845","display_name":"Correlation clustering","level":3,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icinfa.2017.8079062","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icinfa.2017.8079062","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE International Conference on Information and Automation (ICIA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":19,"referenced_works":["https://openalex.org/W195533127","https://openalex.org/W2016854254","https://openalex.org/W2055398586","https://openalex.org/W2248980053","https://openalex.org/W2280045208","https://openalex.org/W2290145898","https://openalex.org/W2294063811","https://openalex.org/W2305675433","https://openalex.org/W2345395130","https://openalex.org/W2432436793","https://openalex.org/W2542459869","https://openalex.org/W2546169252","https://openalex.org/W2578717751","https://openalex.org/W2584010011","https://openalex.org/W2586932945","https://openalex.org/W2601797069","https://openalex.org/W4237196177","https://openalex.org/W6691403539","https://openalex.org/W6694970861"],"related_works":["https://openalex.org/W2166822184","https://openalex.org/W2148008870","https://openalex.org/W2011582495","https://openalex.org/W2169618946","https://openalex.org/W2182477562","https://openalex.org/W2143679819","https://openalex.org/W2519241726","https://openalex.org/W3096071782","https://openalex.org/W2902799860","https://openalex.org/W4289129280"],"abstract_inverted_index":{"K":[0],"Nearest":[1],"Neighbor":[2],"Join":[3,31],"(KNN":[4],"Join)":[5],"is":[6,32,77,121],"a":[7,18,33,60,69],"primitive":[8],"operation":[9],"widely":[10],"adopted":[11],"by":[12],"many":[13],"data":[14,42,45],"mining":[15],"applications.":[16],"As":[17],"combination":[19],"of":[20,41,67,95,102],"the":[21,27,39,47,65,87,93,100,105],"k":[22,96],"nearest":[23,97],"neighbor":[24],"query":[25],"and":[26,44,123],"join":[28],"operation,":[29],"KNN":[30],"computationally":[34],"intensive":[35],"algorithm;":[36],"however,":[37],"with":[38],"increase":[40],"volume":[43],"dimension,":[46],"results":[48,115],"can't":[49],"be":[50,108],"obtained":[51],"within":[52],"acceptable":[53],"time":[54],"when":[55],"this":[56,118],"algorithm":[57,81],"runs":[58],"on":[59,64,111],"single":[61],"machine.":[62],"Consequently,":[63],"basis":[66],"Spark,":[68],"new":[70],"approach":[71,120],"that":[72,117],"employs":[73],"Locality-Sensitive":[74],"Hashing":[75],"(LSH)":[76],"proposed.":[78],"The":[79,113],"LSH":[80],"first":[82],"maps":[83],"similar":[84],"objects":[85,103],"onto":[86],"same":[88],"bucket,":[89],"which":[90],"can":[91,107],"reduce":[92],"set":[94],"neighbors;":[98],"then":[99],"distance":[101],"in":[104],"cluster,":[106],"calculated":[109],"based":[110],"Spark.":[112],"experimental":[114],"show":[116],"proposed":[119],"accurate":[122],"effective":[124],"for":[125],"high":[126],"dimensional":[127],"big":[128],"data.":[129]},"counts_by_year":[{"year":2023,"cited_by_count":5},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
