{"id":"https://openalex.org/W2983182114","doi":"https://doi.org/10.1145/3356999.3365465","title":"Fast proximity graph generation with spark","display_name":"Fast proximity graph generation with spark","publication_year":2019,"publication_date":"2019-11-01","ids":{"openalex":"https://openalex.org/W2983182114","doi":"https://doi.org/10.1145/3356999.3365465","mag":"2983182114"},"language":"en","primary_location":{"id":"doi:10.1145/3356999.3365465","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3356999.3365465","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 8th ACM SIGSPATIAL International Workshop on Analytics for Big Geospatial Data","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5054960999","display_name":"Arjun Subramanyam Varalakshmi","orcid":null},"institutions":[{"id":"https://openalex.org/I44461941","display_name":"University of Houston","ror":"https://ror.org/048sx0r50","country_code":"US","type":"education","lineage":["https://openalex.org/I44461941"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Arjun Subramanyam Varalakshmi","raw_affiliation_strings":["The University of Houston"],"affiliations":[{"raw_affiliation_string":"The University of Houston","institution_ids":["https://openalex.org/I44461941"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100329446","display_name":"Chong Wang","orcid":"https://orcid.org/0000-0002-4286-4902"},"institutions":[{"id":"https://openalex.org/I44461941","display_name":"University of Houston","ror":"https://ror.org/048sx0r50","country_code":"US","type":"education","lineage":["https://openalex.org/I44461941"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Chong Wang","raw_affiliation_strings":["The University of Houston"],"affiliations":[{"raw_affiliation_string":"The University of Houston","institution_ids":["https://openalex.org/I44461941"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5056584154","display_name":"Christoph F. Eick","orcid":"https://orcid.org/0000-0002-6798-103X"},"institutions":[{"id":"https://openalex.org/I44461941","display_name":"University of Houston","ror":"https://ror.org/048sx0r50","country_code":"US","type":"education","lineage":["https://openalex.org/I44461941"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Christoph F. Eick","raw_affiliation_strings":["The University of Houston"],"affiliations":[{"raw_affiliation_string":"The University of Houston","institution_ids":["https://openalex.org/I44461941"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5054960999"],"corresponding_institution_ids":["https://openalex.org/I44461941"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.12372653,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"10"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10757","display_name":"Geographic Information Systems Studies","score":0.9921000003814697,"subfield":{"id":"https://openalex.org/subfields/3305","display_name":"Geography, Planning and Development"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10538","display_name":"Data Mining Algorithms and Applications","score":0.9918000102043152,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7408899068832397},{"id":"https://openalex.org/keywords/delaunay-triangulation","display_name":"Delaunay triangulation","score":0.6749907732009888},{"id":"https://openalex.org/keywords/grid","display_name":"Grid","score":0.6020293831825256},{"id":"https://openalex.org/keywords/voronoi-diagram","display_name":"Voronoi diagram","score":0.5585760474205017},{"id":"https://openalex.org/keywords/python","display_name":"Python (programming language)","score":0.556167483329773},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.5450047850608826},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.48471593856811523},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.4725976586341858},{"id":"https://openalex.org/keywords/partition","display_name":"Partition (number theory)","score":0.4576219320297241},{"id":"https://openalex.org/keywords/graph-drawing","display_name":"Graph drawing","score":0.416852742433548},{"id":"https://openalex.org/keywords/computational-science","display_name":"Computational science","score":0.3641621470451355},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.335898220539093},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.32794758677482605},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.22726041078567505},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.19010788202285767},{"id":"https://openalex.org/keywords/combinatorics","display_name":"Combinatorics","score":0.16886457800865173},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.16314315795898438},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.11500215530395508}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7408899068832397},{"id":"https://openalex.org/C68010082","wikidata":"https://www.wikidata.org/wiki/Q192445","display_name":"Delaunay triangulation","level":2,"score":0.6749907732009888},{"id":"https://openalex.org/C187691185","wikidata":"https://www.wikidata.org/wiki/Q2020720","display_name":"Grid","level":2,"score":0.6020293831825256},{"id":"https://openalex.org/C24881265","wikidata":"https://www.wikidata.org/wiki/Q757267","display_name":"Voronoi diagram","level":2,"score":0.5585760474205017},{"id":"https://openalex.org/C519991488","wikidata":"https://www.wikidata.org/wiki/Q28865","display_name":"Python (programming language)","level":2,"score":0.556167483329773},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.5450047850608826},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.48471593856811523},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.4725976586341858},{"id":"https://openalex.org/C42812","wikidata":"https://www.wikidata.org/wiki/Q1082910","display_name":"Partition (number theory)","level":2,"score":0.4576219320297241},{"id":"https://openalex.org/C112953755","wikidata":"https://www.wikidata.org/wiki/Q739462","display_name":"Graph drawing","level":3,"score":0.416852742433548},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.3641621470451355},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.335898220539093},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.32794758677482605},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.22726041078567505},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.19010788202285767},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.16886457800865173},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.16314315795898438},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.11500215530395508},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3356999.3365465","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3356999.3365465","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 8th ACM SIGSPATIAL International Workshop on Analytics for Big Geospatial Data","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/11","score":0.7200000286102295,"display_name":"Sustainable cities and communities"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":7,"referenced_works":["https://openalex.org/W1823516953","https://openalex.org/W1970754929","https://openalex.org/W2051614712","https://openalex.org/W2052165970","https://openalex.org/W2084616604","https://openalex.org/W2140027094","https://openalex.org/W6657849155"],"related_works":["https://openalex.org/W3020555194","https://openalex.org/W1481755670","https://openalex.org/W2354869996","https://openalex.org/W2359751290","https://openalex.org/W2206755844","https://openalex.org/W431872879","https://openalex.org/W2371448287","https://openalex.org/W2358109229","https://openalex.org/W2096247527","https://openalex.org/W98646666"],"abstract_inverted_index":{"Since":[0],"the":[1,11,18,85,98,106,115,123,127,135,146,152,168,240],"early":[2],"1980s,":[3],"proximity":[4,21,65,180],"graphs":[5,22,29,32,66],"have":[6],"served":[7],"as":[8,151],"one":[9,201],"of":[10,53,89,148,161,187,197,250],"classical":[12],"approaches":[13],"to":[14,63,189,217,234],"characterize":[15],"neighborhood":[16],"relationships;":[17],"most":[19],"popular":[20],"include":[23],"Delaunay":[24],"Triangulation":[25],"(DT)":[26],"and":[27,49,81,100,121,129,139,192,202,207,214,220,232,239,245],"Gabriel":[28],"(GG).":[30],"These":[31],"find":[33],"their":[34,173],"applications":[35],"in":[36],"geographical":[37],"analysis,":[38,40,48],"spatial":[39,107],"pattern":[41],"recognition,":[42],"evolutionary":[43],"biology,":[44],"computer":[45],"vision,":[46],"cluster":[47,86],"visualization.":[50],"The":[51],"emergence":[52],"big":[54],"data":[55,205],"has":[56],"created":[57],"a":[58,75,110,162,195],"need":[59],"for":[60,67,78,117,194,242,247],"scalable":[61],"algorithms":[62,183],"generate":[64],"massive":[68],"datasets.":[69],"In":[70],"this":[71],"paper,":[72],"we":[73,95,113,133,144],"propose":[74],"novel":[76],"approach":[77],"creating":[79,243],"DT":[80,116,169,191,219,231],"GG":[82,155,193],"by":[83,164],"leveraging":[84],"computing":[87],"capabilities":[88],"Apache":[90],"Spark.":[91],"To":[92],"compute":[93,114],"DT,":[94,163],"rely":[96],"on":[97,159,185,230,237],"divide":[99],"conquer":[101],"paradigm.":[102],"We":[103,177],"first":[104],"partition":[105,120],"dataset":[108],"into":[109,126],"grid;":[111],"next,":[112,132],"each":[118],"grid":[119],"separate":[122],"resulting":[124],"triangles":[125,150],"core":[128],"boundary":[130,141],"triangles;":[131,142],"merge":[134],"adjacent":[136],"partitions":[137],"recursively":[138],"recompute":[140],"finally,":[143],"return":[145],"union":[147],"obtained":[149],"final":[153],"result.":[154],"generation":[156,182],"is":[157],"implemented":[158],"top":[160,186],"removing":[165],"edges":[166],"from":[167],"not":[170],"intersected":[171],"with":[172,211],"corresponding":[174],"Voronoi":[175],"edge.":[176],"evaluate":[178],"our":[179,209],"graph":[181],"built":[184],"Spark":[188],"create":[190,218],"benchmark":[196,223],"datasets":[198,248],"having":[199],"between":[200],"thirty":[203,251],"million":[204,252],"records":[206],"compare":[208],"framework":[210],"existing":[212],"Python":[213],"R":[215],"libraries":[216],"GG.":[221],"Our":[222],"tests":[224],"showcase":[225],"significant":[226],"performance":[227],"improvements(2":[228],"times":[229,236],"up":[233],"24":[235],"GG)":[238],"capability":[241],"DTs":[244],"GGs":[246],"consisting":[249],"records.":[253]},"counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
