{"id":"https://openalex.org/W2741444967","doi":"https://doi.org/10.3390/informatics4030024","title":"Big Data Management with Incremental K-Means Trees\u2013GPU-Accelerated Construction and Visualization","display_name":"Big Data Management with Incremental K-Means Trees\u2013GPU-Accelerated Construction and Visualization","publication_year":2017,"publication_date":"2017-07-28","ids":{"openalex":"https://openalex.org/W2741444967","doi":"https://doi.org/10.3390/informatics4030024","mag":"2741444967"},"language":"en","primary_location":{"id":"doi:10.3390/informatics4030024","is_oa":true,"landing_page_url":"https://doi.org/10.3390/informatics4030024","pdf_url":"https://www.mdpi.com/2227-9709/4/3/24/pdf?version=1501247188","source":{"id":"https://openalex.org/S2738238905","display_name":"Informatics","issn_l":"2227-9709","issn":["2227-9709"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Informatics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.mdpi.com/2227-9709/4/3/24/pdf?version=1501247188","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5012387700","display_name":"Jun Wang","orcid":"https://orcid.org/0000-0002-7334-0490"},"institutions":[{"id":"https://openalex.org/I59553526","display_name":"Stony Brook University","ror":"https://ror.org/05qghxh33","country_code":"US","type":"education","lineage":["https://openalex.org/I59553526"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jun Wang","raw_affiliation_strings":["Visual Analytics and Imaging Lab, Computer Science Department, Stony Brook University, Stony Brook, NY 11794, USA"],"affiliations":[{"raw_affiliation_string":"Visual Analytics and Imaging Lab, Computer Science Department, Stony Brook University, Stony Brook, NY 11794, USA","institution_ids":["https://openalex.org/I59553526"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047588154","display_name":"Alla Zelenyuk","orcid":"https://orcid.org/0000-0002-0674-0910"},"institutions":[{"id":"https://openalex.org/I4210139016","display_name":"Material Sciences (United States)","ror":"https://ror.org/046v9f126","country_code":"US","type":"company","lineage":["https://openalex.org/I4210139016"]},{"id":"https://openalex.org/I142606810","display_name":"Pacific Northwest National Laboratory","ror":"https://ror.org/05h992307","country_code":"US","type":"facility","lineage":["https://openalex.org/I1325736334","https://openalex.org/I1330989302","https://openalex.org/I142606810","https://openalex.org/I39565521"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Alla Zelenyuk","raw_affiliation_strings":["Chemical and Material Sciences Division, Pacific Northwest National Laboratory, Richland, WA 99352, USA"],"affiliations":[{"raw_affiliation_string":"Chemical and Material Sciences Division, Pacific Northwest National Laboratory, Richland, WA 99352, USA","institution_ids":["https://openalex.org/I142606810","https://openalex.org/I4210139016"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109177988","display_name":"Dan Imre","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dan Imre","raw_affiliation_strings":["Imre Consulting, Richland, WA 99352, USA"],"affiliations":[{"raw_affiliation_string":"Imre Consulting, Richland, WA 99352, USA","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5070670810","display_name":"Klaus Mueller","orcid":"https://orcid.org/0000-0002-0996-8590"},"institutions":[{"id":"https://openalex.org/I59553526","display_name":"Stony Brook University","ror":"https://ror.org/05qghxh33","country_code":"US","type":"education","lineage":["https://openalex.org/I59553526"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Klaus Mueller","raw_affiliation_strings":["Visual Analytics and Imaging Lab, Computer Science Department, Stony Brook University, Stony Brook, NY 11794, USA"],"affiliations":[{"raw_affiliation_string":"Visual Analytics and Imaging Lab, Computer Science Department, Stony Brook University, Stony Brook, NY 11794, USA","institution_ids":["https://openalex.org/I59553526"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5070670810"],"corresponding_institution_ids":["https://openalex.org/I59553526"],"apc_list":{"value":1600,"currency":"CHF","value_usd":1732},"apc_paid":{"value":1600,"currency":"CHF","value_usd":1732},"fwci":0.4625,"has_fulltext":true,"cited_by_count":11,"citation_normalized_percentile":{"value":0.72921905,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":"4","issue":"3","first_page":"24","last_page":"24"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10799","display_name":"Data Visualization and Analytics","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10799","display_name":"Data Visualization and Analytics","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12292","display_name":"Graph Theory and Algorithms","score":0.9898999929428101,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8045575618743896},{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.724705696105957},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6913793087005615},{"id":"https://openalex.org/keywords/cuda","display_name":"CUDA","score":0.5765286684036255},{"id":"https://openalex.org/keywords/hierarchy","display_name":"Hierarchy","score":0.5680676698684692},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.5655914545059204},{"id":"https://openalex.org/keywords/dimensionality-reduction","display_name":"Dimensionality reduction","score":0.5572559833526611},{"id":"https://openalex.org/keywords/tree","display_name":"Tree (set theory)","score":0.5132179260253906},{"id":"https://openalex.org/keywords/analytics","display_name":"Analytics","score":0.4977989196777344},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4910752773284912},{"id":"https://openalex.org/keywords/data-visualization","display_name":"Data visualization","score":0.4446898102760315},{"id":"https://openalex.org/keywords/data-management","display_name":"Data management","score":0.4129839241504669},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.4014281630516052},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.34699904918670654},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.3115256428718567},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.24461013078689575},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.19458836317062378},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.09614193439483643}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8045575618743896},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.724705696105957},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6913793087005615},{"id":"https://openalex.org/C2778119891","wikidata":"https://www.wikidata.org/wiki/Q477690","display_name":"CUDA","level":2,"score":0.5765286684036255},{"id":"https://openalex.org/C31170391","wikidata":"https://www.wikidata.org/wiki/Q188619","display_name":"Hierarchy","level":2,"score":0.5680676698684692},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.5655914545059204},{"id":"https://openalex.org/C70518039","wikidata":"https://www.wikidata.org/wiki/Q16000077","display_name":"Dimensionality reduction","level":2,"score":0.5572559833526611},{"id":"https://openalex.org/C113174947","wikidata":"https://www.wikidata.org/wiki/Q2859736","display_name":"Tree (set theory)","level":2,"score":0.5132179260253906},{"id":"https://openalex.org/C79158427","wikidata":"https://www.wikidata.org/wiki/Q485396","display_name":"Analytics","level":2,"score":0.4977989196777344},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4910752773284912},{"id":"https://openalex.org/C172367668","wikidata":"https://www.wikidata.org/wiki/Q6504956","display_name":"Data visualization","level":3,"score":0.4446898102760315},{"id":"https://openalex.org/C1668388","wikidata":"https://www.wikidata.org/wiki/Q1149776","display_name":"Data management","level":2,"score":0.4129839241504669},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.4014281630516052},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.34699904918670654},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.3115256428718567},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.24461013078689575},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.19458836317062378},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.09614193439483643},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C34447519","wikidata":"https://www.wikidata.org/wiki/Q179522","display_name":"Market economy","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.3390/informatics4030024","is_oa":true,"landing_page_url":"https://doi.org/10.3390/informatics4030024","pdf_url":"https://www.mdpi.com/2227-9709/4/3/24/pdf?version=1501247188","source":{"id":"https://openalex.org/S2738238905","display_name":"Informatics","issn_l":"2227-9709","issn":["2227-9709"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Informatics","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:d8e71ef0d2004dcc9b7b96742a3767a0","is_oa":true,"landing_page_url":"https://doaj.org/article/d8e71ef0d2004dcc9b7b96742a3767a0","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Informatics, Vol 4, Iss 3, p 24 (2017)","raw_type":"article"},{"id":"pmh:oai:mdpi.com:/2227-9709/4/3/24/","is_oa":true,"landing_page_url":"https://dx.doi.org/10.3390/informatics4030024","pdf_url":null,"source":{"id":"https://openalex.org/S4306400947","display_name":"MDPI (MDPI AG)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210097602","host_organization_name":"Multidisciplinary Digital Publishing Institute (Switzerland)","host_organization_lineage":["https://openalex.org/I4210097602"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Informatics; Volume 4; Issue 3; Pages: 24","raw_type":"Text"}],"best_oa_location":{"id":"doi:10.3390/informatics4030024","is_oa":true,"landing_page_url":"https://doi.org/10.3390/informatics4030024","pdf_url":"https://www.mdpi.com/2227-9709/4/3/24/pdf?version=1501247188","source":{"id":"https://openalex.org/S2738238905","display_name":"Informatics","issn_l":"2227-9709","issn":["2227-9709"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Informatics","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","score":0.4699999988079071,"id":"https://metadata.un.org/sdg/9"}],"awards":[{"id":"https://openalex.org/G1671782611","display_name":null,"funder_award_id":"DE-AC06-76RL0","funder_id":"https://openalex.org/F4320338354","funder_display_name":"Pacific Northwest National Laboratory"},{"id":"https://openalex.org/G5195000505","display_name":null,"funder_award_id":"Geosciences","funder_id":"https://openalex.org/F4320332359","funder_display_name":"Office of Science"},{"id":"https://openalex.org/G5576501225","display_name":null,"funder_award_id":"1527200","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G6343642018","display_name":null,"funder_award_id":"IIS 1527200","funder_id":"https://openalex.org/F4320322065","funder_display_name":"National IT Industry Promotion Agency"},{"id":"https://openalex.org/G7908228807","display_name":null,"funder_award_id":"Molecular","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G8055749809","display_name":null,"funder_award_id":"IIS 1527200","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G8062368548","display_name":null,"funder_award_id":"IIS 1527200","funder_id":"https://openalex.org/F4320322030","funder_display_name":"Ministry of Science, ICT and Future Planning"},{"id":"https://openalex.org/G8414908677","display_name":null,"funder_award_id":"DE-AC0","funder_id":"https://openalex.org/F4320306084","funder_display_name":"U.S. Department of Energy"},{"id":"https://openalex.org/G848032724","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320306084","display_name":"U.S. Department of Energy","ror":"https://ror.org/01bj3aw27"},{"id":"https://openalex.org/F4320306250","display_name":"Battelle","ror":"https://ror.org/01h5tnr73"},{"id":"https://openalex.org/F4320322030","display_name":"Ministry of Science, ICT and Future Planning","ror":"https://ror.org/032e49973"},{"id":"https://openalex.org/F4320322065","display_name":"National IT Industry Promotion Agency","ror":"https://ror.org/026v53e29"},{"id":"https://openalex.org/F4320332359","display_name":"Office of Science","ror":"https://ror.org/00mmn6b08"},{"id":"https://openalex.org/F4320337480","display_name":"Basic Energy Sciences","ror":"https://ror.org/05mg91w61"},{"id":"https://openalex.org/F4320338354","display_name":"Pacific Northwest National Laboratory","ror":"https://ror.org/05h992307"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2741444967.pdf","grobid_xml":"https://content.openalex.org/works/W2741444967.grobid-xml"},"referenced_works_count":35,"referenced_works":["https://openalex.org/W191714665","https://openalex.org/W1566114229","https://openalex.org/W1673310716","https://openalex.org/W1977496278","https://openalex.org/W1995450389","https://openalex.org/W1996510517","https://openalex.org/W2015381165","https://openalex.org/W2015449696","https://openalex.org/W2016728733","https://openalex.org/W2022014952","https://openalex.org/W2024668293","https://openalex.org/W2042932437","https://openalex.org/W2049633694","https://openalex.org/W2057923756","https://openalex.org/W2071321484","https://openalex.org/W2086504823","https://openalex.org/W2095897464","https://openalex.org/W2099253838","https://openalex.org/W2110122118","https://openalex.org/W2111920879","https://openalex.org/W2118411523","https://openalex.org/W2118558147","https://openalex.org/W2127218421","https://openalex.org/W2128017662","https://openalex.org/W2131174057","https://openalex.org/W2141585940","https://openalex.org/W2155893237","https://openalex.org/W2164967414","https://openalex.org/W2165558283","https://openalex.org/W2187089797","https://openalex.org/W2950094539","https://openalex.org/W4247105055","https://openalex.org/W6633857196","https://openalex.org/W6656074177","https://openalex.org/W6679055200"],"related_works":["https://openalex.org/W3062287","https://openalex.org/W2380390332","https://openalex.org/W2742145873","https://openalex.org/W4245975140","https://openalex.org/W2062253548","https://openalex.org/W4225414539","https://openalex.org/W4289522463","https://openalex.org/W1977763331","https://openalex.org/W4318483369","https://openalex.org/W2368291996"],"abstract_inverted_index":{"While":[0],"big":[1,58,172],"data":[2,10,59,76],"is":[3,26,51,137,156],"revolutionizing":[4],"scientific":[5],"research,":[6],"the":[7,24,29,34,37,42,45,48,54,66,95,103,115,124,127,130,146,176,183],"tasks":[8],"of":[9,44,47,75,117,126,132],"management":[11],"and":[12,129,155,182,191],"analytics":[13],"are":[14,68,185],"becoming":[15],"more":[16],"challenging":[17],"than":[18],"ever.":[19],"One":[20],"way":[21],"to":[22,27,72,143,171],"remit":[23],"difficulty":[25],"obtain":[28],"multilevel":[30],"hierarchy":[31,38,67],"embedded":[32],"in":[33,57,84,105],"data.":[35,99,173],"Knowing":[36],"enables":[39],"not":[40,70],"only":[41],"revelation":[43],"nature":[46],"data,":[49],"it":[50,166],"also":[52,138],"often":[53],"first":[55],"step":[56],"analytics.":[60],"However,":[61],"current":[62],"algorithms":[63],"for":[64,93],"learning":[65],"typically":[69],"scalable":[71,91],"large":[73],"volumes":[74],"with":[77,109,158,178,187],"high":[78],"dimensionality.":[79],"To":[80],"tackle":[81],"this":[82,85],"challenge,":[83],"paper,":[86],"we":[87],"propose":[88],"a":[89,106,141,152],"new":[90],"approach":[92],"constructing":[94],"tree":[96,104,128],"structure":[97],"from":[98],"Our":[100],"method":[101],"builds":[102],"bottom-up":[107],"manner,":[108],"adapted":[110],"incremental":[111],"k-means.":[112],"By":[113],"referencing":[114],"distribution":[116],"point":[118],"distances,":[119],"one":[120],"can":[121,167],"flexibly":[122],"control":[123],"height":[125],"branching":[131],"each":[133],"node.":[134],"Dimension":[135],"reduction":[136],"conducted":[139],"as":[140],"pre-process,":[142],"further":[144],"boost":[145],"computing":[147],"efficiency.":[148],"The":[149],"algorithm":[150,177],"takes":[151],"parallel":[153],"design":[154],"implemented":[157],"CUDA":[159],"(Compute":[160],"Unified":[161],"Device":[162],"Architecture),":[163],"so":[164],"that":[165],"be":[168],"efficiently":[169],"applied":[170],"We":[174],"test":[175],"two":[179],"real-world":[180],"datasets,":[181],"results":[184],"visualized":[186],"extended":[188],"circular":[189],"dendrograms":[190],"other":[192],"visualization":[193],"techniques.":[194]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":2}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2017-08-08T00:00:00"}
