{"id":"https://openalex.org/W3216043206","doi":"https://doi.org/10.1145/3474842","title":"Significant DBSCAN+: Statistically Robust Density-based Clustering","display_name":"Significant DBSCAN+: Statistically Robust Density-based Clustering","publication_year":2021,"publication_date":"2021-10-31","ids":{"openalex":"https://openalex.org/W3216043206","doi":"https://doi.org/10.1145/3474842","mag":"3216043206"},"language":"en","primary_location":{"id":"doi:10.1145/3474842","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3474842","pdf_url":null,"source":{"id":"https://openalex.org/S2492086750","display_name":"ACM Transactions on Intelligent Systems and Technology","issn_l":"2157-6904","issn":["2157-6904","2157-6912"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Intelligent Systems and Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5049041437","display_name":"Yiqun Xie","orcid":"https://orcid.org/0000-0002-6439-1333"},"institutions":[{"id":"https://openalex.org/I66946132","display_name":"University of Maryland, College Park","ror":"https://ror.org/047s2c258","country_code":"US","type":"education","lineage":["https://openalex.org/I66946132"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Yiqun Xie","raw_affiliation_strings":["University of Maryland, College Park, MD"],"affiliations":[{"raw_affiliation_string":"University of Maryland, College Park, MD","institution_ids":["https://openalex.org/I66946132"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001445783","display_name":"Xiaowei Jia","orcid":"https://orcid.org/0000-0001-8544-5233"},"institutions":[{"id":"https://openalex.org/I170201317","display_name":"University of Pittsburgh","ror":"https://ror.org/01an3r305","country_code":"US","type":"education","lineage":["https://openalex.org/I170201317"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xiaowei Jia","raw_affiliation_strings":["University of Pittsburgh, S. Bouquet Street Pittsburgh, PA"],"affiliations":[{"raw_affiliation_string":"University of Pittsburgh, S. Bouquet Street Pittsburgh, PA","institution_ids":["https://openalex.org/I170201317"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037233397","display_name":"Shashi Shekhar","orcid":"https://orcid.org/0000-0001-8837-192X"},"institutions":[{"id":"https://openalex.org/I130238516","display_name":"University of Minnesota","ror":"https://ror.org/017zqws13","country_code":"US","type":"education","lineage":["https://openalex.org/I130238516"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Shashi Shekhar","raw_affiliation_strings":["University of Minnesota, Minneapolis, MN"],"affiliations":[{"raw_affiliation_string":"University of Minnesota, Minneapolis, MN","institution_ids":["https://openalex.org/I130238516"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050161940","display_name":"Han Bao","orcid":"https://orcid.org/0000-0002-0109-8260"},"institutions":[{"id":"https://openalex.org/I126307644","display_name":"University of Iowa","ror":"https://ror.org/036jqmy94","country_code":"US","type":"education","lineage":["https://openalex.org/I126307644"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Han Bao","raw_affiliation_strings":["University of Iowa, Iowa City, IA"],"affiliations":[{"raw_affiliation_string":"University of Iowa, Iowa City, IA","institution_ids":["https://openalex.org/I126307644"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5086198510","display_name":"Xun Zhou","orcid":"https://orcid.org/0000-0003-4930-6572"},"institutions":[{"id":"https://openalex.org/I126307644","display_name":"University of Iowa","ror":"https://ror.org/036jqmy94","country_code":"US","type":"education","lineage":["https://openalex.org/I126307644"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xun Zhou","raw_affiliation_strings":["University of Iowa, Iowa City, IA"],"affiliations":[{"raw_affiliation_string":"University of Iowa, Iowa City, IA","institution_ids":["https://openalex.org/I126307644"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5049041437"],"corresponding_institution_ids":["https://openalex.org/I66946132"],"apc_list":null,"apc_paid":null,"fwci":1.3442,"has_fulltext":false,"cited_by_count":17,"citation_normalized_percentile":{"value":0.81359338,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":"12","issue":"5","first_page":"1","last_page":"26"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11819","display_name":"Data-Driven Disease Surveillance","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/2713","display_name":"Epidemiology"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},"topics":[{"id":"https://openalex.org/T11819","display_name":"Data-Driven Disease Surveillance","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/2713","display_name":"Epidemiology"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T10637","display_name":"Advanced Clustering Algorithms Research","score":0.9952999949455261,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9883000254631042,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/dbscan","display_name":"DBSCAN","score":0.8785510659217834},{"id":"https://openalex.org/keywords/spurious-relationship","display_name":"Spurious relationship","score":0.8487868309020996},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8192508220672607},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.7264240980148315},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.5452819466590881},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4856947362422943},{"id":"https://openalex.org/keywords/randomness","display_name":"Randomness","score":0.4121703505516052},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4097459018230438},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.2950236201286316},{"id":"https://openalex.org/keywords/correlation-clustering","display_name":"Correlation clustering","score":0.20193693041801453},{"id":"https://openalex.org/keywords/cure-data-clustering-algorithm","display_name":"CURE data clustering algorithm","score":0.15876775979995728},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1437138319015503},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.14133891463279724}],"concepts":[{"id":"https://openalex.org/C46576248","wikidata":"https://www.wikidata.org/wiki/Q1114630","display_name":"DBSCAN","level":5,"score":0.8785510659217834},{"id":"https://openalex.org/C97256817","wikidata":"https://www.wikidata.org/wiki/Q1462316","display_name":"Spurious relationship","level":2,"score":0.8487868309020996},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8192508220672607},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.7264240980148315},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5452819466590881},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4856947362422943},{"id":"https://openalex.org/C125112378","wikidata":"https://www.wikidata.org/wiki/Q176640","display_name":"Randomness","level":2,"score":0.4121703505516052},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4097459018230438},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2950236201286316},{"id":"https://openalex.org/C94641424","wikidata":"https://www.wikidata.org/wiki/Q5172845","display_name":"Correlation clustering","level":3,"score":0.20193693041801453},{"id":"https://openalex.org/C33704608","wikidata":"https://www.wikidata.org/wiki/Q5014717","display_name":"CURE data clustering algorithm","level":4,"score":0.15876775979995728},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1437138319015503},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.14133891463279724}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3474842","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3474842","pdf_url":null,"source":{"id":"https://openalex.org/S2492086750","display_name":"ACM Transactions on Intelligent Systems and Technology","issn_l":"2157-6904","issn":["2157-6904","2157-6912"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Intelligent Systems and Technology","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1061045358","display_name":null,"funder_award_id":"HM0476-20-1-0009","funder_id":"https://openalex.org/F4320306078","funder_display_name":"U.S. Department of Defense"},{"id":"https://openalex.org/G3198493938","display_name":null,"funder_award_id":"G21AC10207","funder_id":"https://openalex.org/F4320332183","funder_display_name":"U.S. Geological Survey"},{"id":"https://openalex.org/G6156412566","display_name":null,"funder_award_id":"DE-AR0000795","funder_id":"https://openalex.org/F4320306084","funder_display_name":"U.S. Department of Energy"},{"id":"https://openalex.org/G7112848026","display_name":null,"funder_award_id":"2017-51181-27222","funder_id":"https://openalex.org/F4320306114","funder_display_name":"U.S. Department of Agriculture"}],"funders":[{"id":"https://openalex.org/F4320306078","display_name":"U.S. Department of Defense","ror":"https://ror.org/0447fe631"},{"id":"https://openalex.org/F4320306084","display_name":"U.S. Department of Energy","ror":"https://ror.org/01bj3aw27"},{"id":"https://openalex.org/F4320306114","display_name":"U.S. Department of Agriculture","ror":"https://ror.org/01na82s61"},{"id":"https://openalex.org/F4320332183","display_name":"U.S. Geological Survey","ror":"https://ror.org/035a68863"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":38,"referenced_works":["https://openalex.org/W151377110","https://openalex.org/W1128809682","https://openalex.org/W1601727326","https://openalex.org/W1850843018","https://openalex.org/W1977536776","https://openalex.org/W1979089718","https://openalex.org/W2002151188","https://openalex.org/W2015709235","https://openalex.org/W2022444941","https://openalex.org/W2042659752","https://openalex.org/W2083772019","https://openalex.org/W2085897675","https://openalex.org/W2092799168","https://openalex.org/W2113991440","https://openalex.org/W2122745150","https://openalex.org/W2132914434","https://openalex.org/W2139978280","https://openalex.org/W2141585940","https://openalex.org/W2153233077","https://openalex.org/W2157811729","https://openalex.org/W2180566385","https://openalex.org/W2336500050","https://openalex.org/W2586878559","https://openalex.org/W2749238013","https://openalex.org/W2807603574","https://openalex.org/W2944696257","https://openalex.org/W2963214893","https://openalex.org/W2967908858","https://openalex.org/W3008739840","https://openalex.org/W3041697790","https://openalex.org/W3084063858","https://openalex.org/W3096860278","https://openalex.org/W3103180971","https://openalex.org/W3128193561","https://openalex.org/W4213245422","https://openalex.org/W4300672471","https://openalex.org/W4402160737","https://openalex.org/W6785760900"],"related_works":["https://openalex.org/W2162899405","https://openalex.org/W3176449234","https://openalex.org/W2807508722","https://openalex.org/W2353158678","https://openalex.org/W2767235736","https://openalex.org/W4225278791","https://openalex.org/W2045002201","https://openalex.org/W2971352445","https://openalex.org/W4322502698","https://openalex.org/W2604015980"],"abstract_inverted_index":{"Cluster":[0],"detection":[1,251],"is":[2,51,208],"important":[3],"and":[4,18,38,57,67,73,83,99,121,158,259,282,293],"widely":[5],"used":[6],"in":[7,80,223,255],"a":[8,22,77,85,130,153,166,181,186,209,277],"variety":[9],"of":[10,24,87,113,132,146,156,174,177,185,205,248,264,270],"applications,":[11],"including":[12],"public":[13,15],"health,":[14],"safety,":[16],"transportation,":[17],"so":[19],"on.":[20],"Given":[21],"collection":[23],"data":[25,81],"points,":[26],"we":[27,179,201],"aim":[28],"to":[29,92,124,192,218,231,273],"detect":[30,93],"density-connected":[31],"spatial":[32],"clusters":[33,45,68,94,127,195],"with":[34,95],"varying":[35,74,97],"geometric":[36],"shapes":[37,72,98],"densities,":[39],"under":[40],"the":[41,44,110,136,144,172,214,233,245,262,283,288],"constraint":[42],"that":[43,196,212,239],"are":[46,122,197],"statistically":[47,182],"significant.":[48],"The":[49],"problem":[50],"challenging,":[52],"because":[53],"many":[54,159],"societal":[55],"applications":[56],"domain":[58],"science":[59],"studies":[60],"have":[61,70,89],"low":[62],"tolerance":[63],"for":[64,290],"spurious":[65,126,147,265,271],"results,":[66,148],"may":[69],"arbitrary":[71],"densities.":[75],"As":[76,200],"classical":[78],"topic":[79],"mining":[82],"learning,":[84],"myriad":[86],"techniques":[88,115,222],"been":[90],"developed":[91],"both":[96,175,291],"densities":[100],"(e.g.,":[101,252,267],"density-based,":[102],"hierarchical,":[103],"spectral,":[104],"or":[105,275],"deep":[106],"clustering":[107,221],"methods).":[108],"However,":[109],"vast":[111],"majority":[112],"these":[114],"do":[116],"not":[117],"consider":[118],"statistical":[119,206],"rigor":[120,207],"susceptible":[123],"detecting":[125],"formed":[128],"as":[129,165],"result":[131],"natural":[133],"randomness.":[134],"On":[135],"other":[137],"hand,":[138],"scan":[139],"statistic":[140],"approaches":[141],"explicitly":[142],"control":[143],"rate":[145,247,263],"but":[149],"they":[150],"typically":[151],"assume":[152],"single":[154],"\u201chotspot\u201d":[155],"over-density":[157],"rely":[160],"on":[161],"further":[162],"assumptions":[163],"such":[164],"tessellated":[167],"input":[168],"space.":[169],"To":[170],"unite":[171],"strengths":[173],"lines":[176],"work,":[178],"propose":[180,228],"robust":[183],"formulation":[184],"multi-scale":[187],"DBSCAN,":[188],"namely":[189],"Significant":[190,216,240],"DBSCAN+,":[191],"identify":[193],"significant":[194],"density":[198],"connected.":[199],"will":[202],"show,":[203],"incorporation":[204],"powerful":[210],"mechanism":[211],"allows":[213],"new":[215],"DBSCAN+":[217,241],"outperform":[219],"state-of-the-art":[220],"various":[224],"scenarios.":[225],"We":[226],"also":[227],"computational":[229],"enhancements":[230],"speed-up":[232],"proposed":[234],"approach.":[235],"Experiment":[236],"results":[237,266],"show":[238],"can":[242,286],"simultaneously":[243],"improve":[244,287],"success":[246],"true":[249],"cluster":[250],"10\u201320%":[253],"increases":[254],"absolute":[256],"F1":[257],"scores)":[258],"substantially":[260],"reduce":[261],"from":[268],"thousands/hundreds":[269],"detections":[272],"none":[274],"just":[276],"few":[278],"across":[279],"100":[280],"datasets),":[281],"acceleration":[284],"methods":[285],"efficiency":[289],"clustered":[292],"non-clustered":[294],"data.":[295]},"counts_by_year":[{"year":2025,"cited_by_count":8},{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
