{"id":"https://openalex.org/W6906577855","doi":"https://doi.org/10.18420/muc2021-mci-ws02-284","title":"How can Small Data Sets be Clustered?","display_name":"How can Small Data Sets be Clustered?","publication_year":2021,"publication_date":"2021-01-01","ids":{"openalex":"https://openalex.org/W6906577855","doi":"https://doi.org/10.18420/muc2021-mci-ws02-284"},"language":"en","primary_location":{"id":"pmh:oai:opus.hs-emden-leer.de:850","is_oa":false,"landing_page_url":"https://opus.hs-emden-leer.de/frontdoor/index/index/docId/850","pdf_url":null,"source":{"id":"https://openalex.org/S7407053446","display_name":"Hochschulschriftenserver der Hochschule Emden/Leer","issn_l":null,"issn":[],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"doc-type:conferenceObject"},"type":"article","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.18420/muc2021-mci-ws02-284","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Weigand, Anna Christina","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Weigand, Anna Christina","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Lange, Daniel","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lange, Daniel","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Rauschenberger, Maria","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rauschenberger, Maria","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.4079,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.70652504,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":95},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":true,"primary_topic":{"id":"https://openalex.org/T10637","display_name":"Advanced Clustering Algorithms Research","score":0.22380000352859497,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10637","display_name":"Advanced Clustering Algorithms Research","score":0.22380000352859497,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11122","display_name":"Online Learning and Analytics","score":0.03480000048875809,"subfield":{"id":"https://openalex.org/subfields/1706","display_name":"Computer Science Applications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.02800000086426735,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.8367999792098999},{"id":"https://openalex.org/keywords/interpretability","display_name":"Interpretability","score":0.6639999747276306},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.4896000027656555},{"id":"https://openalex.org/keywords/data-stream-clustering","display_name":"Data stream clustering","score":0.476500004529953},{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.46779999136924744},{"id":"https://openalex.org/keywords/clustering-high-dimensional-data","display_name":"Clustering high-dimensional data","score":0.4666999876499176},{"id":"https://openalex.org/keywords/conceptual-clustering","display_name":"Conceptual clustering","score":0.4537999927997589},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4505000114440918},{"id":"https://openalex.org/keywords/cure-data-clustering-algorithm","display_name":"CURE data clustering algorithm","score":0.4472000002861023}],"concepts":[{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.8367999792098999},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7013000249862671},{"id":"https://openalex.org/C2781067378","wikidata":"https://www.wikidata.org/wiki/Q17027399","display_name":"Interpretability","level":2,"score":0.6639999747276306},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5530999898910522},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5257999897003174},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5041000247001648},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.4896000027656555},{"id":"https://openalex.org/C193143536","wikidata":"https://www.wikidata.org/wiki/Q5227360","display_name":"Data stream clustering","level":5,"score":0.476500004529953},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.46779999136924744},{"id":"https://openalex.org/C184509293","wikidata":"https://www.wikidata.org/wiki/Q5136711","display_name":"Clustering high-dimensional data","level":3,"score":0.4666999876499176},{"id":"https://openalex.org/C39235581","wikidata":"https://www.wikidata.org/wiki/Q5158434","display_name":"Conceptual clustering","level":5,"score":0.4537999927997589},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4505000114440918},{"id":"https://openalex.org/C33704608","wikidata":"https://www.wikidata.org/wiki/Q5014717","display_name":"CURE data clustering algorithm","level":4,"score":0.4472000002861023},{"id":"https://openalex.org/C94641424","wikidata":"https://www.wikidata.org/wiki/Q5172845","display_name":"Correlation clustering","level":3,"score":0.4431000053882599},{"id":"https://openalex.org/C58489278","wikidata":"https://www.wikidata.org/wiki/Q1172284","display_name":"Data set","level":2,"score":0.4350000023841858},{"id":"https://openalex.org/C46576248","wikidata":"https://www.wikidata.org/wiki/Q1114630","display_name":"DBSCAN","level":5,"score":0.4287000000476837},{"id":"https://openalex.org/C21080849","wikidata":"https://www.wikidata.org/wiki/Q13611879","display_name":"Data point","level":2,"score":0.41909998655319214},{"id":"https://openalex.org/C186767784","wikidata":"https://www.wikidata.org/wiki/Q5162841","display_name":"Consensus clustering","level":5,"score":0.3921999931335449},{"id":"https://openalex.org/C17212007","wikidata":"https://www.wikidata.org/wiki/Q5511111","display_name":"Fuzzy clustering","level":3,"score":0.37869998812675476},{"id":"https://openalex.org/C2779280203","wikidata":"https://www.wikidata.org/wiki/Q17121211","display_name":"Small data","level":2,"score":0.376800000667572},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.3343000113964081},{"id":"https://openalex.org/C27964816","wikidata":"https://www.wikidata.org/wiki/Q5164359","display_name":"Constrained clustering","level":5,"score":0.3287000060081482},{"id":"https://openalex.org/C104047586","wikidata":"https://www.wikidata.org/wiki/Q5033439","display_name":"Canopy clustering algorithm","level":4,"score":0.3111000061035156},{"id":"https://openalex.org/C9357733","wikidata":"https://www.wikidata.org/wiki/Q6878417","display_name":"Missing data","level":2,"score":0.3107999861240387},{"id":"https://openalex.org/C8038995","wikidata":"https://www.wikidata.org/wiki/Q1152135","display_name":"Unsupervised learning","level":2,"score":0.2687999904155731},{"id":"https://openalex.org/C111442797","wikidata":"https://www.wikidata.org/wiki/Q7291446","display_name":"Rand index","level":3,"score":0.2639999985694885},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2502000033855438}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:opus.hs-emden-leer.de:850","is_oa":false,"landing_page_url":"https://opus.hs-emden-leer.de/frontdoor/index/index/docId/850","pdf_url":null,"source":{"id":"https://openalex.org/S7407053446","display_name":"Hochschulschriftenserver der Hochschule Emden/Leer","issn_l":null,"issn":[],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"doc-type:conferenceObject"},{"id":"doi:10.18420/muc2021-mci-ws02-284","is_oa":true,"landing_page_url":"https://doi.org/10.18420/muc2021-mci-ws02-284","pdf_url":null,"source":{"id":"https://openalex.org/S7407052918","display_name":"Gesellschaft f\u00fcr Informatik (GI)","issn_l":null,"issn":[],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article-journal"}],"best_oa_location":{"id":"doi:10.18420/muc2021-mci-ws02-284","is_oa":true,"landing_page_url":"https://doi.org/10.18420/muc2021-mci-ws02-284","pdf_url":null,"source":{"id":"https://openalex.org/S7407052918","display_name":"Gesellschaft f\u00fcr Informatik (GI)","issn_l":null,"issn":[],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article-journal"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.6999978423118591,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"In":[0,23,65,103],"many":[1],"areas,":[2],"only":[3],"small":[4,32,131,165],"data":[5,11,33,82,132,166],"sets":[6,34],"are":[7,50],"available":[8],"and":[9,47,101,107,135],"big":[10],"does":[12],"not":[13,115],"play":[14],"a":[15,61,78,156],"significant":[16],"role,":[17],"e.g.,":[18,58],"in":[19,60,138],"Human-Centered":[20],"Design":[21,143],"research.":[22],"the":[24,75,161],"context":[25],"of":[26,31,77,148,163],"machine":[27,70,149],"learning":[28,71,150],"analysis,":[29],"results":[30,49],"can":[35,145],"be":[36],"biased":[37],"due":[38],"to":[39,129],"single":[40],"variables":[41],"or":[42],"missing":[43],"values.":[44],"Nevertheless,":[45],"reliable":[46],"interpretable":[48],"essential":[51],"for":[52,159],"determining":[53],"further":[54],"actions,":[55],"such":[56],"as,":[57],"treatments":[59],"health-related":[62,80],"use":[63],"case.":[64],"this":[66],"paper,":[67],"we":[68,89,123],"explore":[69],"clustering":[72,93,97,134,151,164],"algorithms":[73,94],"on":[74,120,127],"basis":[76],"small,":[79],"(variance)":[81],"set":[83,133],"about":[84],"early":[85],"dyslexia":[86],"screening.":[87],"Therefore,":[88],"selected":[90],"three":[91],"different":[92,96],"from":[95],"methods:":[98],"K-Means,":[99],"HAC":[100,108],"DBSCAN.":[102],"our":[104,121],"case,":[105],"K-Means":[106],"showed":[109],"promising":[110],"results,":[111],"while":[112],"DBSCAN":[113],"did":[114],"deliver":[116],"distinct":[117],"results.":[118,152],"Based":[119],"experiences,":[122],"provide":[124],"first":[125],"proposals":[126],"how":[128],"handle":[130],"describe":[136],"situations":[137],"which":[139],"using":[140],"Human-":[141],"Centered":[142],"methods":[144],"increase":[146],"interpretability":[147],"Our":[153],"work":[154],"represents":[155],"starting":[157],"point":[158],"discussing":[160],"topic":[162],"sets.":[167]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1}],"updated_date":"2025-11-06T06:51:31.235846","created_date":"2025-10-10T00:00:00"}
