{"id":"https://openalex.org/W4393886628","doi":"https://doi.org/10.5281/zenodo.5578330","title":"Fuzzy Overclustering","display_name":"Fuzzy Overclustering","publication_year":2021,"publication_date":"2021-10-05","ids":{"openalex":"https://openalex.org/W4393886628","doi":"https://doi.org/10.5281/zenodo.5578330"},"language":"en","primary_location":{"id":"pmh:oai:zenodo.org:5578330","is_oa":true,"landing_page_url":"https://zenodo.org/record/5578330","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Sensors 21","raw_type":"info:eu-repo/semantics/other"},"type":"dataset","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://zenodo.org/record/5578330","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5022955518","display_name":"Lars Schmarje","orcid":"https://orcid.org/0000-0002-6945-5957"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Schmarje, Lars","raw_affiliation_strings":[],"raw_orcid":"https://orcid.org/0000-0002-6945-5957","affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022128365","display_name":"Johannes Br\u00fcnger","orcid":"https://orcid.org/0000-0002-5118-145X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Br\u00fcnger, Johannes","raw_affiliation_strings":[],"raw_orcid":"https://orcid.org/0000-0002-5118-145X","affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074395199","display_name":"Monty Santarossa","orcid":"https://orcid.org/0000-0002-4159-1367"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Santarossa, Monty","raw_affiliation_strings":[],"raw_orcid":"https://orcid.org/0000-0002-4159-1367","affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067670733","display_name":"Simon\u2010Martin Schr\u00f6der","orcid":"https://orcid.org/0000-0002-6603-9907"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Schr\u00f6der, Simon-Martin","raw_affiliation_strings":[],"raw_orcid":"https://orcid.org/0000-0002-6603-9907","affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059058911","display_name":"Rainer Kiko","orcid":"https://orcid.org/0000-0002-7851-9107"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kiko, Rainer","raw_affiliation_strings":[],"raw_orcid":"https://orcid.org/0000-0002-7851-9107","affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5040944275","display_name":"Reinhard Koch","orcid":"https://orcid.org/0000-0003-4398-1569"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Koch, Reinhard","raw_affiliation_strings":[],"raw_orcid":"https://orcid.org/0000-0003-4398-1569","affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5022955518"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11891","display_name":"Big Data and Business Intelligence","score":0.5163000226020813,"subfield":{"id":"https://openalex.org/subfields/1404","display_name":"Management Information Systems"},"field":{"id":"https://openalex.org/fields/14","display_name":"Business, Management and Accounting"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11891","display_name":"Big Data and Business Intelligence","score":0.5163000226020813,"subfield":{"id":"https://openalex.org/subfields/1404","display_name":"Management Information Systems"},"field":{"id":"https://openalex.org/fields/14","display_name":"Business, Management and Accounting"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.42781826853752136}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.42781826853752136}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:zenodo.org:5578330","is_oa":true,"landing_page_url":"https://zenodo.org/record/5578330","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Sensors 21","raw_type":"info:eu-repo/semantics/other"},{"id":"doi:10.5281/zenodo.5578330","is_oa":true,"landing_page_url":"https://doi.org/10.5281/zenodo.5578330","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"dataset"}],"best_oa_location":{"id":"pmh:oai:zenodo.org:5578330","is_oa":true,"landing_page_url":"https://zenodo.org/record/5578330","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Sensors 21","raw_type":"info:eu-repo/semantics/other"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W2382290278","https://openalex.org/W2478288626","https://openalex.org/W4391913857","https://openalex.org/W2350741829","https://openalex.org/W2530322880"],"abstract_inverted_index":{"The":[0,25,120,130,141,220,269,303,417,481,506,545,581,597,614,624],"datasets":[1,110],"used":[2,106,174,340,368,383,589,598],"for":[3,376,492,514,606,616,626],"the":[4,19,33,105,112,117,158,175,205,208,211,241,247,250,257,288,315,334,354,362,391,436,439,450,455,470,474,477,510,524,527,534,567,588,617,627],"paper":[5,393,569],"\"Fuzzy":[6],"Overclustering:":[7,65],"Semi-supervised":[8],"classification":[9],"of":[10,68,137,181,223,240,256,261,287,306,326,405,438,454,476,484],"fuzzy":[11,468,489,543],"labels":[12,600],"with":[13,71,111,145,414],"overclustering":[14],"and":[15,32,47,50,53,56,59,73,108,151,213,318,343,378,407,424,449,469,487,495,538,556,585,594],"inverse":[16],"cross-entropy\"":[17],"in":[18,197,295,309,519,530],"open":[20],"access":[21],"journal":[22],"Sensors":[23],"(https://doi.org/10.3390/s21196661).":[24],"source":[26],"code":[27],"is":[28,185,225,402,431,441,457,466,473,518,601,611,620,630],"available":[29,187,355],"at":[30,35,193],"https://github.com/Emprime/FuzzyOverclustering":[31],"preprint":[34],"https://arxiv.org/abs/2110.06630":[36],".":[37],"<br>":[38,102,126,129,396,399,572,575],"Please":[39],"cite":[40],"as":[41,369,433,553,622,632],"<pre><code>@Article{Schmarje2021foc,":[42],"AUTHOR":[43],"=":[44,63,77,80,83,86,89,92,96,99],"{Schmarje,":[45],"Lars":[46],"Br\u00fcnger,":[48],"Johannes":[49],"Santarossa,":[51],"Monty":[52],"Schr\u00f6der,":[54],"Simon-Martin":[55],"Kiko,":[57],"Rainer":[58],"Koch,":[60],"Reinhard},":[61],"TITLE":[62],"{Fuzzy":[64],"Semi-Supervised":[66],"Classification":[67],"Fuzzy":[69,546],"Labels":[70],"Overclustering":[72],"Inverse":[74],"Cross-Entropy},":[75],"JOURNAL":[76],"{Sensors},":[78],"VOLUME":[79],"{21},":[81],"YEAR":[82],"{2021},":[84],"NUMBER":[85],"{19},":[87],"ARTICLE-NUMBER":[88],"{6661},":[90],"URL":[91],"{https://www.mdpi.com/1424-8220/21/19/6661;":[93],"https://doi.org/10.5281/zenodo.5550919},":[94],"ISSN":[95],"{1424-8220},":[97],"DOI":[98],"{10.3390/s21196661}":[100],"}</code></pre>":[101],"We":[103,173,313,339,349,499],"provide":[104],"plankton":[107,131,618],"synthetic":[109,628],"following":[113],"explanations":[114],"summarized":[115],"from":[116,353,533],"above-mentioned":[118],"paper.":[119],"technical":[121],"descriptions":[122],"are":[123,152,214,272,331,367,421],"given":[124,602],"below.":[125],"<strong>Plankton":[127],"Dataset</strong><br>":[128],"dataset":[132,290,304,401,482],"contains":[133],"diverse":[134],"grey-level":[135],"images":[136,142,230,308,330,346,352,366,375,491,552],"marine":[138],"planktonic":[139],"organisms.":[140],"were":[143,380],"captured":[144],"an":[146,540],"Underwater":[147],"Vision":[148],"Profiler":[149],"5":[150],"hosted":[153],"on":[154,361,410],"EcoTaxa":[155],"(https://ecotaxa.obs-vlfr.fr/).":[156],"In":[157],"citizen":[159,171],"science":[160],"project":[161],"PlanktonID":[162,224,262,289],"(https://planktonid.geomar.de/en),":[163],"each":[164,607],"sample":[165],"was":[166],"classified":[167],"multiple":[168],"times":[169],"by":[170,178,274],"scientists.":[172],"data":[176,356,497,555,590,619,629],"generated":[177,273],"version":[179,184,198,222],"two":[180],"PlanktonID.":[182],"This":[183,400],"only":[186,548],"to":[188,216,245,252,297,333],"users":[189],"which":[190,517],"have":[191,291],"done":[192],"least":[194],"1000":[195,488],"annotations":[196],"one.":[199],"Therefore,":[200],"we":[201,382],"can":[202,231],"assume":[203],"that":[204],"annotators":[206,359],"know":[207],"differences":[209],"between":[210],"classes":[212,243,259,286,317,322,325,420,529],"dedicated":[215],"creating":[217],"consistent":[218],"results.":[219],"second":[221],"a":[226,264,275,279,403,411,558,603],"game":[227],"where":[228,357],"example":[229],"be":[232,283],"sorted":[233],"into":[234],"three":[235,300,501],"proposed":[236,242],"classes.":[237,312,480],"If":[238,372],"none":[239],"seem":[244],"fit,":[246],"user":[248],"has":[249],"option":[251],"select":[253],"any":[254],"other":[255,329,365,464],"28":[258,311],"(https://planktonid.geomar.de/en/classes)":[260],"(including":[263],"'no":[265,336],"fitting":[266,337],"category'":[267],"class).":[268],"initial":[270],"proposals":[271],"neural":[276],"network,":[277],"hence,":[278],"confirmation":[280],"bias":[281],"might":[282],"introduced.":[284],"Some":[285],"very":[292],"few":[293],"examples":[294],"comparison":[296],"others":[298],"(e.g.":[299,323],"single":[301],"images).<br>":[302],"consists":[305,483],"12,280":[307],"originally":[310],"picked":[314,532],"largest":[316],"merged":[319],"some":[320],"smaller":[321],"different":[324,415],"detritus).":[327],"All":[328,364],"assigned":[332],"class":[335],"category'.":[338],"400":[341],"training":[342,377,554,560],"200":[344],"validation":[345,379,494],"per":[347],"class.":[348],"selected":[350],"these":[351],"all":[358],"agreed":[360],"label.":[363],"unlabeled":[370,496,586],"data.":[371],"not":[373,521],"enough":[374],"available,":[381],"random":[384],"duplicates.<br>":[385],"For":[386,523,562],"more":[387,563],"details":[388,564],"please":[389,565],"see":[390,566],"main":[392,451,568],"(":[394,570],"https://doi.org/10.3390/s21196661).<br>":[395,571],"<strong>Synthetic":[397],"Datasets</strong><br>":[398],"mixture":[404],"circles":[406,426],"ellipses":[408],"(bubbles)":[409],"black":[412],"background":[413],"colors.":[416],"6":[418,478],"ground-truth":[419,471,479,512,528,535,599],"blue,":[422],"red":[423],"green":[425],"or":[427,446,460],"ellipses.":[428],"An":[429],"image":[430,516,610],"defined":[432,500],"certain":[434,486,550],"if":[435],"hue":[437],"color":[440],"0":[442],"(red),":[443],"120":[444],"(green)":[445],"240":[447],"(blue)":[448],"axis":[452],"ratio":[453],"bubble":[456],"1":[458],"(circle)":[459],"2":[461],"(ellipse).":[462],"Every":[463],"datapoint":[465],"considered":[467],"label":[472,513,536],"interpolation":[475],"1800":[485],"labeled":[490,551],"train,":[493,583],"split.<br>":[498],"subsets:":[502],"Ideal,":[503],"Real,":[504],"Fuzzy.":[505],"Ideal":[507],"subset":[508,547],"uses":[509,549],"majority":[511],"every":[515],"Reality":[520],"available.":[522],"Real":[525],"subset,":[526],"randomly":[531],"distribution":[537],"represent":[539,557,587],"noisy":[541],"/":[542],"annotation.":[544],"cleaned":[559],"dataset.<br>":[561],"<strong>Technical":[573],"description</strong><br>":[574],"Each":[576,609],"folder":[577,604],"represents":[578],"one":[579,612],"dataset.":[580],"subfolders":[582],"val":[584],"splits":[591],"Training,":[592],"Validation":[593],"Unlabeled":[595],"respectively.":[596],"name":[605],"image.":[608],"datapoint.<br>":[613],"filename":[615,625],"structured":[621,631],"&lt;CLASS&gt;-&lt;ECOTAXA_ID&gt;.png<br>":[623],"&lt;SAMPLE<em>COUNTER&gt;-&lt;HUE</em>VALUE&gt;-&lt;AXIS_RATIO&gt;.png":[633]},"counts_by_year":[],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
