{"id":"https://openalex.org/W7077467261","doi":"https://doi.org/10.48550/arxiv.2508.16224","title":"Self-Validated Learning for Particle Separation: A Correctness-Based Self-Training Framework Without Human Labels","display_name":"Self-Validated Learning for Particle Separation: A Correctness-Based Self-Training Framework Without Human Labels","publication_year":2025,"publication_date":"2025-08-22","ids":{"openalex":"https://openalex.org/W7077467261","doi":"https://doi.org/10.48550/arxiv.2508.16224"},"language":"en","primary_location":{"id":"doi:10.48550/arxiv.2508.16224","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2508.16224","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2508.16224","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"L\u00f6sel, Philipp D.","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"L\u00f6sel, Philipp D.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Barron, Aleese","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Barron, Aleese","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Zhang, Yulai","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Yulai","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Fabian, Matthias","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fabian, Matthias","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Young, Benjamin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Young, Benjamin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Francois, Nicolas","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Francois, Nicolas","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Kingston, Andrew M.","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kingston, Andrew M.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":true,"primary_topic":{"id":"https://openalex.org/T12157","display_name":"Geochemistry and Geologic Mapping","score":0.6316999793052673,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12157","display_name":"Geochemistry and Geologic Mapping","score":0.6316999793052673,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13067","display_name":"Geological Modeling and Analysis","score":0.024399999529123306,"subfield":{"id":"https://openalex.org/subfields/1906","display_name":"Geochemistry and Petrology"},"field":{"id":"https://openalex.org/fields/19","display_name":"Earth and Planetary Sciences"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14311","display_name":"Electrical and Electromagnetic Research","score":0.023000000044703484,"subfield":{"id":"https://openalex.org/subfields/3107","display_name":"Atomic and Molecular Physics, and Optics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.6820999979972839},{"id":"https://openalex.org/keywords/ground-truth","display_name":"Ground truth","score":0.5727999806404114},{"id":"https://openalex.org/keywords/boundary","display_name":"Boundary (topology)","score":0.5404000282287598},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5386000275611877},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.5347999930381775},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.47749999165534973},{"id":"https://openalex.org/keywords/supervised-learning","display_name":"Supervised learning","score":0.42570000886917114},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.39739999175071716},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.38510000705718994}],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7382000088691711},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.6820999979972839},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6741999983787537},{"id":"https://openalex.org/C146849305","wikidata":"https://www.wikidata.org/wiki/Q370766","display_name":"Ground truth","level":2,"score":0.5727999806404114},{"id":"https://openalex.org/C62354387","wikidata":"https://www.wikidata.org/wiki/Q875399","display_name":"Boundary (topology)","level":2,"score":0.5404000282287598},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5386000275611877},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.5347999930381775},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.49779999256134033},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.47749999165534973},{"id":"https://openalex.org/C136389625","wikidata":"https://www.wikidata.org/wiki/Q334384","display_name":"Supervised learning","level":3,"score":0.42570000886917114},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.39739999175071716},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.38510000705718994},{"id":"https://openalex.org/C2778517922","wikidata":"https://www.wikidata.org/wiki/Q7140482","display_name":"Particle (ecology)","level":2,"score":0.38449999690055847},{"id":"https://openalex.org/C58489278","wikidata":"https://www.wikidata.org/wiki/Q1172284","display_name":"Data set","level":2,"score":0.3628000020980835},{"id":"https://openalex.org/C151201525","wikidata":"https://www.wikidata.org/wiki/Q177239","display_name":"Limit (mathematics)","level":2,"score":0.350600004196167},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.3228999972343445},{"id":"https://openalex.org/C65885262","wikidata":"https://www.wikidata.org/wiki/Q7429708","display_name":"Scale-space segmentation","level":4,"score":0.31940001249313354},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.31529998779296875},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3084999918937683},{"id":"https://openalex.org/C83248878","wikidata":"https://www.wikidata.org/wiki/Q344000","display_name":"Active appearance model","level":3,"score":0.3021000027656555},{"id":"https://openalex.org/C150547873","wikidata":"https://www.wikidata.org/wiki/Q947851","display_name":"Watershed","level":2,"score":0.2930999994277954},{"id":"https://openalex.org/C177774035","wikidata":"https://www.wikidata.org/wiki/Q1246948","display_name":"Granularity","level":2,"score":0.290800005197525},{"id":"https://openalex.org/C20556612","wikidata":"https://www.wikidata.org/wiki/Q4469374","display_name":"Volume (thermodynamics)","level":2,"score":0.28540000319480896},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2847999930381775},{"id":"https://openalex.org/C2908647359","wikidata":"https://www.wikidata.org/wiki/Q2625603","display_name":"Population","level":2,"score":0.27970001101493835},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.2702000141143799},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.2621999979019165},{"id":"https://openalex.org/C31601959","wikidata":"https://www.wikidata.org/wiki/Q931309","display_name":"Medical imaging","level":2,"score":0.2551000118255615}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2508.16224","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2508.16224","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2508.16224","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2508.16224","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Non-destructive":[0],"3D":[1],"imaging":[2],"of":[3,32,52,125,135,154,169],"large":[4],"multi-particulate":[5],"samples":[6],"is":[7,199],"essential":[8],"for":[9,91,99,184],"quantifying":[10],"particle-level":[11],"properties,":[12],"such":[13],"as":[14,188],"size,":[15],"shape,":[16],"and":[17,26,44,76,108,159],"spatial":[18],"distribution,":[19],"across":[20,122],"applications":[21],"in":[22,34,166],"mining,":[23],"materials":[24],"science,":[25],"geology.":[27],"However,":[28],"accurate":[29],"instance":[30,93,194],"segmentation":[31,94,195],"particles":[33,116,165],"tomographic":[35,167],"data":[36],"remains":[37],"challenging":[38],"due":[39],"to":[40,78],"high":[41],"morphological":[42],"variability":[43],"frequent":[45],"particle":[46,92,157],"contact,":[47],"which":[48],"limit":[49],"the":[50,97,111,126,133,155,173,182,202],"effectiveness":[51],"classical":[53],"methods":[54],"like":[55],"watershed":[56],"algorithms.":[57],"While":[58],"supervised":[59],"deep":[60],"learning":[61,140],"approaches":[62],"offer":[63],"improved":[64],"performance,":[65],"they":[66],"rely":[67],"on":[68],"extensive":[69],"annotated":[70],"datasets":[71],"that":[72,95,117],"are":[73],"labor-intensive,":[74],"error-prone,":[75],"difficult":[77],"scale.":[79],"In":[80],"this":[81],"work,":[82],"we":[83],"propose":[84],"self-validated":[85],"learning,":[86],"a":[87],"novel":[88],"self-training":[89],"framework":[90,174],"eliminates":[96],"need":[98,183],"manual":[100],"annotations.":[101],"Our":[102],"method":[103,198],"leverages":[104],"implicit":[105],"boundary":[106],"detection":[107],"iteratively":[109],"refines":[110],"training":[112],"set":[113],"by":[114],"identifying":[115],"can":[118],"be":[119],"consistently":[120],"matched":[121],"reshuffled":[123],"scans":[124,168],"same":[127],"sample.":[128],"This":[129],"self-validation":[130],"mechanism":[131],"mitigates":[132],"impact":[134],"noisy":[136],"pseudo-labels,":[137],"enabling":[138],"robust":[139],"from":[141],"unlabeled":[142],"data.":[143],"After":[144],"just":[145],"three":[146],"iterations,":[147],"our":[148],"approach":[149],"accurately":[150],"segments":[151],"over":[152],"97%":[153],"total":[156],"volume":[158],"identifies":[160],"more":[161],"than":[162],"54,000":[163],"individual":[164],"quartz":[170],"fragments.":[171],"Importantly,":[172],"also":[175],"enables":[176],"fully":[177],"autonomous":[178],"model":[179],"evaluation":[180],"without":[181],"ground":[185],"truth":[186],"annotations,":[187],"confirmed":[189],"through":[190],"comparisons":[191],"with":[192],"state-of-the-art":[193],"techniques.":[196],"The":[197],"integrated":[200],"into":[201],"Biomedisa":[203],"image":[204],"analysis":[205],"platform":[206],"(https://github.com/biomedisa/biomedisa/).":[207]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
