{"id":"https://openalex.org/W4417339059","doi":"https://doi.org/10.1109/ictai66417.2025.00180","title":"Reliable Brain Tumor Classification Without Metadata: A Step-by-Step Guideline with Duplicate Removal","display_name":"Reliable Brain Tumor Classification Without Metadata: A Step-by-Step Guideline with Duplicate Removal","publication_year":2025,"publication_date":"2025-11-03","ids":{"openalex":"https://openalex.org/W4417339059","doi":"https://doi.org/10.1109/ictai66417.2025.00180"},"language":null,"primary_location":{"id":"doi:10.1109/ictai66417.2025.00180","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ictai66417.2025.00180","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE 37th International Conference on Tools with Artificial Intelligence (ICTAI)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5119867753","display_name":"Mohiuddin Saifullah","orcid":null},"institutions":[{"id":"https://openalex.org/I75917431","display_name":"Nara Institute of Science and Technology","ror":"https://ror.org/05bhada84","country_code":"JP","type":"education","lineage":["https://openalex.org/I75917431"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Mohiuddin Saifullah","raw_affiliation_strings":["Nara Institute of Science and Technology,Data-driven Biology,Nara,Japan"],"affiliations":[{"raw_affiliation_string":"Nara Institute of Science and Technology,Data-driven Biology,Nara,Japan","institution_ids":["https://openalex.org/I75917431"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037742021","display_name":"Daniel Baldauf","orcid":"https://orcid.org/0000-0001-5764-506X"},"institutions":[{"id":"https://openalex.org/I193223587","display_name":"University of Trento","ror":"https://ror.org/05trd4x28","country_code":"IT","type":"education","lineage":["https://openalex.org/I193223587"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Daniel Baldauf","raw_affiliation_strings":["University of Trento,CIMeC,Department of Psychology and Cognitive Science,Trento,Italy"],"affiliations":[{"raw_affiliation_string":"University of Trento,CIMeC,Department of Psychology and Cognitive Science,Trento,Italy","institution_ids":["https://openalex.org/I193223587"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5003925893","display_name":"Yuichi Sakumura","orcid":"https://orcid.org/0000-0003-0065-2239"},"institutions":[{"id":"https://openalex.org/I75917431","display_name":"Nara Institute of Science and Technology","ror":"https://ror.org/05bhada84","country_code":"JP","type":"education","lineage":["https://openalex.org/I75917431"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Yuichi Sakumura","raw_affiliation_strings":["Nara Institute of Science and Technology,Data-driven Biology,Nara,Japan"],"affiliations":[{"raw_affiliation_string":"Nara Institute of Science and Technology,Data-driven Biology,Nara,Japan","institution_ids":["https://openalex.org/I75917431"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5119867753"],"corresponding_institution_ids":["https://openalex.org/I75917431"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.45677419,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1237","last_page":"1244"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12702","display_name":"Brain Tumor Detection and Classification","score":0.4223000109195709,"subfield":{"id":"https://openalex.org/subfields/2808","display_name":"Neurology"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T12702","display_name":"Brain Tumor Detection and Classification","score":0.4223000109195709,"subfield":{"id":"https://openalex.org/subfields/2808","display_name":"Neurology"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10429","display_name":"EEG and Brain-Computer Interfaces","score":0.08609999716281891,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10129","display_name":"Glioma Diagnosis and Treatment","score":0.06769999861717224,"subfield":{"id":"https://openalex.org/subfields/2716","display_name":"Genetics"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/guideline","display_name":"Guideline","score":0.5541999936103821},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.3885999917984009},{"id":"https://openalex.org/keywords/brain-tumor","display_name":"Brain tumor","score":0.3869999945163727},{"id":"https://openalex.org/keywords/data-sharing","display_name":"Data sharing","score":0.3382999897003174},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.31209999322891235},{"id":"https://openalex.org/keywords/clinical-practice","display_name":"Clinical Practice","score":0.3012999892234802},{"id":"https://openalex.org/keywords/risk-stratification","display_name":"Risk stratification","score":0.296999990940094}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6324999928474426},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5598000288009644},{"id":"https://openalex.org/C2780182762","wikidata":"https://www.wikidata.org/wiki/Q1630279","display_name":"Guideline","level":2,"score":0.5541999936103821},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.43880000710487366},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4277999997138977},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.39320001006126404},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.3885999917984009},{"id":"https://openalex.org/C2779130545","wikidata":"https://www.wikidata.org/wiki/Q233309","display_name":"Brain tumor","level":2,"score":0.3869999945163727},{"id":"https://openalex.org/C2779965156","wikidata":"https://www.wikidata.org/wiki/Q5227350","display_name":"Data sharing","level":3,"score":0.3382999897003174},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.31209999322891235},{"id":"https://openalex.org/C2779974597","wikidata":"https://www.wikidata.org/wiki/Q28448986","display_name":"Clinical Practice","level":2,"score":0.3012999892234802},{"id":"https://openalex.org/C3020404979","wikidata":"https://www.wikidata.org/wiki/Q1058438","display_name":"Risk stratification","level":2,"score":0.296999990940094},{"id":"https://openalex.org/C58489278","wikidata":"https://www.wikidata.org/wiki/Q1172284","display_name":"Data set","level":2,"score":0.289000004529953},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.28780001401901245},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.27970001101493835},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.27129998803138733},{"id":"https://openalex.org/C99138194","wikidata":"https://www.wikidata.org/wiki/Q183427","display_name":"Hash function","level":2,"score":0.26809999346733093},{"id":"https://openalex.org/C19527891","wikidata":"https://www.wikidata.org/wiki/Q1120908","display_name":"Medical physics","level":1,"score":0.2646999955177307},{"id":"https://openalex.org/C72634772","wikidata":"https://www.wikidata.org/wiki/Q386824","display_name":"Data integration","level":2,"score":0.2630999982357025},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.262800008058548},{"id":"https://openalex.org/C16910744","wikidata":"https://www.wikidata.org/wiki/Q7705759","display_name":"Test data","level":2,"score":0.2590999901294708},{"id":"https://openalex.org/C47487241","wikidata":"https://www.wikidata.org/wiki/Q5227230","display_name":"Data access","level":2,"score":0.25380000472068787},{"id":"https://openalex.org/C71472368","wikidata":"https://www.wikidata.org/wiki/Q676880","display_name":"Text mining","level":2,"score":0.2531000077724457}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ictai66417.2025.00180","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ictai66417.2025.00180","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE 37th International Conference on Tools with Artificial Intelligence (ICTAI)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F2083928842","display_name":"Centro Interdipartimentale Mente/Cervello, Universit\u00e0 degli Studi di Trento","ror":null},{"id":"https://openalex.org/F4320315716","display_name":"Nara Institute of Science and Technology","ror":"https://ror.org/05bhada84"},{"id":"https://openalex.org/F4320322275","display_name":"Universit\u00e0 degli Studi di Trento","ror":"https://ror.org/05trd4x28"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":15,"referenced_works":["https://openalex.org/W2101807845","https://openalex.org/W2559975580","https://openalex.org/W2963255684","https://openalex.org/W2992703694","https://openalex.org/W3182952703","https://openalex.org/W4224271142","https://openalex.org/W4281682624","https://openalex.org/W4298140399","https://openalex.org/W4377989430","https://openalex.org/W4387849447","https://openalex.org/W4399534613","https://openalex.org/W4399984712","https://openalex.org/W4406681871","https://openalex.org/W4407392585","https://openalex.org/W4410228127"],"related_works":[],"abstract_inverted_index":{"Accurate":[0],"brain":[1,193],"tumor":[2,194],"classification":[3],"with":[4,105,154],"deep":[5],"learning":[6],"can":[7,89],"significantly":[8],"support":[9],"diagnosis":[10],"and":[11,27,38,82,95,102,108,139,149,152,165],"treatment":[12],"planning.":[13],"While":[14],"publicly":[15,57],"available":[16,58],"datasets":[17,46,73],"have":[18],"greatly":[19],"advanced":[20],"research,":[21],"they":[22],"often":[23],"lack":[24],"crucial":[25],"clinical":[26],"demographic":[28],"metadata,":[29],"making":[30],"it":[31],"difficult":[32],"to":[33,44,54,80,169,180],"implement":[34],"proper":[35],"data":[36,163,178],"splitting":[37],"safeguard":[39],"against":[40],"information":[41],"leakage.":[42],"Access":[43],"hospital-sourced":[45],"remains":[47],"extremely":[48],"limited,":[49],"so":[50],"the":[51,145,159],"community":[52],"continues":[53],"rely":[55],"on":[56],"imaging":[59],"datasets.":[60],"In":[61],"this":[62],"work,":[63],"we":[64,97,143],"propose":[65],"a":[66,112,121],"practical,":[67],"step-by-step":[68],"guideline":[69],"for":[70],"using":[71,147],"such":[72],"responsibly.":[74],"We":[75,126,175],"apply":[76],"perceptual":[77],"hashing":[78],"(pHash)":[79],"detect":[81],"remove":[83],"duplicate":[84],"or":[85],"near-duplicate":[86],"images,":[87],"which":[88],"otherwise":[90],"inflate":[91],"performance.":[92],"Using":[93],"EfficientNetB0":[94],"InceptionV3,":[96],"compare":[98],"model":[99,146],"performance":[100],"before":[101],"after":[103],"de-duplication":[104],"stratified":[106],"splits":[107],"nested":[109,118,150],"cross-validation.":[110],"Despite":[111],"slight":[113],"drop":[114],"in":[115,189],"test":[116],"accuracy,":[117],"validation":[119,173],"reveals":[120],"clearer":[122],"picture":[123],"of":[124,161],"generalizability.":[125],"also":[127,176],"report":[128],"detailed":[129],"metrics":[130],"including":[131],"F2-score,":[132],"MCC,":[133],"CSI,":[134],"PR":[135],"AUC,":[136],"Cohen's":[137],"Kappa,":[138],"Log":[140],"Loss.":[141],"Finally,":[142],"evaluated":[144],"k-fold":[148],"crossvalidation,":[151],"interpreted":[153],"LIME.":[155],"Our":[156],"study":[157],"highlights":[158],"importance":[160],"addressing":[162],"leakage":[164,182],"encourages":[166],"future":[167],"researchers":[168],"adopt":[170],"more":[171],"rigorous":[172],"practices.":[174],"urge":[177],"providers":[179],"consider":[181],"risks":[183],"when":[184],"sharing":[185],"medical":[186],"datasets,":[187],"especially":[188],"sensitive":[190],"domains":[191],"like":[192],"analysis.":[195]},"counts_by_year":[],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-12-15T00:00:00"}
