{"id":"https://openalex.org/W2759894926","doi":"https://doi.org/10.15439/2017f82","title":"Preprocessing compensation techniques for improved classification of imbalanced medical datasets","display_name":"Preprocessing compensation techniques for improved classification of imbalanced medical datasets","publication_year":2017,"publication_date":"2017-09-24","ids":{"openalex":"https://openalex.org/W2759894926","doi":"https://doi.org/10.15439/2017f82","mag":"2759894926"},"language":"en","primary_location":{"id":"doi:10.15439/2017f82","is_oa":true,"landing_page_url":"https://doi.org/10.15439/2017f82","pdf_url":"https://annals-csis.org/proceedings/2017/drp/pdf/82.pdf","source":{"id":"https://openalex.org/S4220651875","display_name":"Annals of Computer Science and Information Systems","issn_l":"2300-5963","issn":["2300-5963"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":"https://openalex.org/P4310317484","host_organization_name":"Polskie Towarzystwo Informatyczne","host_organization_lineage":["https://openalex.org/P4310317484"],"host_organization_lineage_names":["Polskie Towarzystwo Informatyczne"],"type":"conference"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Annals of Computer Science and Information Systems","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://annals-csis.org/proceedings/2017/drp/pdf/82.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5057494227","display_name":"Agnieszka Wosiak","orcid":"https://orcid.org/0000-0001-6124-1236"},"institutions":[{"id":"https://openalex.org/I188884621","display_name":"Lodz University of Technology","ror":"https://ror.org/00s8fpf52","country_code":"PL","type":"education","lineage":["https://openalex.org/I188884621"]}],"countries":["PL"],"is_corresponding":true,"raw_author_name":"Agnieszka Wosiak","raw_affiliation_strings":["Lodz University of Technology Institute of Information Technology ul. Wolczanska 215 90-924 Lodz, Poland"],"affiliations":[{"raw_affiliation_string":"Lodz University of Technology Institute of Information Technology ul. Wolczanska 215 90-924 Lodz, Poland","institution_ids":["https://openalex.org/I188884621"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5068011437","display_name":"Sylwia Karbowiak","orcid":null},"institutions":[{"id":"https://openalex.org/I188884621","display_name":"Lodz University of Technology","ror":"https://ror.org/00s8fpf52","country_code":"PL","type":"education","lineage":["https://openalex.org/I188884621"]}],"countries":["PL"],"is_corresponding":false,"raw_author_name":"Sylwia Karbowiak","raw_affiliation_strings":["Lodz University of Technology Institute of Information Technology ul. Wolczanska 215 90-924 Lodz, Poland"],"affiliations":[{"raw_affiliation_string":"Lodz University of Technology Institute of Information Technology ul. Wolczanska 215 90-924 Lodz, Poland","institution_ids":["https://openalex.org/I188884621"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5057494227"],"corresponding_institution_ids":["https://openalex.org/I188884621"],"apc_list":null,"apc_paid":null,"fwci":0.5192,"has_fulltext":true,"cited_by_count":11,"citation_normalized_percentile":{"value":0.73139598,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":"11","issue":null,"first_page":"203","last_page":"211"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11396","display_name":"Artificial Intelligence in Healthcare","score":0.9868000149726868,"subfield":{"id":"https://openalex.org/subfields/3605","display_name":"Health Information Management"},"field":{"id":"https://openalex.org/fields/36","display_name":"Health Professions"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.968500018119812,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/preprocessor","display_name":"Preprocessor","score":0.8124603033065796},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7666580677032471},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6122023463249207},{"id":"https://openalex.org/keywords/resampling","display_name":"Resampling","score":0.607891857624054},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.5763139724731445},{"id":"https://openalex.org/keywords/multiclass-classification","display_name":"Multiclass classification","score":0.542790412902832},{"id":"https://openalex.org/keywords/data-pre-processing","display_name":"Data pre-processing","score":0.5153967142105103},{"id":"https://openalex.org/keywords/statistical-classification","display_name":"Statistical classification","score":0.5064476728439331},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.49717190861701965},{"id":"https://openalex.org/keywords/binary-classification","display_name":"Binary classification","score":0.49156007170677185},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.4640231728553772},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4587097764015198},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.2803490161895752}],"concepts":[{"id":"https://openalex.org/C34736171","wikidata":"https://www.wikidata.org/wiki/Q918333","display_name":"Preprocessor","level":2,"score":0.8124603033065796},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7666580677032471},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6122023463249207},{"id":"https://openalex.org/C150921843","wikidata":"https://www.wikidata.org/wiki/Q1170431","display_name":"Resampling","level":2,"score":0.607891857624054},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5763139724731445},{"id":"https://openalex.org/C123860398","wikidata":"https://www.wikidata.org/wiki/Q6934605","display_name":"Multiclass classification","level":3,"score":0.542790412902832},{"id":"https://openalex.org/C10551718","wikidata":"https://www.wikidata.org/wiki/Q5227332","display_name":"Data pre-processing","level":2,"score":0.5153967142105103},{"id":"https://openalex.org/C110083411","wikidata":"https://www.wikidata.org/wiki/Q1744628","display_name":"Statistical classification","level":2,"score":0.5064476728439331},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.49717190861701965},{"id":"https://openalex.org/C66905080","wikidata":"https://www.wikidata.org/wiki/Q17005494","display_name":"Binary classification","level":3,"score":0.49156007170677185},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.4640231728553772},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4587097764015198},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.2803490161895752}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.15439/2017f82","is_oa":true,"landing_page_url":"https://doi.org/10.15439/2017f82","pdf_url":"https://annals-csis.org/proceedings/2017/drp/pdf/82.pdf","source":{"id":"https://openalex.org/S4220651875","display_name":"Annals of Computer Science and Information Systems","issn_l":"2300-5963","issn":["2300-5963"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":"https://openalex.org/P4310317484","host_organization_name":"Polskie Towarzystwo Informatyczne","host_organization_lineage":["https://openalex.org/P4310317484"],"host_organization_lineage_names":["Polskie Towarzystwo Informatyczne"],"type":"conference"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Annals of Computer Science and Information Systems","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.15439/2017f82","is_oa":true,"landing_page_url":"https://doi.org/10.15439/2017f82","pdf_url":"https://annals-csis.org/proceedings/2017/drp/pdf/82.pdf","source":{"id":"https://openalex.org/S4220651875","display_name":"Annals of Computer Science and Information Systems","issn_l":"2300-5963","issn":["2300-5963"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":"https://openalex.org/P4310317484","host_organization_name":"Polskie Towarzystwo Informatyczne","host_organization_lineage":["https://openalex.org/P4310317484"],"host_organization_lineage_names":["Polskie Towarzystwo Informatyczne"],"type":"conference"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Annals of Computer Science and Information Systems","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2759894926.pdf","grobid_xml":"https://content.openalex.org/works/W2759894926.grobid-xml"},"referenced_works_count":33,"referenced_works":["https://openalex.org/W129457532","https://openalex.org/W1013989637","https://openalex.org/W1596339832","https://openalex.org/W1835740130","https://openalex.org/W1954721612","https://openalex.org/W1965895350","https://openalex.org/W1996020380","https://openalex.org/W2015452969","https://openalex.org/W2070390828","https://openalex.org/W2070808135","https://openalex.org/W2088059023","https://openalex.org/W2090135786","https://openalex.org/W2110118110","https://openalex.org/W2111164709","https://openalex.org/W2114968414","https://openalex.org/W2115114820","https://openalex.org/W2118978333","https://openalex.org/W2136903812","https://openalex.org/W2148143831","https://openalex.org/W2164341120","https://openalex.org/W2186874741","https://openalex.org/W2226725405","https://openalex.org/W2310231101","https://openalex.org/W2337518838","https://openalex.org/W2471037569","https://openalex.org/W2505283872","https://openalex.org/W2514173981","https://openalex.org/W2526705631","https://openalex.org/W2577222694","https://openalex.org/W2584414757","https://openalex.org/W2602330513","https://openalex.org/W2614183994","https://openalex.org/W6737563499"],"related_works":["https://openalex.org/W4376528628","https://openalex.org/W1537592868","https://openalex.org/W2470590370","https://openalex.org/W3176009750","https://openalex.org/W3207192536","https://openalex.org/W2910954186","https://openalex.org/W1748436461","https://openalex.org/W2002271516","https://openalex.org/W2014610539","https://openalex.org/W3172103400"],"abstract_inverted_index":{"The":[0,19,63,90],"paper":[1],"describes":[2],"the":[3,6,22,42,46,57,85,123],"study":[4,91],"on":[5,67,82],"problem":[7],"of":[8,21,48,55,101,125],"applying":[9],"classification":[10,31,86,108,137],"techniques":[11],"in":[12],"medical":[13],"datasets":[14,58,69,96,115],"with":[15,87,116],"a":[16,99,102,107],"class":[17,52],"imbalance.":[18],"aim":[20],"research":[23],"is":[24],"to":[25,40],"identify":[26],"factors":[27],"that":[28,36,93],"negatively":[29],"affect":[30],"results":[32],"and":[33,50,61,72,84,106,136],"propose":[34],"actions":[35],"may":[37,129],"be":[38,130],"taken":[39],"improve":[41],"performance.":[43],"To":[44],"alleviate":[45],"impact":[47],"uneven":[49],"complex":[51,117],"distribution,":[53],"methods":[54,80],"balancing":[56],"are":[59],"proposed":[60],"compared.":[62],"experiments":[64],"were":[65],"conducted":[66],"five":[68],"-three":[70],"binary":[71],"two":[73],"multiclass.":[74],"They":[75],"comprise":[76],"several":[77],"data":[78,83],"preprocessing":[79,104],"applied":[81],"different":[88],"techniques.":[89],"shows":[92],"for":[94],"some":[95],"there":[97],"exists":[98],"combination":[100],"certain":[103],"method":[105,135],"technique":[109,138],"which":[110],"outperforms":[111],"other":[112],"approaches.":[113],"For":[114],"distribution":[118],"or":[119],"too":[120],"many":[121],"features":[122],"ratio":[124],"correctly":[126],"predicted":[127],"labels":[128],"low":[131],"regardless":[132],"what":[133],"resampling":[134],"has":[139],"been":[140],"applied.":[141]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
