{"id":"https://openalex.org/W3196782388","doi":"https://doi.org/10.1080/08839514.2021.1975393","title":"A New Hybrid Under-sampling Approach to Imbalanced Classification Problems","display_name":"A New Hybrid Under-sampling Approach to Imbalanced Classification Problems","publication_year":2021,"publication_date":"2021-09-06","ids":{"openalex":"https://openalex.org/W3196782388","doi":"https://doi.org/10.1080/08839514.2021.1975393","mag":"3196782388"},"language":"en","primary_location":{"id":"doi:10.1080/08839514.2021.1975393","is_oa":true,"landing_page_url":"https://doi.org/10.1080/08839514.2021.1975393","pdf_url":"https://www.tandfonline.com/doi/pdf/10.1080/08839514.2021.1975393?needAccess=true","source":{"id":"https://openalex.org/S125501549","display_name":"Applied Artificial Intelligence","issn_l":"0883-9514","issn":["0883-9514","1087-6545"],"is_oa":false,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320547","host_organization_name":"Taylor & Francis","host_organization_lineage":["https://openalex.org/P4310320547"],"host_organization_lineage_names":["Taylor & Francis"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Applied Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://www.tandfonline.com/doi/pdf/10.1080/08839514.2021.1975393?needAccess=true","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5077813933","display_name":"Chun-Yang Peng","orcid":"https://orcid.org/0000-0002-3345-4493"},"institutions":[{"id":"https://openalex.org/I118292597","display_name":"National Taipei University of Technology","ror":"https://ror.org/00cn92c09","country_code":"TW","type":"education","lineage":["https://openalex.org/I118292597"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Chun-Yang Peng","raw_affiliation_strings":["Department of Industrial Engineering and Management, National Taipei University of Technology, Taipei, Taiwan, R.O.C"],"raw_orcid":"https://orcid.org/0000-0002-3345-4493","affiliations":[{"raw_affiliation_string":"Department of Industrial Engineering and Management, National Taipei University of Technology, Taipei, Taiwan, R.O.C","institution_ids":["https://openalex.org/I118292597"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5029786947","display_name":"You\u2010Jin Park","orcid":"https://orcid.org/0000-0002-1006-5380"},"institutions":[{"id":"https://openalex.org/I118292597","display_name":"National Taipei University of Technology","ror":"https://ror.org/00cn92c09","country_code":"TW","type":"education","lineage":["https://openalex.org/I118292597"]}],"countries":["TW"],"is_corresponding":true,"raw_author_name":"You-Jin Park","raw_affiliation_strings":["Department of Industrial Engineering and Management, National Taipei University of Technology, Taipei, Taiwan, R.O.C"],"raw_orcid":"https://orcid.org/0000-0002-1006-5380","affiliations":[{"raw_affiliation_string":"Department of Industrial Engineering and Management, National Taipei University of Technology, Taipei, Taiwan, R.O.C","institution_ids":["https://openalex.org/I118292597"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5029786947"],"corresponding_institution_ids":["https://openalex.org/I118292597"],"apc_list":{"value":2195,"currency":"USD","value_usd":2195},"apc_paid":null,"fwci":1.3991,"has_fulltext":false,"cited_by_count":18,"citation_normalized_percentile":{"value":0.8506128,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"36","issue":"1","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13429","display_name":"Electricity Theft Detection Techniques","score":0.9668999910354614,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8051722645759583},{"id":"https://openalex.org/keywords/dbscan","display_name":"DBSCAN","score":0.6957189440727234},{"id":"https://openalex.org/keywords/preprocessor","display_name":"Preprocessor","score":0.6931561827659607},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6735163927078247},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.6703779697418213},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.6638773083686829},{"id":"https://openalex.org/keywords/outlier","display_name":"Outlier","score":0.6634442806243896},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.5884914994239807},{"id":"https://openalex.org/keywords/sample","display_name":"Sample (material)","score":0.4980912208557129},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.4967663884162903},{"id":"https://openalex.org/keywords/sampling","display_name":"Sampling (signal processing)","score":0.47881871461868286},{"id":"https://openalex.org/keywords/anomaly-detection","display_name":"Anomaly detection","score":0.4477975070476532},{"id":"https://openalex.org/keywords/oversampling","display_name":"Oversampling","score":0.44767865538597107},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.44680702686309814},{"id":"https://openalex.org/keywords/local-outlier-factor","display_name":"Local outlier factor","score":0.4377976953983307},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.40626096725463867},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.15712875127792358},{"id":"https://openalex.org/keywords/fuzzy-clustering","display_name":"Fuzzy clustering","score":0.10124081373214722},{"id":"https://openalex.org/keywords/filter","display_name":"Filter (signal processing)","score":0.08833912014961243},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.06970885396003723}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8051722645759583},{"id":"https://openalex.org/C46576248","wikidata":"https://www.wikidata.org/wiki/Q1114630","display_name":"DBSCAN","level":5,"score":0.6957189440727234},{"id":"https://openalex.org/C34736171","wikidata":"https://www.wikidata.org/wiki/Q918333","display_name":"Preprocessor","level":2,"score":0.6931561827659607},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6735163927078247},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.6703779697418213},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.6638773083686829},{"id":"https://openalex.org/C79337645","wikidata":"https://www.wikidata.org/wiki/Q779824","display_name":"Outlier","level":2,"score":0.6634442806243896},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.5884914994239807},{"id":"https://openalex.org/C198531522","wikidata":"https://www.wikidata.org/wiki/Q485146","display_name":"Sample (material)","level":2,"score":0.4980912208557129},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.4967663884162903},{"id":"https://openalex.org/C140779682","wikidata":"https://www.wikidata.org/wiki/Q210868","display_name":"Sampling (signal processing)","level":3,"score":0.47881871461868286},{"id":"https://openalex.org/C739882","wikidata":"https://www.wikidata.org/wiki/Q3560506","display_name":"Anomaly detection","level":2,"score":0.4477975070476532},{"id":"https://openalex.org/C197323446","wikidata":"https://www.wikidata.org/wiki/Q331222","display_name":"Oversampling","level":3,"score":0.44767865538597107},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.44680702686309814},{"id":"https://openalex.org/C169029474","wikidata":"https://www.wikidata.org/wiki/Q387942","display_name":"Local outlier factor","level":3,"score":0.4377976953983307},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.40626096725463867},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.15712875127792358},{"id":"https://openalex.org/C17212007","wikidata":"https://www.wikidata.org/wiki/Q5511111","display_name":"Fuzzy clustering","level":3,"score":0.10124081373214722},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.08833912014961243},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.06970885396003723},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C2776257435","wikidata":"https://www.wikidata.org/wiki/Q1576430","display_name":"Bandwidth (computing)","level":2,"score":0.0},{"id":"https://openalex.org/C43617362","wikidata":"https://www.wikidata.org/wiki/Q170050","display_name":"Chromatography","level":1,"score":0.0},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C104047586","wikidata":"https://www.wikidata.org/wiki/Q5033439","display_name":"Canopy clustering algorithm","level":4,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1080/08839514.2021.1975393","is_oa":true,"landing_page_url":"https://doi.org/10.1080/08839514.2021.1975393","pdf_url":"https://www.tandfonline.com/doi/pdf/10.1080/08839514.2021.1975393?needAccess=true","source":{"id":"https://openalex.org/S125501549","display_name":"Applied Artificial Intelligence","issn_l":"0883-9514","issn":["0883-9514","1087-6545"],"is_oa":false,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320547","host_organization_name":"Taylor & Francis","host_organization_lineage":["https://openalex.org/P4310320547"],"host_organization_lineage_names":["Taylor & Francis"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Applied Artificial Intelligence","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:b7d54a104d5242ba99be2351342303a8","is_oa":false,"landing_page_url":"https://doaj.org/article/b7d54a104d5242ba99be2351342303a8","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Applied Artificial Intelligence, Vol 36, Iss 1 (2022)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1080/08839514.2021.1975393","is_oa":true,"landing_page_url":"https://doi.org/10.1080/08839514.2021.1975393","pdf_url":"https://www.tandfonline.com/doi/pdf/10.1080/08839514.2021.1975393?needAccess=true","source":{"id":"https://openalex.org/S125501549","display_name":"Applied Artificial Intelligence","issn_l":"0883-9514","issn":["0883-9514","1087-6545"],"is_oa":false,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320547","host_organization_name":"Taylor & Francis","host_organization_lineage":["https://openalex.org/P4310320547"],"host_organization_lineage_names":["Taylor & Francis"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Applied Artificial Intelligence","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3127558330","display_name":null,"funder_award_id":"MOST 110-2221-E-027-106-MY3","funder_id":"https://openalex.org/F4320322795","funder_display_name":"Ministry of Science and Technology, Taiwan"},{"id":"https://openalex.org/G7232570807","display_name":null,"funder_award_id":"110-2221-E-027-106-MY3","funder_id":"https://openalex.org/F4320322795","funder_display_name":"Ministry of Science and Technology, Taiwan"}],"funders":[{"id":"https://openalex.org/F4320322795","display_name":"Ministry of Science and Technology, Taiwan","ror":"https://ror.org/02kv4zf79"}],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3196782388.pdf"},"referenced_works_count":49,"referenced_works":["https://openalex.org/W1542796245","https://openalex.org/W1591261915","https://openalex.org/W1993576344","https://openalex.org/W2007869097","https://openalex.org/W2008286666","https://openalex.org/W2012122611","https://openalex.org/W2033184625","https://openalex.org/W2041193317","https://openalex.org/W2087240369","https://openalex.org/W2096945460","https://openalex.org/W2097521902","https://openalex.org/W2099454382","https://openalex.org/W2104167780","https://openalex.org/W2110020117","https://openalex.org/W2117672932","https://openalex.org/W2118978333","https://openalex.org/W2128965734","https://openalex.org/W2132791018","https://openalex.org/W2144182447","https://openalex.org/W2148143831","https://openalex.org/W2170314592","https://openalex.org/W2286152596","https://openalex.org/W2320075934","https://openalex.org/W2338318698","https://openalex.org/W2534295610","https://openalex.org/W2538771869","https://openalex.org/W2548061775","https://openalex.org/W2562319768","https://openalex.org/W2592842236","https://openalex.org/W2612634114","https://openalex.org/W2736435690","https://openalex.org/W2740924709","https://openalex.org/W2767106145","https://openalex.org/W2807198477","https://openalex.org/W2891398562","https://openalex.org/W2899434936","https://openalex.org/W2908465383","https://openalex.org/W2916113523","https://openalex.org/W2916913565","https://openalex.org/W2943284727","https://openalex.org/W2946096271","https://openalex.org/W3005483246","https://openalex.org/W3014524176","https://openalex.org/W3022206528","https://openalex.org/W3040102849","https://openalex.org/W3046141163","https://openalex.org/W3119102269","https://openalex.org/W3120625981","https://openalex.org/W3173198409"],"related_works":["https://openalex.org/W2499612753","https://openalex.org/W2770832849","https://openalex.org/W3111802945","https://openalex.org/W205872183","https://openalex.org/W114119537","https://openalex.org/W4240627425","https://openalex.org/W2761705761","https://openalex.org/W2912112202","https://openalex.org/W4377236448","https://openalex.org/W2946096271"],"abstract_inverted_index":{"Among":[0],"many":[1],"machine":[2],"learning":[3],"applications,":[4],"classification":[5,13,36,57,67,78,100],"is":[6,29,46,114],"one":[7],"of":[8,24,120,223,233,247],"the":[9,19,22,34,77,93,166,171,175,181,190,195,199,203,210,221,224,238,245,248,252],"important":[10],"tasks.":[11],"Most":[12],"algorithms":[14],"have":[15],"been":[16],"designed":[17],"under":[18],"assumption":[20],"that":[21,90,134],"number":[23],"samples":[25,89,150,169,187,213,218,225,235],"for":[26],"each":[27],"class":[28,42,95,149,259],"approximately":[30],"balanced.":[31],"However,":[32],"if":[33],"conventional":[35],"approaches":[37],"are":[38,215],"applied":[39],"to":[40,48,75,92,146,184,193],"a":[41,53,106],"imbalanced":[43,66],"dataset,":[44],"it":[45],"likely":[47],"cause":[49],"misclassification":[50],"and,":[51],"as":[52,126,128,226],"result,":[54],"may":[55,98],"distort":[56],"performance":[58],"results.":[59],"Thus,":[60],"in":[61,170],"this":[62],"study,":[63],"we":[64,82,104,163,179,207,230],"consider":[65],"problems":[68],"and":[69,87,130,140,160,188,243],"adopt":[70],"an":[71],"efficient":[72],"preprocessing":[73],"technique":[74],"improve":[76],"performances.":[79],"In":[80],"particular,":[81],"focus":[83],"on":[84,116,143,198],"borderline":[85,136,157,167],"noise":[86,123,129,137,168],"outlier":[88,131,186],"belong":[91],"majority":[94,148],"since":[96],"they":[97],"influence":[99],"performance.":[101],"For":[102],"this,":[103],"propose":[105],"hybrid":[107],"resampling":[108],"method,":[109],"called":[110],"BOD-based":[111],"under-sampling,":[112],"which":[113,214],"based":[115,142],"density-based":[117],"spatial":[118],"clustering":[119],"applications":[121],"with":[122,256],"(DBSCAN)":[124],"approach":[125,192],"well":[127],"detection":[132],"methods,":[133],"is,":[135],"factor":[138],"(BNF)":[139],"outlierness":[141],"neighborhood":[144],"(OBN)":[145],"divide":[147],"into":[151],"four":[152],"distinctive":[153],"categories,":[154],"i.e.,":[155],"safe,":[156],"noise,":[158],"rare,":[159],"outlier.":[161],"Specifically,":[162],"first":[164],"determine":[165],"overlapped":[172],"region":[173],"using":[174,237],"BNF":[176],"method.":[177],"Secondly,":[178],"use":[180],"OBN":[182],"method":[183,242],"detect":[185],"apply":[189],"DBSCAN":[191],"cluster":[194],"samples.":[196,228],"Based":[197],"results":[200],"obtained":[201],"from":[202],"sample":[204],"identification":[205],"analysis,":[206],"then":[208],"segregate":[209],"safe":[211,234],"category":[212],"not":[216],"abnormal":[217],"while":[219],"keeping":[220],"rest":[222],"rare":[227],"Finally,":[229],"remove":[231],"some":[232],"by":[236],"random":[239],"under-sampling":[240],"(RUS)":[241],"verify":[244],"effectiveness":[246],"proposed":[249],"algorithm":[250],"through":[251],"comprehensive":[253],"experimental":[254],"analysis":[255],"considering":[257],"several":[258],"imbalance":[260],"datasets.":[261]},"counts_by_year":[{"year":2026,"cited_by_count":4},{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":1}],"updated_date":"2026-05-22T06:13:13.366637","created_date":"2025-10-10T00:00:00"}
