{"id":"https://openalex.org/W4293102791","doi":"https://doi.org/10.1080/03610918.2022.2049820","title":"A virtual multi-label approach to imbalanced data classification","display_name":"A virtual multi-label approach to imbalanced data classification","publication_year":2022,"publication_date":"2022-03-21","ids":{"openalex":"https://openalex.org/W4293102791","doi":"https://doi.org/10.1080/03610918.2022.2049820"},"language":"en","primary_location":{"id":"doi:10.1080/03610918.2022.2049820","is_oa":false,"landing_page_url":"https://doi.org/10.1080/03610918.2022.2049820","pdf_url":null,"source":{"id":"https://openalex.org/S153329750","display_name":"Communications in Statistics - Simulation and Computation","issn_l":"0361-0918","issn":["0361-0918","1532-4141"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320547","host_organization_name":"Taylor & Francis","host_organization_lineage":["https://openalex.org/P4310320547"],"host_organization_lineage_names":["Taylor & Francis"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Communications in Statistics - Simulation and Computation","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5083300026","display_name":"Elizabeth P. Chou","orcid":"https://orcid.org/0000-0002-8983-142X"},"institutions":[{"id":"https://openalex.org/I87354575","display_name":"National Chengchi University","ror":"https://ror.org/03rqk8h36","country_code":"TW","type":"education","lineage":["https://openalex.org/I87354575"]}],"countries":["TW"],"is_corresponding":true,"raw_author_name":"Elizabeth P. Chou","raw_affiliation_strings":["Department of Statistics, National Chengchi University, Taipei, Taiwan"],"affiliations":[{"raw_affiliation_string":"Department of Statistics, National Chengchi University, Taipei, Taiwan","institution_ids":["https://openalex.org/I87354575"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5002621818","display_name":"Shan\u2010Ping Yang","orcid":null},"institutions":[{"id":"https://openalex.org/I87354575","display_name":"National Chengchi University","ror":"https://ror.org/03rqk8h36","country_code":"TW","type":"education","lineage":["https://openalex.org/I87354575"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Shan-Ping Yang","raw_affiliation_strings":["Department of Statistics, National Chengchi University, Taipei, Taiwan"],"affiliations":[{"raw_affiliation_string":"Department of Statistics, National Chengchi University, Taipei, Taiwan","institution_ids":["https://openalex.org/I87354575"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5083300026"],"corresponding_institution_ids":["https://openalex.org/I87354575"],"apc_list":null,"apc_paid":null,"fwci":0.2758,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.62511489,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":96},"biblio":{"volume":"53","issue":"3","first_page":"1461","last_page":"1471"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13429","display_name":"Electricity Theft Detection Techniques","score":0.9927999973297119,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9822999835014343,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/undersampling","display_name":"Undersampling","score":0.9442859888076782},{"id":"https://openalex.org/keywords/oversampling","display_name":"Oversampling","score":0.8778888583183289},{"id":"https://openalex.org/keywords/overfitting","display_name":"Overfitting","score":0.7861850261688232},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.7398925423622131},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7323552370071411},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.702277660369873},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.5477655529975891},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.5344765782356262},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.5180140137672424},{"id":"https://openalex.org/keywords/perspective","display_name":"Perspective (graphical)","score":0.5151099562644958},{"id":"https://openalex.org/keywords/multiclass-classification","display_name":"Multiclass classification","score":0.4344814419746399},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.418854296207428},{"id":"https://openalex.org/keywords/ensemble-learning","display_name":"Ensemble learning","score":0.41425585746765137},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4097583293914795},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3463558256626129},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.1914268434047699},{"id":"https://openalex.org/keywords/bandwidth","display_name":"Bandwidth (computing)","score":0.07854366302490234}],"concepts":[{"id":"https://openalex.org/C136536468","wikidata":"https://www.wikidata.org/wiki/Q1225894","display_name":"Undersampling","level":2,"score":0.9442859888076782},{"id":"https://openalex.org/C197323446","wikidata":"https://www.wikidata.org/wiki/Q331222","display_name":"Oversampling","level":3,"score":0.8778888583183289},{"id":"https://openalex.org/C22019652","wikidata":"https://www.wikidata.org/wiki/Q331309","display_name":"Overfitting","level":3,"score":0.7861850261688232},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.7398925423622131},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7323552370071411},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.702277660369873},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.5477655529975891},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.5344765782356262},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.5180140137672424},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.5151099562644958},{"id":"https://openalex.org/C123860398","wikidata":"https://www.wikidata.org/wiki/Q6934605","display_name":"Multiclass classification","level":3,"score":0.4344814419746399},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.418854296207428},{"id":"https://openalex.org/C45942800","wikidata":"https://www.wikidata.org/wiki/Q245652","display_name":"Ensemble learning","level":2,"score":0.41425585746765137},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4097583293914795},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3463558256626129},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.1914268434047699},{"id":"https://openalex.org/C2776257435","wikidata":"https://www.wikidata.org/wiki/Q1576430","display_name":"Bandwidth (computing)","level":2,"score":0.07854366302490234},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1080/03610918.2022.2049820","is_oa":false,"landing_page_url":"https://doi.org/10.1080/03610918.2022.2049820","pdf_url":null,"source":{"id":"https://openalex.org/S153329750","display_name":"Communications in Statistics - Simulation and Computation","issn_l":"0361-0918","issn":["0361-0918","1532-4141"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320547","host_organization_name":"Taylor & Francis","host_organization_lineage":["https://openalex.org/P4310320547"],"host_organization_lineage_names":["Taylor & Francis"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Communications in Statistics - Simulation and Computation","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G434435203","display_name":null,"funder_award_id":"-M-004-004","funder_id":"https://openalex.org/F4320322795","funder_display_name":"Ministry of Science and Technology, Taiwan"},{"id":"https://openalex.org/G737106015","display_name":null,"funder_award_id":"MOST 108-","funder_id":"https://openalex.org/F4320322795","funder_display_name":"Ministry of Science and Technology, Taiwan"}],"funders":[{"id":"https://openalex.org/F4320322795","display_name":"Ministry of Science and Technology, Taiwan","ror":"https://ror.org/02kv4zf79"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":19,"referenced_works":["https://openalex.org/W728297","https://openalex.org/W102369970","https://openalex.org/W1499292107","https://openalex.org/W1986703974","https://openalex.org/W1992795012","https://openalex.org/W2053724458","https://openalex.org/W2104167780","https://openalex.org/W2109826612","https://openalex.org/W2118978333","https://openalex.org/W2132870739","https://openalex.org/W2135046866","https://openalex.org/W2150593711","https://openalex.org/W2154706222","https://openalex.org/W2244476846","https://openalex.org/W2299467264","https://openalex.org/W2551233626","https://openalex.org/W3037850413","https://openalex.org/W3144619878","https://openalex.org/W4239510810"],"related_works":["https://openalex.org/W32988189","https://openalex.org/W4389233021","https://openalex.org/W4308469503","https://openalex.org/W2904737874","https://openalex.org/W80466363","https://openalex.org/W2399571531","https://openalex.org/W2947132063","https://openalex.org/W4390415670","https://openalex.org/W4288337828","https://openalex.org/W4287816717"],"abstract_inverted_index":{"One":[0],"of":[1,17,64,79,85,96,117,134,210],"the":[2,49,83,92,115,140,146,153,162,170,202,208],"most":[3],"challenging":[4],"issues":[5],"in":[6,14,48,53,169],"machine":[7,33],"learning":[8,34,39,57],"is":[9,23,94,149,167,175],"imbalanced":[10,154],"data":[11,211],"analysis.":[12],"Usually,":[13],"this":[15,138],"type":[16],"research,":[18],"correctly":[19,27],"predicting":[20,28],"minority":[21],"labels":[22,142],"more":[24],"critical":[25],"than":[26],"majority":[29,50,147],"labels.":[30],"However,":[31],"traditional":[32],"techniques":[35],"easily":[36],"lead":[37],"to":[38,44,90,131,151],"bias.":[40],"Traditional":[41],"classifiers":[42],"tend":[43],"place":[45],"all":[46,132],"subjects":[47],"group,":[51],"resulting":[52],"biased":[54],"predictions.":[55],"Machine":[56],"studies":[58],"are":[59,77],"typically":[60],"conducted":[61],"from":[62],"one":[63],"two":[65],"perspectives:":[66],"a":[67,71,97],"data-based":[68,80],"perspective":[69],"or":[70,88],"model-based":[72,98],"perspective.":[73],"Oversampling":[74],"and":[75,120,189,191,195,214],"undersampling":[76],"examples":[78],"approaches,":[81],"while":[82],"addition":[84],"costs,":[86],"penalties,":[87],"weights":[89],"optimize":[91],"algorithm":[93],"typical":[95],"approach.":[99],"Some":[100],"ensemble":[101],"methods":[102,108,127,186,193],"have":[103],"been":[104],"studied":[105],"recently.":[106],"These":[107],"cause":[109],"various":[110],"problems,":[111],"such":[112,183],"as":[113,184],"overfitting,":[114],"omission":[116],"some":[118],"information,":[119],"long":[121],"computation":[122],"times.":[123],"In":[124],"addition,":[125],"these":[126],"do":[128],"not":[129],"apply":[130],"kinds":[133],"datasets.":[135],"Based":[136],"on":[137],"problem,":[139],"virtual":[141],"(ViLa)":[143],"approach":[144,160],"for":[145],"label":[148],"proposed":[150,173,203],"solve":[152],"problem.":[155],"A":[156],"new":[157],"multiclass":[158],"classification":[159],"with":[161,177],"equal":[163],"K-means":[164],"clustering":[165],"method":[166,174,204],"demonstrated":[168],"study.":[171],"The":[172,198],"compared":[176],"commonly":[178],"used":[179],"imbalance":[180,212],"problem":[181],"methods,":[182],"sampling":[185],"(oversampling,":[187],"undersampling,":[188],"SMOTE)":[190],"classifier":[192],"(SVM":[194],"one-class":[196],"SVM).":[197],"results":[199],"show":[200],"that":[201],"performs":[205],"better":[206],"when":[207],"degree":[209],"increases":[213],"will":[215],"gradually":[216],"outperform":[217],"other":[218],"methods.":[219]},"counts_by_year":[{"year":2025,"cited_by_count":2}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
