{"id":"https://openalex.org/W1987860477","doi":"https://doi.org/10.1109/bigcomp.2014.6741439","title":"A new sampling approach for classification of imbalanced data sets with high density","display_name":"A new sampling approach for classification of imbalanced data sets with high density","publication_year":2014,"publication_date":"2014-01-01","ids":{"openalex":"https://openalex.org/W1987860477","doi":"https://doi.org/10.1109/bigcomp.2014.6741439","mag":"1987860477"},"language":"en","primary_location":{"id":"doi:10.1109/bigcomp.2014.6741439","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigcomp.2014.6741439","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2014 International Conference on Big Data and Smart Computing (BIGCOMP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101998565","display_name":"Pengfei Jia","orcid":"https://orcid.org/0000-0002-9569-6332"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jia Pengfei","raw_affiliation_strings":["Shenzhen Graduate School, Harbin Institute of Technology, Shenzhen, China","Shenzhen Grad. Sch., Harbin Inst. of Technol., Shenzhen, , China"],"affiliations":[{"raw_affiliation_string":"Shenzhen Graduate School, Harbin Institute of Technology, Shenzhen, China","institution_ids":["https://openalex.org/I204983213"]},{"raw_affiliation_string":"Shenzhen Grad. Sch., Harbin Inst. of Technol., Shenzhen, , China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012559241","display_name":"Chunkai Zhang","orcid":"https://orcid.org/0000-0002-2207-0953"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhang Chunkai","raw_affiliation_strings":["Shenzhen Graduate School, Harbin Institute of Technology, Shenzhen, China","Shenzhen Grad. Sch., Harbin Inst. of Technol., Shenzhen, , China"],"affiliations":[{"raw_affiliation_string":"Shenzhen Graduate School, Harbin Institute of Technology, Shenzhen, China","institution_ids":["https://openalex.org/I204983213"]},{"raw_affiliation_string":"Shenzhen Grad. Sch., Harbin Inst. of Technol., Shenzhen, , China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100740564","display_name":"Zhenyu He","orcid":"https://orcid.org/0000-0002-2546-8721"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"He Zhenyu","raw_affiliation_strings":["Shenzhen Graduate School, Harbin Institute of Technology, Shenzhen, China","Shenzhen Grad. Sch., Harbin Inst. of Technol., Shenzhen, , China"],"affiliations":[{"raw_affiliation_string":"Shenzhen Graduate School, Harbin Institute of Technology, Shenzhen, China","institution_ids":["https://openalex.org/I204983213"]},{"raw_affiliation_string":"Shenzhen Grad. Sch., Harbin Inst. of Technol., Shenzhen, , China","institution_ids":["https://openalex.org/I204983213"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5101998565"],"corresponding_institution_ids":["https://openalex.org/I204983213"],"apc_list":null,"apc_paid":null,"fwci":4.2412,"has_fulltext":false,"cited_by_count":35,"citation_normalized_percentile":{"value":0.94277622,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"217","last_page":"222"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13429","display_name":"Electricity Theft Detection Techniques","score":0.9413999915122986,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11063","display_name":"Rough Sets and Fuzzy Logic","score":0.9193000197410583,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/oversampling","display_name":"Oversampling","score":0.7411333322525024},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7179691195487976},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.6539416313171387},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6340261101722717},{"id":"https://openalex.org/keywords/sampling","display_name":"Sampling (signal processing)","score":0.5698720216751099},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5383838415145874},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.49078449606895447},{"id":"https://openalex.org/keywords/random-forest","display_name":"Random forest","score":0.4690333604812622},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.4672028720378876},{"id":"https://openalex.org/keywords/statistical-classification","display_name":"Statistical classification","score":0.44814205169677734},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.4382956027984619},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4360281527042389},{"id":"https://openalex.org/keywords/bandwidth","display_name":"Bandwidth (computing)","score":0.15121972560882568}],"concepts":[{"id":"https://openalex.org/C197323446","wikidata":"https://www.wikidata.org/wiki/Q331222","display_name":"Oversampling","level":3,"score":0.7411333322525024},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7179691195487976},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.6539416313171387},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6340261101722717},{"id":"https://openalex.org/C140779682","wikidata":"https://www.wikidata.org/wiki/Q210868","display_name":"Sampling (signal processing)","level":3,"score":0.5698720216751099},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5383838415145874},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.49078449606895447},{"id":"https://openalex.org/C169258074","wikidata":"https://www.wikidata.org/wiki/Q245748","display_name":"Random forest","level":2,"score":0.4690333604812622},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.4672028720378876},{"id":"https://openalex.org/C110083411","wikidata":"https://www.wikidata.org/wiki/Q1744628","display_name":"Statistical classification","level":2,"score":0.44814205169677734},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.4382956027984619},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4360281527042389},{"id":"https://openalex.org/C2776257435","wikidata":"https://www.wikidata.org/wiki/Q1576430","display_name":"Bandwidth (computing)","level":2,"score":0.15121972560882568},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.0},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.0},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bigcomp.2014.6741439","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigcomp.2014.6741439","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2014 International Conference on Big Data and Smart Computing (BIGCOMP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/1","display_name":"No poverty","score":0.6200000047683716}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":30,"referenced_works":["https://openalex.org/W47312375","https://openalex.org/W85350352","https://openalex.org/W167016754","https://openalex.org/W1563938718","https://openalex.org/W1570448133","https://openalex.org/W1588282782","https://openalex.org/W1707341581","https://openalex.org/W1766594731","https://openalex.org/W1980894113","https://openalex.org/W2017416182","https://openalex.org/W2023639956","https://openalex.org/W2046384674","https://openalex.org/W2099454382","https://openalex.org/W2117689108","https://openalex.org/W2118978333","https://openalex.org/W2132791018","https://openalex.org/W2133990480","https://openalex.org/W2148143831","https://openalex.org/W2158698691","https://openalex.org/W2464091921","https://openalex.org/W2979832949","https://openalex.org/W3120740533","https://openalex.org/W3155649056","https://openalex.org/W4230683138","https://openalex.org/W6603460400","https://openalex.org/W6606837198","https://openalex.org/W6633571703","https://openalex.org/W6637352407","https://openalex.org/W6679745481","https://openalex.org/W6719283829"],"related_works":["https://openalex.org/W3196098778","https://openalex.org/W3172259201","https://openalex.org/W3211250490","https://openalex.org/W2903618681","https://openalex.org/W3184937791","https://openalex.org/W4360584310","https://openalex.org/W2981515171","https://openalex.org/W80466363","https://openalex.org/W2924282518","https://openalex.org/W3080872054"],"abstract_inverted_index":{"Class":[0],"imbalance":[1],"of":[2,11,54,66,98],"datasets":[3],"is":[4],"a":[5,45,142],"common":[6],"problem":[7],"in":[8,34,58,121,156],"the":[9,18,41,52,68,85,109,113,122,168,172],"field":[10],"machine":[12],"learning.":[13],"In":[14],"recent":[15],"years,":[16],"because":[17],"traditional":[19],"classifier":[20],"algorithms":[21,104,139],"are":[22,80,105],"designed":[23],"only":[24,107],"for":[25,40,84,92],"balanced":[26],"cases,":[27],"these":[28,137],"classifiers":[29],"always":[30],"achieved":[31],"poor":[32],"performance":[33,144],"imbalanced":[35,42,55,69,86],"data":[36,43,56,70,87,94],"classification":[37,57,71],"issues,":[38],"especially":[39,91],"with":[44,88,95],"really":[46],"high":[47,89],"density.":[48],"This":[49],"paper":[50],"introduces":[51],"importance":[53],"various":[59],"fields":[60],"first;":[61],"then,":[62],"contends":[63],"existing":[64],"methods":[65],"solving":[67],"problem;":[72],"finally,":[73],"proposes":[74],"two":[75,102,138],"new":[76,103],"sampling":[77,169],"methods,":[78],"which":[79],"based":[81],"on":[82],"borderline-SMOTE,":[83],"density,":[90],"big":[93],"this":[96],"kind":[97],"distribution":[99],"feature.":[100],"These":[101],"not":[106],"over-sampling":[108,152],"minority":[110,151,176],"samples":[111,120,125,178],"near":[112],"borderline,":[114],"but":[115],"also":[116],"creating":[117],"appropriate":[118],"synthetic":[119],"majority":[123,131,173],"class":[124,132,174,177],"side":[126],"and":[127,154,175],"under-sampling":[128],"some":[129],"particular":[130],"samples.":[133],"Experiments":[134],"show":[135],"that":[136],"could":[140],"achieve":[141],"better":[143],"than":[145],"random":[146],"over":[147],"sampling,":[148],"SMOTE":[149],"(Synthetic":[150],"technique)":[153],"Borderline-SMOTE":[155],"AUC":[157],"(Area":[158],"under":[159],"Receiver":[160],"Operating":[161],"Characteristics":[162],"Curve)":[163],"metric":[164],"evaluate":[165],"method,":[166],"when":[167],"rate":[170],"makes":[171],"approximate":[179],"equilibrium.":[180]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":4},{"year":2022,"cited_by_count":6},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":5},{"year":2018,"cited_by_count":2},{"year":2017,"cited_by_count":4},{"year":2016,"cited_by_count":5},{"year":2014,"cited_by_count":1}],"updated_date":"2026-03-17T09:09:15.849793","created_date":"2025-10-10T00:00:00"}
