{"id":"https://openalex.org/W3216794305","doi":"https://doi.org/10.1186/s13040-021-00283-6","title":"Gaussian noise up-sampling is better suited than SMOTE and ADASYN for clinical decision making","display_name":"Gaussian noise up-sampling is better suited than SMOTE and ADASYN for clinical decision making","publication_year":2021,"publication_date":"2021-11-29","ids":{"openalex":"https://openalex.org/W3216794305","doi":"https://doi.org/10.1186/s13040-021-00283-6","mag":"3216794305","pmid":"https://pubmed.ncbi.nlm.nih.gov/34844620"},"language":"en","primary_location":{"id":"doi:10.1186/s13040-021-00283-6","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13040-021-00283-6","pdf_url":"https://biodatamining.biomedcentral.com/counter/pdf/10.1186/s13040-021-00283-6","source":{"id":"https://openalex.org/S84409260","display_name":"BioData Mining","issn_l":"1756-0381","issn":["1756-0381"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BioData Mining","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj","pubmed"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://biodatamining.biomedcentral.com/counter/pdf/10.1186/s13040-021-00283-6","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5112984561","display_name":"Jacqueline Michelle Beinecke","orcid":null},"institutions":[{"id":"https://openalex.org/I161103922","display_name":"Philipps University of Marburg","ror":"https://ror.org/01rdrb571","country_code":"DE","type":"education","lineage":["https://openalex.org/I161103922"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Jacqueline Beinecke","raw_affiliation_strings":["Department of Mathematics and Computer Science, Philipps-University of Marburg, Hans-Meerwein-Str. 6, 35043, Marburg, Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Mathematics and Computer Science, Philipps-University of Marburg, Hans-Meerwein-Str. 6, 35043, Marburg, Germany","institution_ids":["https://openalex.org/I161103922"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5060650201","display_name":"Dominik Heider","orcid":"https://orcid.org/0000-0002-3108-8311"},"institutions":[{"id":"https://openalex.org/I161103922","display_name":"Philipps University of Marburg","ror":"https://ror.org/01rdrb571","country_code":"DE","type":"education","lineage":["https://openalex.org/I161103922"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Dominik Heider","raw_affiliation_strings":["Department of Mathematics and Computer Science, Philipps-University of Marburg, Hans-Meerwein-Str. 6, 35043, Marburg, Germany. dominik.heider@uni-marburg.de","Department of Mathematics and Computer Science, Philipps-University of Marburg, Hans-Meerwein-Str. 6, 35043, Marburg, Germany"],"raw_orcid":"https://orcid.org/0000-0002-3108-8311","affiliations":[{"raw_affiliation_string":"Department of Mathematics and Computer Science, Philipps-University of Marburg, Hans-Meerwein-Str. 6, 35043, Marburg, Germany. dominik.heider@uni-marburg.de","institution_ids":["https://openalex.org/I161103922"]},{"raw_affiliation_string":"Department of Mathematics and Computer Science, Philipps-University of Marburg, Hans-Meerwein-Str. 6, 35043, Marburg, Germany","institution_ids":["https://openalex.org/I161103922"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5112984561"],"corresponding_institution_ids":["https://openalex.org/I161103922"],"apc_list":{"value":1690,"currency":"GBP","value_usd":2072},"apc_paid":{"value":1690,"currency":"GBP","value_usd":2072},"fwci":5.1794,"has_fulltext":true,"cited_by_count":71,"citation_normalized_percentile":{"value":0.96216046,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":100},"biblio":{"volume":"14","issue":"1","first_page":"49","last_page":"49"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11396","display_name":"Artificial Intelligence in Healthcare","score":0.9923999905586243,"subfield":{"id":"https://openalex.org/subfields/3605","display_name":"Health Information Management"},"field":{"id":"https://openalex.org/fields/36","display_name":"Health Professions"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T11443","display_name":"Advanced Statistical Process Monitoring","score":0.9868000149726868,"subfield":{"id":"https://openalex.org/subfields/1804","display_name":"Statistics, Probability and Uncertainty"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7658474445343018},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5932208895683289},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5692405104637146},{"id":"https://openalex.org/keywords/imputation","display_name":"Imputation (statistics)","score":0.562655508518219},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.5584556460380554},{"id":"https://openalex.org/keywords/feature-selection","display_name":"Feature selection","score":0.5422455072402954},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.5187190175056458},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.4750480651855469},{"id":"https://openalex.org/keywords/gaussian","display_name":"Gaussian","score":0.46173274517059326},{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.45196303725242615},{"id":"https://openalex.org/keywords/missing-data","display_name":"Missing data","score":0.45174288749694824},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.41983214020729065}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7658474445343018},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5932208895683289},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5692405104637146},{"id":"https://openalex.org/C58041806","wikidata":"https://www.wikidata.org/wiki/Q1660484","display_name":"Imputation (statistics)","level":3,"score":0.562655508518219},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5584556460380554},{"id":"https://openalex.org/C148483581","wikidata":"https://www.wikidata.org/wiki/Q446488","display_name":"Feature selection","level":2,"score":0.5422455072402954},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.5187190175056458},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.4750480651855469},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.46173274517059326},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.45196303725242615},{"id":"https://openalex.org/C9357733","wikidata":"https://www.wikidata.org/wiki/Q6878417","display_name":"Missing data","level":2,"score":0.45174288749694824},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.41983214020729065},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1186/s13040-021-00283-6","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13040-021-00283-6","pdf_url":"https://biodatamining.biomedcentral.com/counter/pdf/10.1186/s13040-021-00283-6","source":{"id":"https://openalex.org/S84409260","display_name":"BioData Mining","issn_l":"1756-0381","issn":["1756-0381"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BioData Mining","raw_type":"journal-article"},{"id":"pmid:34844620","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/34844620","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BioData mining","raw_type":null},{"id":"pmh:oai:doaj.org/article:87bc75d2f5c5416db4f6e104d9286f50","is_oa":true,"landing_page_url":"https://doaj.org/article/87bc75d2f5c5416db4f6e104d9286f50","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"BioData Mining, Vol 14, Iss 1, Pp 1-11 (2021)","raw_type":"article"},{"id":"pmh:oai:pubmedcentral.nih.gov:8628399","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/8628399","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"BioData Min","raw_type":"Text"}],"best_oa_location":{"id":"doi:10.1186/s13040-021-00283-6","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13040-021-00283-6","pdf_url":"https://biodatamining.biomedcentral.com/counter/pdf/10.1186/s13040-021-00283-6","source":{"id":"https://openalex.org/S84409260","display_name":"BioData Mining","issn_l":"1756-0381","issn":["1756-0381"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BioData Mining","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.7900000214576721,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3216794305.pdf","grobid_xml":"https://content.openalex.org/works/W3216794305.grobid-xml"},"referenced_works_count":39,"referenced_works":["https://openalex.org/W1505191356","https://openalex.org/W1969557815","https://openalex.org/W2009467617","https://openalex.org/W2035833657","https://openalex.org/W2042762335","https://openalex.org/W2058203033","https://openalex.org/W2064186732","https://openalex.org/W2091469633","https://openalex.org/W2104551758","https://openalex.org/W2104933073","https://openalex.org/W2110065044","https://openalex.org/W2136362180","https://openalex.org/W2143684265","https://openalex.org/W2144798162","https://openalex.org/W2145126338","https://openalex.org/W2148143831","https://openalex.org/W2157963336","https://openalex.org/W2335024046","https://openalex.org/W2338318698","https://openalex.org/W2402601207","https://openalex.org/W2470965540","https://openalex.org/W2490420619","https://openalex.org/W2540642777","https://openalex.org/W2550614318","https://openalex.org/W2612932006","https://openalex.org/W2620511244","https://openalex.org/W2760946358","https://openalex.org/W2798891231","https://openalex.org/W2902872384","https://openalex.org/W2920054351","https://openalex.org/W2949479579","https://openalex.org/W2969756003","https://openalex.org/W2986698571","https://openalex.org/W2998793733","https://openalex.org/W2999309192","https://openalex.org/W3024473672","https://openalex.org/W3120740533","https://openalex.org/W4231669957","https://openalex.org/W4256078332"],"related_works":["https://openalex.org/W2181530120","https://openalex.org/W4211215373","https://openalex.org/W2024529227","https://openalex.org/W1574575415","https://openalex.org/W3144172081","https://openalex.org/W3028371478","https://openalex.org/W2081476516","https://openalex.org/W2581984549","https://openalex.org/W3179858851","https://openalex.org/W3123177881"],"abstract_inverted_index":{"Clinical":[0],"data":[1,65,72,85],"sets":[2,73,86],"have":[3,21,34,60],"very":[4],"special":[5],"properties":[6],"and":[7,27,33,41,67,87,112,114],"suffer":[8],"from":[9],"many":[10],"caveats":[11],"in":[12,83,135],"machine":[13,91],"learning.":[14],"They":[15],"typically":[16,52],"show":[17],"a":[18,22,28],"high-class":[19],"imbalance,":[20],"small":[23],"number":[24,30],"of":[25,31,90],"samples":[26],"large":[29],"parameters,":[32],"missing":[35],"values.":[36],"While":[37],"feature":[38],"selection":[39],"approaches":[40],"imputation":[42],"techniques":[43,59,80],"address":[44],"the":[45,48],"former":[46],"problems,":[47],"class":[49],"imbalance":[50],"is":[51,74,102,107],"addressed":[53],"using":[54],"augmentation":[55,79,128],"techniques.":[56],"However,":[57,121],"these":[58],"been":[61,125],"developed":[62],"for":[63,70,81],"big":[64],"analytics,":[66],"their":[68],"suitability":[69],"clinical":[71,84],"unclear.This":[75],"study":[76],"analyzed":[77],"different":[78],"use":[82],"subsequent":[88],"employment":[89],"learning-based":[92],"classification.":[93],"It":[94],"turns":[95],"out":[96],"that":[97,127],"Gaussian":[98],"Noise":[99],"Up-Sampling":[100],"(GNUS)":[101],"not":[103,130],"always":[104],"but":[105],"generally,":[106],"as":[108,110],"good":[109],"SMOTE":[111],"ADASYN":[113],"even":[115],"outperform":[116],"those":[117],"on":[118],"some":[119,136],"datasets.":[120],"it":[122],"has":[123],"also":[124],"shown":[126],"does":[129],"improve":[131],"classification":[132],"at":[133],"all":[134],"cases.":[137]},"counts_by_year":[{"year":2026,"cited_by_count":12},{"year":2025,"cited_by_count":22},{"year":2024,"cited_by_count":13},{"year":2023,"cited_by_count":17},{"year":2022,"cited_by_count":7}],"updated_date":"2026-01-13T01:12:25.745995","created_date":"2025-10-10T00:00:00"}
