{"id":"https://openalex.org/W4389574468","doi":"https://doi.org/10.3390/a16120563","title":"On the Influence of Data Imbalance on Supervised Gaussian Mixture Models","display_name":"On the Influence of Data Imbalance on Supervised Gaussian Mixture Models","publication_year":2023,"publication_date":"2023-12-11","ids":{"openalex":"https://openalex.org/W4389574468","doi":"https://doi.org/10.3390/a16120563"},"language":"en","primary_location":{"id":"doi:10.3390/a16120563","is_oa":true,"landing_page_url":"https://doi.org/10.3390/a16120563","pdf_url":"https://www.mdpi.com/1999-4893/16/12/563/pdf?version=1702296656","source":{"id":"https://openalex.org/S190629608","display_name":"Algorithms","issn_l":"1999-4893","issn":["1999-4893"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Algorithms","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.mdpi.com/1999-4893/16/12/563/pdf?version=1702296656","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5045808844","display_name":"Luca Scrucca","orcid":"https://orcid.org/0000-0003-3826-0484"},"institutions":[{"id":"https://openalex.org/I27483092","display_name":"University of Perugia","ror":"https://ror.org/00x27da85","country_code":"IT","type":"education","lineage":["https://openalex.org/I27483092"]}],"countries":["IT"],"is_corresponding":true,"raw_author_name":"Luca Scrucca","raw_affiliation_strings":["Department of Economics, Universit\u00e0 degli Studi di Perugia, Via A. Pascoli 20, 06123 Perugia, Italy"],"affiliations":[{"raw_affiliation_string":"Department of Economics, Universit\u00e0 degli Studi di Perugia, Via A. Pascoli 20, 06123 Perugia, Italy","institution_ids":["https://openalex.org/I27483092"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5045808844"],"corresponding_institution_ids":["https://openalex.org/I27483092"],"apc_list":{"value":1400,"currency":"CHF","value_usd":1515},"apc_paid":{"value":1400,"currency":"CHF","value_usd":1515},"fwci":0.3485,"has_fulltext":true,"cited_by_count":2,"citation_normalized_percentile":{"value":0.67284153,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":95},"biblio":{"volume":"16","issue":"12","first_page":"563","last_page":"563"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11396","display_name":"Artificial Intelligence in Healthcare","score":0.9697999954223633,"subfield":{"id":"https://openalex.org/subfields/3605","display_name":"Health Information Management"},"field":{"id":"https://openalex.org/fields/36","display_name":"Health Professions"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9567000269889832,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7485079765319824},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.7269635200500488},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6254463791847229},{"id":"https://openalex.org/keywords/mixture-model","display_name":"Mixture model","score":0.6038472056388855},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.5969327688217163},{"id":"https://openalex.org/keywords/reliability","display_name":"Reliability (semiconductor)","score":0.5862695574760437},{"id":"https://openalex.org/keywords/gaussian","display_name":"Gaussian","score":0.5230101943016052},{"id":"https://openalex.org/keywords/supervised-learning","display_name":"Supervised learning","score":0.44295957684516907},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.33857885003089905},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.09631222486495972}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7485079765319824},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.7269635200500488},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6254463791847229},{"id":"https://openalex.org/C61224824","wikidata":"https://www.wikidata.org/wiki/Q2260434","display_name":"Mixture model","level":2,"score":0.6038472056388855},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.5969327688217163},{"id":"https://openalex.org/C43214815","wikidata":"https://www.wikidata.org/wiki/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.5862695574760437},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.5230101943016052},{"id":"https://openalex.org/C136389625","wikidata":"https://www.wikidata.org/wiki/Q334384","display_name":"Supervised learning","level":3,"score":0.44295957684516907},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.33857885003089905},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.09631222486495972},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.3390/a16120563","is_oa":true,"landing_page_url":"https://doi.org/10.3390/a16120563","pdf_url":"https://www.mdpi.com/1999-4893/16/12/563/pdf?version=1702296656","source":{"id":"https://openalex.org/S190629608","display_name":"Algorithms","issn_l":"1999-4893","issn":["1999-4893"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Algorithms","raw_type":"journal-article"},{"id":"pmh:oai:cris.unibo.it:11585/1001384","is_oa":true,"landing_page_url":"https://hdl.handle.net/11585/1001384","pdf_url":null,"source":{"id":"https://openalex.org/S4306402579","display_name":"Archivio istituzionale della ricerca (Alma Mater Studiorum Universit\u00e0 di Bologna)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210117483","host_organization_name":"Istituto di Ematologia di Bologna","host_organization_lineage":["https://openalex.org/I4210117483"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/article"},{"id":"pmh:oai:doaj.org/article:a587dab857fa4ab5a954f98ca50e2b6d","is_oa":true,"landing_page_url":"https://doaj.org/article/a587dab857fa4ab5a954f98ca50e2b6d","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Algorithms, Vol 16, Iss 12, p 563 (2023)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.3390/a16120563","is_oa":true,"landing_page_url":"https://doi.org/10.3390/a16120563","pdf_url":"https://www.mdpi.com/1999-4893/16/12/563/pdf?version=1702296656","source":{"id":"https://openalex.org/S190629608","display_name":"Algorithms","issn_l":"1999-4893","issn":["1999-4893"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Algorithms","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4389574468.pdf"},"referenced_works_count":18,"referenced_works":["https://openalex.org/W1614659291","https://openalex.org/W2005363197","https://openalex.org/W2011832962","https://openalex.org/W2015452969","https://openalex.org/W2049633694","https://openalex.org/W2117190680","https://openalex.org/W2141253686","https://openalex.org/W2148143831","https://openalex.org/W2168175751","https://openalex.org/W2488678869","https://openalex.org/W2498094064","https://openalex.org/W2519132385","https://openalex.org/W2610549282","https://openalex.org/W2943917172","https://openalex.org/W4231665431","https://openalex.org/W4243367342","https://openalex.org/W4328105806","https://openalex.org/W6631885290"],"related_works":["https://openalex.org/W2990323019","https://openalex.org/W2014494654","https://openalex.org/W3130349901","https://openalex.org/W1579833936","https://openalex.org/W2095350775","https://openalex.org/W1952261593","https://openalex.org/W2115713555","https://openalex.org/W2014842417","https://openalex.org/W2064901931","https://openalex.org/W1578916557"],"abstract_inverted_index":{"Imbalanced":[0],"data":[1,59],"present":[2],"a":[3,50],"pervasive":[4],"challenge":[5],"in":[6,42,111,122],"many":[7],"real-world":[8,90],"applications":[9],"of":[10,18,24,32,38,57,65,96],"statistical":[11],"and":[12,45,63,81,89,120],"machine":[13],"learning,":[14,78],"where":[15],"the":[16,25,30,36,47,54,61,94,102],"instances":[17],"one":[19],"class":[20,33,109],"significantly":[21],"outnumber":[22],"those":[23],"other.":[26],"This":[27],"paper":[28],"examines":[29],"impact":[31],"imbalance":[34,110],"on":[35,60,87],"performance":[37],"Gaussian":[39,113],"mixture":[40],"models":[41],"classification":[43,66,124],"tasks":[44],"establishes":[46],"need":[48,103],"for":[49,104,108,118],"strategy":[51],"to":[52,72],"reduce":[53],"adverse":[55],"effects":[56],"imbalanced":[58],"accuracy":[62],"reliability":[64],"outcomes.":[67,125],"We":[68],"explore":[69],"various":[70],"strategies":[71,107],"address":[73],"this":[74],"problem,":[75],"including":[76],"cost-sensitive":[77],"threshold":[79],"adjustments,":[80],"sampling-based":[82],"techniques.":[83],"Through":[84],"extensive":[85],"experiments":[86],"synthetic":[88],"datasets,":[91],"we":[92],"evaluate":[93],"effectiveness":[95],"these":[97],"methods.":[98],"Our":[99],"findings":[100],"emphasize":[101],"effective":[105],"mitigation":[106],"supervised":[112],"mixtures,":[114],"offering":[115],"valuable":[116],"insights":[117],"practitioners":[119],"researchers":[121],"improving":[123]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1}],"updated_date":"2026-02-28T09:26:25.869077","created_date":"2025-10-10T00:00:00"}
