{"id":"https://openalex.org/W4322500535","doi":"https://doi.org/10.3390/data8030049","title":"Data Balancing Techniques for Predicting Student Dropout Using Machine Learning","display_name":"Data Balancing Techniques for Predicting Student Dropout Using Machine Learning","publication_year":2023,"publication_date":"2023-02-27","ids":{"openalex":"https://openalex.org/W4322500535","doi":"https://doi.org/10.3390/data8030049"},"language":"en","primary_location":{"id":"doi:10.3390/data8030049","is_oa":true,"landing_page_url":"https://doi.org/10.3390/data8030049","pdf_url":"https://www.mdpi.com/2306-5729/8/3/49/pdf?version=1677481724","source":{"id":"https://openalex.org/S4210226510","display_name":"Data","issn_l":"2306-5729","issn":["2306-5729"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Data","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.mdpi.com/2306-5729/8/3/49/pdf?version=1677481724","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5035585798","display_name":"Neema Mduma","orcid":"https://orcid.org/0000-0002-4364-3124"},"institutions":[{"id":"https://openalex.org/I97231232","display_name":"Nelson Mandela African Institution of Science and Technology","ror":"https://ror.org/041vsn055","country_code":"TZ","type":"education","lineage":["https://openalex.org/I97231232"]}],"countries":["TZ"],"is_corresponding":true,"raw_author_name":"Neema Mduma","raw_affiliation_strings":["Department of Information and Communication Sciences and Engineering, The Nelson Mandela African Institution of Science and Technology, Arusha P.O. Box 447, Tanzania"],"raw_orcid":"https://orcid.org/0000-0002-4364-3124","affiliations":[{"raw_affiliation_string":"Department of Information and Communication Sciences and Engineering, The Nelson Mandela African Institution of Science and Technology, Arusha P.O. Box 447, Tanzania","institution_ids":["https://openalex.org/I97231232"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5035585798"],"corresponding_institution_ids":["https://openalex.org/I97231232"],"apc_list":{"value":1600,"currency":"CHF","value_usd":1732},"apc_paid":{"value":1600,"currency":"CHF","value_usd":1732},"fwci":7.6684,"has_fulltext":false,"cited_by_count":45,"citation_normalized_percentile":{"value":0.97952464,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":100},"biblio":{"volume":"8","issue":"3","first_page":"49","last_page":"49"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11122","display_name":"Online Learning and Analytics","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1706","display_name":"Computer Science Applications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9948999881744385,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/dropout","display_name":"Dropout (neural networks)","score":0.8273178339004517},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7155249118804932},{"id":"https://openalex.org/keywords/random-forest","display_name":"Random forest","score":0.6521407961845398},{"id":"https://openalex.org/keywords/logistic-regression","display_name":"Logistic regression","score":0.617381751537323},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.6080198287963867},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5920842289924622},{"id":"https://openalex.org/keywords/confusion-matrix","display_name":"Confusion matrix","score":0.5458621382713318},{"id":"https://openalex.org/keywords/perceptron","display_name":"Perceptron","score":0.48757094144821167},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3897019028663635},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.13452032208442688}],"concepts":[{"id":"https://openalex.org/C2776145597","wikidata":"https://www.wikidata.org/wiki/Q25339462","display_name":"Dropout (neural networks)","level":2,"score":0.8273178339004517},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7155249118804932},{"id":"https://openalex.org/C169258074","wikidata":"https://www.wikidata.org/wiki/Q245748","display_name":"Random forest","level":2,"score":0.6521407961845398},{"id":"https://openalex.org/C151956035","wikidata":"https://www.wikidata.org/wiki/Q1132755","display_name":"Logistic regression","level":2,"score":0.617381751537323},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.6080198287963867},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5920842289924622},{"id":"https://openalex.org/C138602881","wikidata":"https://www.wikidata.org/wiki/Q2709591","display_name":"Confusion matrix","level":2,"score":0.5458621382713318},{"id":"https://openalex.org/C60908668","wikidata":"https://www.wikidata.org/wiki/Q690207","display_name":"Perceptron","level":3,"score":0.48757094144821167},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3897019028663635},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.13452032208442688}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.3390/data8030049","is_oa":true,"landing_page_url":"https://doi.org/10.3390/data8030049","pdf_url":"https://www.mdpi.com/2306-5729/8/3/49/pdf?version=1677481724","source":{"id":"https://openalex.org/S4210226510","display_name":"Data","issn_l":"2306-5729","issn":["2306-5729"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Data","raw_type":"journal-article"},{"id":"pmh:oai:RePEc:gam:jdataj:v:8:y:2023:i:3:p:49-:d:1081633","is_oa":false,"landing_page_url":"https://www.mdpi.com/2306-5729/8/3/49/","pdf_url":null,"source":{"id":"https://openalex.org/S4306401271","display_name":"RePEc: Research Papers in Economics","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I77793887","host_organization_name":"Federal Reserve Bank of St. Louis","host_organization_lineage":["https://openalex.org/I77793887"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},{"id":"pmh:oai:doaj.org/article:1ad7ee21f2df4b0e866a0d26fe633c9c","is_oa":true,"landing_page_url":"https://doaj.org/article/1ad7ee21f2df4b0e866a0d26fe633c9c","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Data, Vol 8, Iss 3, p 49 (2023)","raw_type":"article"},{"id":"pmh:oai:mdpi.com:/2306-5729/8/3/49/","is_oa":true,"landing_page_url":"https://dx.doi.org/10.3390/data8030049","pdf_url":null,"source":{"id":"https://openalex.org/S4306400947","display_name":"MDPI (MDPI AG)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210097602","host_organization_name":"Multidisciplinary Digital Publishing Institute (Switzerland)","host_organization_lineage":["https://openalex.org/I4210097602"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Data","raw_type":"Text"}],"best_oa_location":{"id":"doi:10.3390/data8030049","is_oa":true,"landing_page_url":"https://doi.org/10.3390/data8030049","pdf_url":"https://www.mdpi.com/2306-5729/8/3/49/pdf?version=1677481724","source":{"id":"https://openalex.org/S4210226510","display_name":"Data","issn_l":"2306-5729","issn":["2306-5729"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Data","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.6700000166893005,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4322500535.pdf"},"referenced_works_count":74,"referenced_works":["https://openalex.org/W1190947359","https://openalex.org/W1477378514","https://openalex.org/W1623006543","https://openalex.org/W1873332500","https://openalex.org/W1959220275","https://openalex.org/W1982165141","https://openalex.org/W1993220166","https://openalex.org/W2013272253","https://openalex.org/W2034213054","https://openalex.org/W2040181375","https://openalex.org/W2058703365","https://openalex.org/W2067594023","https://openalex.org/W2069992838","https://openalex.org/W2095148636","https://openalex.org/W2103647733","https://openalex.org/W2104961002","https://openalex.org/W2120457925","https://openalex.org/W2128965734","https://openalex.org/W2130226478","https://openalex.org/W2149024119","https://openalex.org/W2154706222","https://openalex.org/W2162847938","https://openalex.org/W2164330572","https://openalex.org/W2216326501","https://openalex.org/W2216946510","https://openalex.org/W2238013688","https://openalex.org/W2295797531","https://openalex.org/W2321367626","https://openalex.org/W2338318698","https://openalex.org/W2415567294","https://openalex.org/W2476492714","https://openalex.org/W2514579206","https://openalex.org/W2529456000","https://openalex.org/W2533824555","https://openalex.org/W2546314413","https://openalex.org/W2582482077","https://openalex.org/W2588330427","https://openalex.org/W2589697858","https://openalex.org/W2592955949","https://openalex.org/W2605782971","https://openalex.org/W2606494063","https://openalex.org/W2740912294","https://openalex.org/W2743917483","https://openalex.org/W2744032228","https://openalex.org/W2760894977","https://openalex.org/W2762332651","https://openalex.org/W2772393799","https://openalex.org/W2775539418","https://openalex.org/W2793643126","https://openalex.org/W2799963283","https://openalex.org/W2903515276","https://openalex.org/W2908355237","https://openalex.org/W2912892963","https://openalex.org/W2915981391","https://openalex.org/W2962807382","https://openalex.org/W2963100393","https://openalex.org/W2986698571","https://openalex.org/W2997276923","https://openalex.org/W3003555941","https://openalex.org/W3085957330","https://openalex.org/W4223944868","https://openalex.org/W4307948039","https://openalex.org/W4309284738","https://openalex.org/W6636749155","https://openalex.org/W6639175750","https://openalex.org/W6690128647","https://openalex.org/W6697339809","https://openalex.org/W6719844942","https://openalex.org/W6733989970","https://openalex.org/W6736817506","https://openalex.org/W6746590627","https://openalex.org/W6757935464","https://openalex.org/W6759495822","https://openalex.org/W6941537234"],"related_works":["https://openalex.org/W4239706975","https://openalex.org/W4321636153","https://openalex.org/W4379742641","https://openalex.org/W2765947158","https://openalex.org/W3198710639","https://openalex.org/W4308191010","https://openalex.org/W4283313480","https://openalex.org/W4323021782","https://openalex.org/W4231994957","https://openalex.org/W4293525103"],"abstract_inverted_index":{"Predicting":[0],"student":[1,18],"dropout":[2,19,35,160,198],"is":[3,12,28],"a":[4,38,73],"challenging":[5],"problem":[6],"in":[7,17,67],"the":[8,23,32,42,68,124,142,147,156,164,170,174,178,188,195],"education":[9],"sector.":[10],"This":[11],"due":[13],"to":[14,50,63,122],"an":[15,51],"imbalance":[16,44],"data,":[20],"mainly":[21],"because":[22],"number":[24,33,158],"of":[25,34,126,159,183,191,197],"registered":[26],"students":[27,161,193],"always":[29],"higher":[30],"than":[31],"students.":[36],"Developing":[37],"model":[39],"without":[40],"taking":[41],"data":[43,58],"issue":[45],"into":[46],"account":[47],"may":[48],"lead":[49],"ungeneralized":[52],"model.":[53],"In":[54],"this":[55],"study,":[56],"different":[57],"balancing":[59,127],"techniques":[60,128],"were":[61,98,120],"applied":[62],"improve":[64],"prediction":[65,130,190],"accuracy":[66],"minority":[69],"class":[70],"while":[71],"maintaining":[72],"satisfactory":[74],"overall":[75],"classification":[76,104,144],"performance.":[77],"Random":[78,81,108],"Over":[79,86],"Sampling,":[80,83,87],"Under":[82],"Synthetic":[84],"Minority":[85],"SMOTE":[88,94,136],"with":[89,95,101,137],"Edited":[90,138],"Nearest":[91,139],"Neighbor":[92,140],"and":[93,110,118,129,167,194],"Tomek":[96],"links":[97],"tested,":[99],"along":[100],"three":[102],"popular":[103],"models:":[105],"Logistic":[106,152],"Regression,":[107],"Forest,":[109],"Multi-Layer":[111],"Perceptron.":[112],"Publicly":[113],"accessible":[114],"datasets":[115],"from":[116],"Tanzania":[117],"India":[119,171],"used":[121],"evaluate":[123],"effectiveness":[125],"models.":[131],"The":[132,181],"results":[133],"indicate":[134],"that":[135],"achieved":[141],"best":[143],"performance":[145],"on":[146],"10-fold":[148],"holdout":[149],"sample.":[150],"Furthermore,":[151],"Regression":[153],"correctly":[154],"classified":[155],"largest":[157],"(57348":[162],"for":[163,169,187],"Uwezo":[165],"dataset":[166],"13430":[168],"dataset)":[172],"using":[173],"confusion":[175],"matrix":[176],"as":[177],"evaluation":[179],"matrix.":[180],"applications":[182],"these":[184],"models":[185],"allow":[186],"precise":[189],"at-risk":[192],"reduction":[196],"rates.":[199]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":18},{"year":2024,"cited_by_count":19},{"year":2023,"cited_by_count":5}],"updated_date":"2025-12-30T23:08:21.542490","created_date":"2025-10-10T00:00:00"}
