{"id":"https://openalex.org/W7124159279","doi":"https://doi.org/10.1145/3777577.3777583","title":"Towards Data-Driven Chronic Disease Prevention: Interpretable Machine Learning Models for Diabetes Risk Screening","display_name":"Towards Data-Driven Chronic Disease Prevention: Interpretable Machine Learning Models for Diabetes Risk Screening","publication_year":2025,"publication_date":"2025-10-24","ids":{"openalex":"https://openalex.org/W7124159279","doi":"https://doi.org/10.1145/3777577.3777583"},"language":null,"primary_location":{"id":"doi:10.1145/3777577.3777583","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3777577.3777583","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 6th International Symposium on Artificial Intelligence for Medical Sciences","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3777577.3777583","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5077194123","display_name":"Yuejia Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I20942203","display_name":"Hainan University","ror":"https://ror.org/03q648j11","country_code":"CN","type":"education","lineage":["https://openalex.org/I20942203"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yuejia Wang","raw_affiliation_strings":["School of International Tourism and Public Management, Hainan University, Haikou, Hainan, China"],"affiliations":[{"raw_affiliation_string":"School of International Tourism and Public Management, Hainan University, Haikou, Hainan, China","institution_ids":["https://openalex.org/I20942203"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5077194123"],"corresponding_institution_ids":["https://openalex.org/I20942203"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.77285387,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"37","last_page":"44"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11396","display_name":"Artificial Intelligence in Healthcare","score":0.9132999777793884,"subfield":{"id":"https://openalex.org/subfields/3605","display_name":"Health Information Management"},"field":{"id":"https://openalex.org/fields/36","display_name":"Health Professions"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},"topics":[{"id":"https://openalex.org/T11396","display_name":"Artificial Intelligence in Healthcare","score":0.9132999777793884,"subfield":{"id":"https://openalex.org/subfields/3605","display_name":"Health Information Management"},"field":{"id":"https://openalex.org/fields/36","display_name":"Health Professions"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T13702","display_name":"Machine Learning in Healthcare","score":0.019300000742077827,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.004800000227987766,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.635200023651123},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.4869000017642975},{"id":"https://openalex.org/keywords/random-forest","display_name":"Random forest","score":0.4745999872684479},{"id":"https://openalex.org/keywords/logistic-regression","display_name":"Logistic regression","score":0.4366999864578247},{"id":"https://openalex.org/keywords/ensemble-learning","display_name":"Ensemble learning","score":0.4311999976634979},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.3921999931335449},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.37529999017715454},{"id":"https://openalex.org/keywords/predictive-modelling","display_name":"Predictive modelling","score":0.3653999865055084}],"concepts":[{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.8555999994277954},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7731999754905701},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.635200023651123},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5259000062942505},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.4869000017642975},{"id":"https://openalex.org/C169258074","wikidata":"https://www.wikidata.org/wiki/Q245748","display_name":"Random forest","level":2,"score":0.4745999872684479},{"id":"https://openalex.org/C151956035","wikidata":"https://www.wikidata.org/wiki/Q1132755","display_name":"Logistic regression","level":2,"score":0.4366999864578247},{"id":"https://openalex.org/C45942800","wikidata":"https://www.wikidata.org/wiki/Q245652","display_name":"Ensemble learning","level":2,"score":0.4311999976634979},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.3921999931335449},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.37529999017715454},{"id":"https://openalex.org/C45804977","wikidata":"https://www.wikidata.org/wiki/Q7239673","display_name":"Predictive modelling","level":2,"score":0.3653999865055084},{"id":"https://openalex.org/C2779134260","wikidata":"https://www.wikidata.org/wiki/Q12136","display_name":"Disease","level":2,"score":0.3440000116825104},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.33469998836517334},{"id":"https://openalex.org/C555293320","wikidata":"https://www.wikidata.org/wiki/Q12206","display_name":"Diabetes mellitus","level":2,"score":0.3334999978542328},{"id":"https://openalex.org/C2780665704","wikidata":"https://www.wikidata.org/wiki/Q959298","display_name":"Intervention (counseling)","level":2,"score":0.32670000195503235},{"id":"https://openalex.org/C110083411","wikidata":"https://www.wikidata.org/wiki/Q1744628","display_name":"Statistical classification","level":2,"score":0.3208000063896179},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.31029999256134033},{"id":"https://openalex.org/C29825287","wikidata":"https://www.wikidata.org/wiki/Q1427940","display_name":"Warning system","level":2,"score":0.30410000681877136},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.3037000000476837},{"id":"https://openalex.org/C136389625","wikidata":"https://www.wikidata.org/wiki/Q334384","display_name":"Supervised learning","level":3,"score":0.29109999537467957},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.28029999136924744},{"id":"https://openalex.org/C27438332","wikidata":"https://www.wikidata.org/wiki/Q2873","display_name":"Principal component analysis","level":2,"score":0.26649999618530273},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2624000012874603},{"id":"https://openalex.org/C2987552334","wikidata":"https://www.wikidata.org/wiki/Q383126","display_name":"Chronic disease","level":2,"score":0.2612999975681305},{"id":"https://openalex.org/C138816342","wikidata":"https://www.wikidata.org/wiki/Q189603","display_name":"Public health","level":2,"score":0.2524000108242035}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3777577.3777583","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3777577.3777583","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 6th International Symposium on Artificial Intelligence for Medical Sciences","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3777577.3777583","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3777577.3777583","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 6th International Symposium on Artificial Intelligence for Medical Sciences","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":28,"referenced_works":["https://openalex.org/W11436880","https://openalex.org/W2005223325","https://openalex.org/W2021242304","https://openalex.org/W2033590944","https://openalex.org/W2487898712","https://openalex.org/W2748084541","https://openalex.org/W2886677972","https://openalex.org/W2891066988","https://openalex.org/W2948811059","https://openalex.org/W2964087226","https://openalex.org/W2990140544","https://openalex.org/W3019449433","https://openalex.org/W3086465290","https://openalex.org/W3131858067","https://openalex.org/W3179092643","https://openalex.org/W3205154869","https://openalex.org/W4200026682","https://openalex.org/W4205802501","https://openalex.org/W4213156113","https://openalex.org/W4225883733","https://openalex.org/W4377093409","https://openalex.org/W4380987982","https://openalex.org/W4385637657","https://openalex.org/W4387215325","https://openalex.org/W4387425289","https://openalex.org/W4388095729","https://openalex.org/W4391093163","https://openalex.org/W4391166814"],"related_works":[],"abstract_inverted_index":{"With":[0],"the":[1,5,43,76,123,148,179,190,197,211],"continuous":[2],"rise":[3],"in":[4,9,24,35,115,128,171,184,196],"incidence":[6],"of":[7,45,130,181,193,200,213],"diabetes":[8,116,185],"recent":[10],"years,":[11],"establishing":[12],"efficient":[13],"and":[14,28,39,48,66,107,134,141,164,207,217],"accurate":[15],"early":[16],"prediction":[17,172,186],"models":[18],"has":[19],"become":[20],"a":[21,56,168,204],"key":[22,64],"task":[23],"chronic":[25],"disease":[26,214],"prevention":[27],"control.":[29],"Traditional":[30],"statistical":[31],"methods":[32],"face":[33],"limitations":[34],"capturing":[36],"nonlinear":[37],"features":[38],"complex":[40],"interactions,":[41],"necessitating":[42],"adoption":[44],"more":[46],"adaptive":[47],"predictive":[49],"machine":[50,90,194],"learning":[51,91,183,195],"approaches.":[52],"This":[53,174],"study":[54,175],"utilizes":[55],"publicly":[57],"available":[58],"health":[59],"dataset":[60],"from":[61,69],"Kaggle,":[62],"selecting":[63],"clinical":[65],"lifestyle":[67],"indicators":[68],"86,480":[70],"samples.":[71],"To":[72,144],"address":[73],"data":[74,84],"imbalance,":[75],"SMOTE":[77],"method":[78,150],"is":[79,151],"applied,":[80],"followed":[81],"by":[82],"standardized":[83],"processing.":[85],"On":[86],"this":[87],"basis,":[88],"eight":[89],"models\u2014including":[92],"Random":[93],"Forest,":[94],"Logistic":[95],"Regression,":[96],"Support":[97],"Vector":[98],"Machine,":[99],"K-Nearest":[100],"Neighbors,":[101],"Na\u00efve":[102],"Bayes,":[103],"Multilayer":[104],"Perceptron,":[105],"XGBoost,":[106],"LightGBM\u2014are":[108],"constructed":[109],"to":[110],"systematically":[111],"compare":[112],"their":[113],"performance":[114],"prediction.":[117],"The":[118],"experimental":[119],"results":[120],"show":[121],"that":[122],"XGBoost":[124],"model":[125,146],"outperforms":[126],"others":[127],"terms":[129],"accuracy,":[131],"precision,":[132],"recall,":[133],"F1":[135],"score,":[136],"demonstrating":[137],"excellent":[138],"generalization":[139],"capability":[140],"practical":[142],"value.":[143],"enhance":[145],"transparency,":[147],"SHAP":[149],"further":[152],"employed":[153],"for":[154,210],"feature":[155],"interpretation,":[156],"identifying":[157],"variables":[158],"such":[159],"as":[160,166],"HbA1c,":[161],"fasting":[162],"glucose,":[163],"BMI":[165],"playing":[167],"critical":[169],"role":[170],"outcomes.":[173],"not":[176],"only":[177],"verifies":[178],"effectiveness":[180],"ensemble":[182],"but":[187],"also":[188],"demonstrates":[189],"application":[191],"prospects":[192],"intelligent":[198],"development":[199],"public":[201],"health,":[202],"providing":[203],"theoretical":[205],"basis":[206],"technical":[208],"support":[209],"construction":[212],"warning":[215],"systems":[216],"individualized":[218],"intervention":[219],"strategies.":[220]},"counts_by_year":[],"updated_date":"2026-01-15T23:21:31.212559","created_date":"2026-01-15T00:00:00"}
