{"id":"https://openalex.org/W4409139488","doi":"https://doi.org/10.1186/s40537-025-01142-5","title":"Evaluation of predictive performance of modeling hyperuricemia using medical big data: comparison of data preprocessing methods","display_name":"Evaluation of predictive performance of modeling hyperuricemia using medical big data: comparison of data preprocessing methods","publication_year":2025,"publication_date":"2025-04-03","ids":{"openalex":"https://openalex.org/W4409139488","doi":"https://doi.org/10.1186/s40537-025-01142-5"},"language":"en","primary_location":{"id":"doi:10.1186/s40537-025-01142-5","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s40537-025-01142-5","pdf_url":"https://link.springer.com/content/pdf/10.1186/s40537-025-01142-5.pdf","source":{"id":"https://openalex.org/S2737955091","display_name":"Journal Of Big Data","issn_l":"2196-1115","issn":["2196-1115"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Big Data","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://link.springer.com/content/pdf/10.1186/s40537-025-01142-5.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5046543311","display_name":"Luwei Li","orcid":null},"institutions":[{"id":"https://openalex.org/I176134282","display_name":"Guilin Medical University","ror":"https://ror.org/000prga03","country_code":"CN","type":"education","lineage":["https://openalex.org/I176134282"]},{"id":"https://openalex.org/I4210126060","display_name":"First Affiliated Hospital of GuangXi Medical University","ror":"https://ror.org/030sc3x20","country_code":"CN","type":"healthcare","lineage":["https://openalex.org/I4210126060"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Luwei Li","raw_affiliation_strings":["Department of Rheumatology and Immunology, Guangxi Hospital Division of The First Affiliated Hospital, Sun Yat-sen University, Nanning, Guangxi, China","Guilin Medical University, Guilin, Guangxi, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Rheumatology and Immunology, Guangxi Hospital Division of The First Affiliated Hospital, Sun Yat-sen University, Nanning, Guangxi, China","institution_ids":["https://openalex.org/I4210126060"]},{"raw_affiliation_string":"Guilin Medical University, Guilin, Guangxi, China","institution_ids":["https://openalex.org/I176134282"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102578791","display_name":"Xian Huang","orcid":null},"institutions":[{"id":"https://openalex.org/I4210126060","display_name":"First Affiliated Hospital of GuangXi Medical University","ror":"https://ror.org/030sc3x20","country_code":"CN","type":"healthcare","lineage":["https://openalex.org/I4210126060"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xian Huang","raw_affiliation_strings":["Department of Rheumatology and Immunology, Guangxi Hospital Division of The First Affiliated Hospital, Sun Yat-sen University, Nanning, Guangxi, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Rheumatology and Immunology, Guangxi Hospital Division of The First Affiliated Hospital, Sun Yat-sen University, Nanning, Guangxi, China","institution_ids":["https://openalex.org/I4210126060"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Cijin Yan","orcid":null},"institutions":[{"id":"https://openalex.org/I4210126060","display_name":"First Affiliated Hospital of GuangXi Medical University","ror":"https://ror.org/030sc3x20","country_code":"CN","type":"healthcare","lineage":["https://openalex.org/I4210126060"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Cijin Yan","raw_affiliation_strings":["Department of Endocrinology, Guangxi Hospital Division of The First Affiliated Hospital, Sun Yat-sen University, Nanning, Guangxi, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Endocrinology, Guangxi Hospital Division of The First Affiliated Hospital, Sun Yat-sen University, Nanning, Guangxi, China","institution_ids":["https://openalex.org/I4210126060"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011186506","display_name":"Shan He","orcid":"https://orcid.org/0000-0003-1694-1465"},"institutions":[{"id":"https://openalex.org/I4210126060","display_name":"First Affiliated Hospital of GuangXi Medical University","ror":"https://ror.org/030sc3x20","country_code":"CN","type":"healthcare","lineage":["https://openalex.org/I4210126060"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shuzhan He","raw_affiliation_strings":["Department of Endocrinology, Guangxi Hospital Division of The First Affiliated Hospital, Sun Yat-sen University, Nanning, Guangxi, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Endocrinology, Guangxi Hospital Division of The First Affiliated Hospital, Sun Yat-sen University, Nanning, Guangxi, China","institution_ids":["https://openalex.org/I4210126060"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Sishuai Cheng","orcid":null},"institutions":[{"id":"https://openalex.org/I176134282","display_name":"Guilin Medical University","ror":"https://ror.org/000prga03","country_code":"CN","type":"education","lineage":["https://openalex.org/I176134282"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Sishuai Cheng","raw_affiliation_strings":["Guilin Medical University, Guilin, Guangxi, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Guilin Medical University, Guilin, Guangxi, China","institution_ids":["https://openalex.org/I176134282"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5010466648","display_name":"Wenjie Yang","orcid":"https://orcid.org/0000-0002-3959-5043"},"institutions":[{"id":"https://openalex.org/I4210126060","display_name":"First Affiliated Hospital of GuangXi Medical University","ror":"https://ror.org/030sc3x20","country_code":"CN","type":"healthcare","lineage":["https://openalex.org/I4210126060"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"WenJie Yang","raw_affiliation_strings":["Department of Hematology, Guangxi Hospital Division of The First Affiliated Hospital, Sun Yat-sen University, Nanning, Guangxi, China","Guangxi Hospital Division of The First Affiliated Hospital, Sun Yat-sen University, No. 3, FoZiLing Road, Qingxiu District, Nanning, Guangxi, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Hematology, Guangxi Hospital Division of The First Affiliated Hospital, Sun Yat-sen University, Nanning, Guangxi, China","institution_ids":["https://openalex.org/I4210126060"]},{"raw_affiliation_string":"Guangxi Hospital Division of The First Affiliated Hospital, Sun Yat-sen University, No. 3, FoZiLing Road, Qingxiu District, Nanning, Guangxi, China","institution_ids":["https://openalex.org/I4210126060"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5010466648"],"corresponding_institution_ids":["https://openalex.org/I4210126060"],"apc_list":{"value":1060,"currency":"GBP","value_usd":1300},"apc_paid":{"value":1060,"currency":"GBP","value_usd":1300},"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.06649349,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"12","issue":"1","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11396","display_name":"Artificial Intelligence in Healthcare","score":0.9937000274658203,"subfield":{"id":"https://openalex.org/subfields/3605","display_name":"Health Information Management"},"field":{"id":"https://openalex.org/fields/36","display_name":"Health Professions"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},"topics":[{"id":"https://openalex.org/T11396","display_name":"Artificial Intelligence in Healthcare","score":0.9937000274658203,"subfield":{"id":"https://openalex.org/subfields/3605","display_name":"Health Information Management"},"field":{"id":"https://openalex.org/fields/36","display_name":"Health Professions"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T12647","display_name":"Traditional Chinese Medicine Studies","score":0.9671000242233276,"subfield":{"id":"https://openalex.org/subfields/2707","display_name":"Complementary and alternative medicine"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T11636","display_name":"Artificial Intelligence in Healthcare and Education","score":0.9398000240325928,"subfield":{"id":"https://openalex.org/subfields/2718","display_name":"Health Informatics"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8122386932373047},{"id":"https://openalex.org/keywords/hyperuricemia","display_name":"Hyperuricemia","score":0.7799460887908936},{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.7365915775299072},{"id":"https://openalex.org/keywords/preprocessor","display_name":"Preprocessor","score":0.6596850156784058},{"id":"https://openalex.org/keywords/data-pre-processing","display_name":"Data pre-processing","score":0.5763903856277466},{"id":"https://openalex.org/keywords/computational-science-and-engineering","display_name":"Computational Science and Engineering","score":0.5620032548904419},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.5006453990936279},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.36319130659103394},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3520011901855469},{"id":"https://openalex.org/keywords/uric-acid","display_name":"Uric acid","score":0.18345212936401367},{"id":"https://openalex.org/keywords/internal-medicine","display_name":"Internal medicine","score":0.1346994936466217},{"id":"https://openalex.org/keywords/medicine","display_name":"Medicine","score":0.11755242943763733}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8122386932373047},{"id":"https://openalex.org/C2779721657","wikidata":"https://www.wikidata.org/wiki/Q49970","display_name":"Hyperuricemia","level":3,"score":0.7799460887908936},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.7365915775299072},{"id":"https://openalex.org/C34736171","wikidata":"https://www.wikidata.org/wiki/Q918333","display_name":"Preprocessor","level":2,"score":0.6596850156784058},{"id":"https://openalex.org/C10551718","wikidata":"https://www.wikidata.org/wiki/Q5227332","display_name":"Data pre-processing","level":2,"score":0.5763903856277466},{"id":"https://openalex.org/C68597687","wikidata":"https://www.wikidata.org/wiki/Q362601","display_name":"Computational Science and Engineering","level":2,"score":0.5620032548904419},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5006453990936279},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.36319130659103394},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3520011901855469},{"id":"https://openalex.org/C2779881121","wikidata":"https://www.wikidata.org/wiki/Q105522","display_name":"Uric acid","level":2,"score":0.18345212936401367},{"id":"https://openalex.org/C126322002","wikidata":"https://www.wikidata.org/wiki/Q11180","display_name":"Internal medicine","level":1,"score":0.1346994936466217},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.11755242943763733}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1186/s40537-025-01142-5","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s40537-025-01142-5","pdf_url":"https://link.springer.com/content/pdf/10.1186/s40537-025-01142-5.pdf","source":{"id":"https://openalex.org/S2737955091","display_name":"Journal Of Big Data","issn_l":"2196-1115","issn":["2196-1115"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Big Data","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:cbf24dd159a44d43b0174c78ff7a0b48","is_oa":true,"landing_page_url":"https://doaj.org/article/cbf24dd159a44d43b0174c78ff7a0b48","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Journal of Big Data, Vol 12, Iss 1, Pp 1-17 (2025)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1186/s40537-025-01142-5","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s40537-025-01142-5","pdf_url":"https://link.springer.com/content/pdf/10.1186/s40537-025-01142-5.pdf","source":{"id":"https://openalex.org/S2737955091","display_name":"Journal Of Big Data","issn_l":"2196-1115","issn":["2196-1115"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Big Data","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320328746","display_name":"Guilin Medical University","ror":"https://ror.org/000prga03"}],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4409139488.pdf"},"referenced_works_count":15,"referenced_works":["https://openalex.org/W184439366","https://openalex.org/W1631476648","https://openalex.org/W2177870565","https://openalex.org/W2576404523","https://openalex.org/W2799442961","https://openalex.org/W2800769566","https://openalex.org/W2916559661","https://openalex.org/W3009207988","https://openalex.org/W3166346970","https://openalex.org/W3193743240","https://openalex.org/W3193901151","https://openalex.org/W4283710895","https://openalex.org/W4320921006","https://openalex.org/W4365483206","https://openalex.org/W4383501045"],"related_works":["https://openalex.org/W2989490741","https://openalex.org/W3092506759","https://openalex.org/W2367545121","https://openalex.org/W4248881655","https://openalex.org/W2482165163","https://openalex.org/W3010890513","https://openalex.org/W120741642","https://openalex.org/W138569904","https://openalex.org/W2390914021","https://openalex.org/W2389417819"],"abstract_inverted_index":{"Using":[0],"medical":[1,373],"big":[2,374],"data":[3,16,37,42,70,74,91,124,384],"from":[4,43,54,75,78],"two":[5,34,148,177],"large-scale":[6],"populations,":[7],"a":[8,18,65,86,195,244],"prediction":[9,19,313],"model":[10,20,356,365,392],"for":[11,21,192,385],"continuous":[12,111,119,186,238,294,309,354,379],"variables":[13,23,112,120,199,224,239,248,264,268],"of":[14,32,36,48,67,88,110,146,175,184,197,206,215,231,237,246,255,262,275,280,284,301,319,330,340,352,361,371,382],"raw":[15,115,123,383],"and":[17,98,132,159,172,289,315,322,337,343,417],"categorical":[22,130,217,263,302,332,363,397],"after":[24,190,400],"assignment":[25,412],"were":[26,58,92,102,125,163],"constructed":[27],"to":[28,56,80,104,128,141,165],"evaluate":[29,167],"the":[30,33,44,61,83,108,114,118,122,138,143,147,168,176,180,185,204,211,216,229,233,241,253,273,281,308,316,320,331,341,349,353,362,368,378,396,403],"performance":[31,393],"forms":[35],"preprocessing":[38],"models.":[39,149,178],"Partial":[40],"population":[41,69,73,90],"physical":[45],"examination":[46],"center":[47],"Guilin":[49],"Medical":[50],"University":[51],"Affiliated":[52],"Hospital":[53],"2017":[55],"2019":[57],"selected":[59],"as":[60,82,407],"modeling":[62,188,219,321,342],"group,":[63,85],"with":[64,293],"total":[66,87,196,245],"22,124":[68],"included.":[71,93],"Selecting":[72],"NHANES":[76],"database":[77],"1998":[79],"2018":[81],"control":[84],"28,021":[89],"Logistic":[94,181,212,234,259,285],"regression,":[95],"LightGBM":[96,287],"model,":[97],"Deep":[99,290],"Neural":[100,291],"Network":[101],"used":[103],"predict":[105],"hyperuricemia":[106,372],"in":[107,113,121,203,228,240,252,272,390],"form":[109,381,399],"data.":[116],"Then,":[117],"assigned":[126],"values":[127,145,279],"become":[129],"variables,":[131],"statistical":[133,201,226,250,270,369,386,416],"analysis":[134,162,183,214,236,261,370,387],"was":[135],"performed":[136,164],"using":[137,377,395],"same":[139],"algorithm":[140],"obtain":[142],"predicted":[144],"ROC":[150,282],"curve":[151,154,157,161,312,314,318,336,339],"analysis,":[152,155,158],"Calibration":[153],"DCA":[156,335],"CIC":[160,338],"comprehensively":[166],"accuracy,":[169],"discriminatory":[170],"ability,":[171],"clinical":[173,350,418],"practicality":[174,351],"In":[179,367],"regression":[182,213,235,260],"variable":[187,218,295,310,355,364,380,398],"group":[189,220],"controlling":[191],"confounding":[193],"factors,":[194],"11":[198],"showed":[200,221,249,265],"significance":[202,227,251,271],"incidence":[205,230,254,274],"hyperuricemia.":[207,256,276],"After":[208,257],"assigning":[209],"values,":[210],"that":[222,266,329,348,360],"9":[223],"had":[225,269],"hyperuricemia.In":[232],"validation":[242,323,344],"set,":[243],"8":[247],"assignment,":[258],"10":[267],"The":[277,304,334],"AUC":[278],"curves":[283],"models,":[286,288],"Networks":[292],"types":[296],"are":[297],"higher":[298,358],"than":[299,328,359,394],"those":[300],"variables.":[303,333],"average":[305],"deviation":[306],"between":[307],"calibration":[311],"standard":[317],"groups":[324,345],"is":[325,357],"generally":[326],"lower":[327],"both":[346],"show":[347],"group.":[366],"data,":[375],"directly":[376],"may":[388,413],"result":[389],"better":[391],"assignment.":[401],"However,":[402],"relevant":[404],"parameters":[405],"such":[406],"OR":[408],"value":[409],"obtained":[410],"through":[411],"have":[414],"greater":[415],"guidance":[419],"significance.":[420]},"counts_by_year":[],"updated_date":"2026-05-06T08:25:59.206177","created_date":"2025-10-10T00:00:00"}
