{"id":"https://openalex.org/W4388018809","doi":"https://doi.org/10.1109/tbdata.2023.3328433","title":"Multilevel Stochastic Optimization for Imputation in Massive Medical Data Records","display_name":"Multilevel Stochastic Optimization for Imputation in Massive Medical Data Records","publication_year":2023,"publication_date":"2023-10-30","ids":{"openalex":"https://openalex.org/W4388018809","doi":"https://doi.org/10.1109/tbdata.2023.3328433"},"language":"en","primary_location":{"id":"doi:10.1109/tbdata.2023.3328433","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tbdata.2023.3328433","pdf_url":null,"source":{"id":"https://openalex.org/S2491400915","display_name":"IEEE Transactions on Big Data","issn_l":"2332-7790","issn":["2332-7790","2372-2096"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Big Data","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5005871534","display_name":"Wenrui Li","orcid":"https://orcid.org/0000-0002-6471-7911"},"institutions":[{"id":"https://openalex.org/I111088046","display_name":"Boston University","ror":"https://ror.org/05qwgg493","country_code":"US","type":"education","lineage":["https://openalex.org/I111088046"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Wenrui Li","raw_affiliation_strings":["Department of Mathematics &#x0026; Statistics, Boston University, Boston, MA, USA"],"affiliations":[{"raw_affiliation_string":"Department of Mathematics &#x0026; Statistics, Boston University, Boston, MA, USA","institution_ids":["https://openalex.org/I111088046"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100357661","display_name":"Xiaoyu Wang","orcid":"https://orcid.org/0009-0000-2707-5019"},"institutions":[{"id":"https://openalex.org/I111088046","display_name":"Boston University","ror":"https://ror.org/05qwgg493","country_code":"US","type":"education","lineage":["https://openalex.org/I111088046"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xiaoyu Wang","raw_affiliation_strings":["Department of Mathematics &#x0026; Statistics, Boston University, Boston, MA, USA"],"affiliations":[{"raw_affiliation_string":"Department of Mathematics &#x0026; Statistics, Boston University, Boston, MA, USA","institution_ids":["https://openalex.org/I111088046"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008996515","display_name":"Yuetian Sun","orcid":"https://orcid.org/0009-0000-4094-1380"},"institutions":[{"id":"https://openalex.org/I111088046","display_name":"Boston University","ror":"https://ror.org/05qwgg493","country_code":"US","type":"education","lineage":["https://openalex.org/I111088046"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yuetian Sun","raw_affiliation_strings":["Department of Mathematics &#x0026; Statistics, Boston University, Boston, MA, USA"],"affiliations":[{"raw_affiliation_string":"Department of Mathematics &#x0026; Statistics, Boston University, Boston, MA, USA","institution_ids":["https://openalex.org/I111088046"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019761838","display_name":"Sne\u017eana Milanovi\u0107","orcid":"https://orcid.org/0000-0002-4160-9221"},"institutions":[{"id":"https://openalex.org/I4210122020","display_name":"Sunovion (United States)","ror":"https://ror.org/030zc7t66","country_code":"US","type":"company","lineage":["https://openalex.org/I4210122020"]},{"id":"https://openalex.org/I867599234","display_name":"Vion Pharmaceuticals (United States)","ror":"https://ror.org/036dfq243","country_code":"US","type":"company","lineage":["https://openalex.org/I867599234"]},{"id":"https://openalex.org/I111088046","display_name":"Boston University","ror":"https://ror.org/05qwgg493","country_code":"US","type":"education","lineage":["https://openalex.org/I111088046"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Snezana Milanovic","raw_affiliation_strings":["Sunovion Pharmaceuticals, Marlborough, MA, USA","Department of Mathematics & Statistics, Boston University, Boston, MA, USA"],"affiliations":[{"raw_affiliation_string":"Sunovion Pharmaceuticals, Marlborough, MA, USA","institution_ids":["https://openalex.org/I867599234","https://openalex.org/I4210122020"]},{"raw_affiliation_string":"Department of Mathematics & Statistics, Boston University, Boston, MA, USA","institution_ids":["https://openalex.org/I111088046"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070448763","display_name":"Mark Kon","orcid":"https://orcid.org/0000-0001-5902-9412"},"institutions":[{"id":"https://openalex.org/I111088046","display_name":"Boston University","ror":"https://ror.org/05qwgg493","country_code":"US","type":"education","lineage":["https://openalex.org/I111088046"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mark Kon","raw_affiliation_strings":["Department of Mathematics &#x0026; Statistics, Boston University, Boston, MA, USA"],"affiliations":[{"raw_affiliation_string":"Department of Mathematics &#x0026; Statistics, Boston University, Boston, MA, USA","institution_ids":["https://openalex.org/I111088046"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5072005545","display_name":"Julio E. Castrill\u00f3n-Cand\u00e1s","orcid":"https://orcid.org/0000-0002-7913-8840"},"institutions":[{"id":"https://openalex.org/I111088046","display_name":"Boston University","ror":"https://ror.org/05qwgg493","country_code":"US","type":"education","lineage":["https://openalex.org/I111088046"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Julio Enrique Castrill\u00f3n-Cand\u00e1s","raw_affiliation_strings":["Department of Mathematics &#x0026; Statistics, Boston University, Boston, MA, USA"],"affiliations":[{"raw_affiliation_string":"Department of Mathematics &#x0026; Statistics, Boston University, Boston, MA, USA","institution_ids":["https://openalex.org/I111088046"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5005871534"],"corresponding_institution_ids":["https://openalex.org/I111088046"],"apc_list":null,"apc_paid":null,"fwci":1.0431,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.79118084,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":"10","issue":"2","first_page":"122","last_page":"131"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10136","display_name":"Statistical Methods and Inference","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/2613","display_name":"Statistics and Probability"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10136","display_name":"Statistical Methods and Inference","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/2613","display_name":"Statistics and Probability"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10243","display_name":"Statistical Methods and Bayesian Inference","score":0.9879000186920166,"subfield":{"id":"https://openalex.org/subfields/2613","display_name":"Statistics and Probability"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10804","display_name":"Health Systems, Economic Evaluations, Quality of Life","score":0.9793999791145325,"subfield":{"id":"https://openalex.org/subfields/2002","display_name":"Economics and Econometrics"},"field":{"id":"https://openalex.org/fields/20","display_name":"Economics, Econometrics and Finance"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7697016000747681},{"id":"https://openalex.org/keywords/kriging","display_name":"Kriging","score":0.5989934206008911},{"id":"https://openalex.org/keywords/healthcare-cost-and-utilization-project","display_name":"Healthcare Cost and Utilization Project","score":0.5595095753669739},{"id":"https://openalex.org/keywords/missing-data","display_name":"Missing data","score":0.5385172963142395},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.46645253896713257},{"id":"https://openalex.org/keywords/imputation","display_name":"Imputation (statistics)","score":0.46456873416900635},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.4342002868652344},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.35184741020202637},{"id":"https://openalex.org/keywords/health-care","display_name":"Health care","score":0.2986615300178528}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7697016000747681},{"id":"https://openalex.org/C81692654","wikidata":"https://www.wikidata.org/wiki/Q225926","display_name":"Kriging","level":2,"score":0.5989934206008911},{"id":"https://openalex.org/C2779195980","wikidata":"https://www.wikidata.org/wiki/Q5691206","display_name":"Healthcare Cost and Utilization Project","level":3,"score":0.5595095753669739},{"id":"https://openalex.org/C9357733","wikidata":"https://www.wikidata.org/wiki/Q6878417","display_name":"Missing data","level":2,"score":0.5385172963142395},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.46645253896713257},{"id":"https://openalex.org/C58041806","wikidata":"https://www.wikidata.org/wiki/Q1660484","display_name":"Imputation (statistics)","level":3,"score":0.46456873416900635},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.4342002868652344},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.35184741020202637},{"id":"https://openalex.org/C160735492","wikidata":"https://www.wikidata.org/wiki/Q31207","display_name":"Health care","level":2,"score":0.2986615300178528},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C50522688","wikidata":"https://www.wikidata.org/wiki/Q189833","display_name":"Economic growth","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tbdata.2023.3328433","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tbdata.2023.3328433","pdf_url":null,"source":{"id":"https://openalex.org/S2491400915","display_name":"IEEE Transactions on Big Data","issn_l":"2332-7790","issn":["2332-7790","2372-2096"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Big Data","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities","score":0.6600000262260437}],"awards":[{"id":"https://openalex.org/G7800798193","display_name":null,"funder_award_id":"1736392","funder_id":"https://openalex.org/F4320335353","funder_display_name":"National Science Foundation of Sri Lanka"}],"funders":[{"id":"https://openalex.org/F4320335353","display_name":"National Science Foundation of Sri Lanka","ror":"https://ror.org/010xaa060"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":56,"referenced_works":["https://openalex.org/W1695563742","https://openalex.org/W1744580911","https://openalex.org/W1822348759","https://openalex.org/W1925362168","https://openalex.org/W1979898537","https://openalex.org/W1983479840","https://openalex.org/W1987837329","https://openalex.org/W2002926750","https://openalex.org/W2033672086","https://openalex.org/W2060528584","https://openalex.org/W2061320421","https://openalex.org/W2071379353","https://openalex.org/W2078536667","https://openalex.org/W2091922944","https://openalex.org/W2100863906","https://openalex.org/W2106698088","https://openalex.org/W2117926105","https://openalex.org/W2127841934","https://openalex.org/W2134843796","https://openalex.org/W2269456039","https://openalex.org/W2480680997","https://openalex.org/W2529827714","https://openalex.org/W2763710617","https://openalex.org/W2792693509","https://openalex.org/W2801457640","https://openalex.org/W2803805253","https://openalex.org/W2890686416","https://openalex.org/W2897852178","https://openalex.org/W2902048196","https://openalex.org/W2962932373","https://openalex.org/W2962942717","https://openalex.org/W2963573392","https://openalex.org/W2964024268","https://openalex.org/W2980495984","https://openalex.org/W3035623224","https://openalex.org/W3037216933","https://openalex.org/W3048225388","https://openalex.org/W3118393384","https://openalex.org/W3144823608","https://openalex.org/W3154878394","https://openalex.org/W3159174445","https://openalex.org/W3170657538","https://openalex.org/W3179164182","https://openalex.org/W3210018692","https://openalex.org/W4288562516","https://openalex.org/W4295126926","https://openalex.org/W4300187280","https://openalex.org/W4300223101","https://openalex.org/W4312258136","https://openalex.org/W6637446835","https://openalex.org/W6676037594","https://openalex.org/W6751145664","https://openalex.org/W6752046673","https://openalex.org/W6752316588","https://openalex.org/W6754349710","https://openalex.org/W6758880176"],"related_works":["https://openalex.org/W2181530120","https://openalex.org/W4211215373","https://openalex.org/W2024529227","https://openalex.org/W2055961818","https://openalex.org/W2903115227","https://openalex.org/W1574575415","https://openalex.org/W3144172081","https://openalex.org/W3179858851","https://openalex.org/W2081476516","https://openalex.org/W2581984549"],"abstract_inverted_index":{"It":[0,150],"has":[1,151],"long":[2],"been":[3],"a":[4,36,44],"recognized":[5],"problem":[6,53],"that":[7,138],"many":[8],"datasets":[9,28],"contain":[10],"significant":[11],"levels":[12],"of":[13,23,54,99,183],"missing":[14],"numerical":[15],"data.":[16],"A":[17],"potentially":[18],"critical":[19],"predicate":[20],"for":[21,75,106,130],"application":[22,98],"machine":[24],"learning":[25,191],"methods":[26,101,157,186],"to":[27,51,102,169,180],"involves":[29],"addressing":[30],"this":[31,34,40,82,111],"problem.":[32],"However,":[33],"is":[35,62,70,85,88,147],"challenging":[37],"task.":[38],"In":[39,73],"paper,":[41],"we":[42],"apply":[43],"recently":[45],"developed":[46],"multi-level":[47,83,140],"stochastic":[48],"optimization":[49],"approach":[50,61,112],"the":[52,76,116,139,160,175,184],"imputation":[55,104],"in":[56,159,172],"massive":[57,107],"medical":[58],"records.":[59],"The":[60],"based":[63],"on":[64,113],"computational":[65],"applied":[66],"mathematics":[67],"techniques":[68],"and":[69,87,91,125,133,146],"highly":[71],"accurate.":[72],"particular,":[74],"Best":[77],"Linear":[78],"Unbiased":[79],"Predictor":[80],"(BLUP)":[81],"formulation":[84],"exact,":[86],"significantly":[89,142],"faster":[90],"more":[92],"numerically":[93,148],"stable.":[94],"This":[95],"permits":[96],"practical":[97],"Kriging":[100],"data":[103,114,121],"problems":[105],"datasets.":[108],"We":[109],"test":[110],"from":[115,163],"National":[117],"Inpatient":[118],"Sample":[119],"(NIS)":[120],"records,":[122],"Healthcare":[123,131],"Cost":[124],"Utilization":[126],"Project":[127],"(HCUP),":[128],"Agency":[129],"Research":[132],"Quality.":[134],"Numerical":[135],"results":[136,176],"show":[137,167],"method":[141],"outperforms":[143],"current":[144],"approaches":[145],"robust.":[149],"superior":[152,179],"accuracy":[153],"as":[154,188],"compared":[155],"with":[156],"recommended":[158],"recent":[161,181],"report":[162],"HCUP.":[164],"Benchmark":[165],"tests":[166],"up":[168],"75%":[170],"reductions":[171],"error.":[173],"Furthermore,":[174],"are":[177],"also":[178],"state":[182],"art":[185],"such":[187],"discriminative":[189],"deep":[190]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2022,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
