{"id":"https://openalex.org/W4320024352","doi":"https://doi.org/10.1109/bigdata55660.2022.10020258","title":"Review of Publically Available Health Big Data Sets","display_name":"Review of Publically Available Health Big Data Sets","publication_year":2022,"publication_date":"2022-12-17","ids":{"openalex":"https://openalex.org/W4320024352","doi":"https://doi.org/10.1109/bigdata55660.2022.10020258"},"language":"en","primary_location":{"id":"doi:10.1109/bigdata55660.2022.10020258","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata55660.2022.10020258","pdf_url":null,"source":{"id":"https://openalex.org/S4363607709","display_name":"2022 IEEE International Conference on Big Data (Big Data)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102854055","display_name":"Dillon Chrimes","orcid":"https://orcid.org/0000-0003-4350-9360"},"institutions":[{"id":"https://openalex.org/I212119943","display_name":"University of Victoria","ror":"https://ror.org/04s5mat29","country_code":"CA","type":"education","lineage":["https://openalex.org/I212119943"]}],"countries":["CA"],"is_corresponding":true,"raw_author_name":"Dillon Chrimes","raw_affiliation_strings":["University of Victoria,School of Health Information Science,Victoria,Canada","School of Health Information Science, University of Victoria, Victoria, Canada"],"affiliations":[{"raw_affiliation_string":"University of Victoria,School of Health Information Science,Victoria,Canada","institution_ids":["https://openalex.org/I212119943"]},{"raw_affiliation_string":"School of Health Information Science, University of Victoria, Victoria, Canada","institution_ids":["https://openalex.org/I212119943"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101584998","display_name":"Chanhee Kim","orcid":"https://orcid.org/0000-0003-0441-4107"},"institutions":[{"id":"https://openalex.org/I212119943","display_name":"University of Victoria","ror":"https://ror.org/04s5mat29","country_code":"CA","type":"education","lineage":["https://openalex.org/I212119943"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Chanhee Kim","raw_affiliation_strings":["University of Victoria,School of Health Information Science,Victoria,Canada","School of Health Information Science, University of Victoria, Victoria, Canada"],"affiliations":[{"raw_affiliation_string":"University of Victoria,School of Health Information Science,Victoria,Canada","institution_ids":["https://openalex.org/I212119943"]},{"raw_affiliation_string":"School of Health Information Science, University of Victoria, Victoria, Canada","institution_ids":["https://openalex.org/I212119943"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5102854055"],"corresponding_institution_ids":["https://openalex.org/I212119943"],"apc_list":null,"apc_paid":null,"fwci":1.0293,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.76754151,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"6625","last_page":"6627"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11396","display_name":"Artificial Intelligence in Healthcare","score":0.9837999939918518,"subfield":{"id":"https://openalex.org/subfields/3605","display_name":"Health Information Management"},"field":{"id":"https://openalex.org/fields/36","display_name":"Health Professions"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T10350","display_name":"Electronic Health Records Systems","score":0.9790999889373779,"subfield":{"id":"https://openalex.org/subfields/3605","display_name":"Health Information Management"},"field":{"id":"https://openalex.org/fields/36","display_name":"Health Professions"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/health-informatics","display_name":"Health informatics","score":0.735168993473053},{"id":"https://openalex.org/keywords/public-health-informatics","display_name":"Public health informatics","score":0.6501753330230713},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6424412131309509},{"id":"https://openalex.org/keywords/informatics","display_name":"Informatics","score":0.6186915636062622},{"id":"https://openalex.org/keywords/usability","display_name":"Usability","score":0.5237381458282471},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.5021977424621582},{"id":"https://openalex.org/keywords/dashboard","display_name":"Dashboard","score":0.4917588531970978},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.45647531747817993},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.4080049395561218},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.40330636501312256},{"id":"https://openalex.org/keywords/public-health","display_name":"Public health","score":0.3778524696826935},{"id":"https://openalex.org/keywords/medicine","display_name":"Medicine","score":0.17831572890281677},{"id":"https://openalex.org/keywords/health-policy","display_name":"Health policy","score":0.13950783014297485},{"id":"https://openalex.org/keywords/international-health","display_name":"International health","score":0.12203732132911682},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.101683109998703}],"concepts":[{"id":"https://openalex.org/C145642194","wikidata":"https://www.wikidata.org/wiki/Q870895","display_name":"Health informatics","level":3,"score":0.735168993473053},{"id":"https://openalex.org/C106476913","wikidata":"https://www.wikidata.org/wiki/Q7257747","display_name":"Public health informatics","level":5,"score":0.6501753330230713},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6424412131309509},{"id":"https://openalex.org/C191630685","wikidata":"https://www.wikidata.org/wiki/Q4027615","display_name":"Informatics","level":2,"score":0.6186915636062622},{"id":"https://openalex.org/C170130773","wikidata":"https://www.wikidata.org/wiki/Q216378","display_name":"Usability","level":2,"score":0.5237381458282471},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.5021977424621582},{"id":"https://openalex.org/C33499554","wikidata":"https://www.wikidata.org/wiki/Q1417134","display_name":"Dashboard","level":2,"score":0.4917588531970978},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.45647531747817993},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4080049395561218},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.40330636501312256},{"id":"https://openalex.org/C138816342","wikidata":"https://www.wikidata.org/wiki/Q189603","display_name":"Public health","level":2,"score":0.3778524696826935},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.17831572890281677},{"id":"https://openalex.org/C47344431","wikidata":"https://www.wikidata.org/wiki/Q1519812","display_name":"Health policy","level":3,"score":0.13950783014297485},{"id":"https://openalex.org/C193395930","wikidata":"https://www.wikidata.org/wiki/Q3247219","display_name":"International health","level":4,"score":0.12203732132911682},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.101683109998703},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.0},{"id":"https://openalex.org/C159110408","wikidata":"https://www.wikidata.org/wiki/Q121176","display_name":"Nursing","level":1,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bigdata55660.2022.10020258","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata55660.2022.10020258","pdf_url":null,"source":{"id":"https://openalex.org/S4363607709","display_name":"2022 IEEE International Conference on Big Data (Big Data)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320310932","display_name":"University of Victoria","ror":"https://ror.org/04s5mat29"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":9,"referenced_works":["https://openalex.org/W1871443204","https://openalex.org/W2010911732","https://openalex.org/W2018827783","https://openalex.org/W2162800060","https://openalex.org/W2994011281","https://openalex.org/W3195621356","https://openalex.org/W3213293058","https://openalex.org/W4239720002","https://openalex.org/W6770964161"],"related_works":["https://openalex.org/W2993510912","https://openalex.org/W4309825515","https://openalex.org/W3171051968","https://openalex.org/W144292345","https://openalex.org/W2320523353","https://openalex.org/W2328348909","https://openalex.org/W2524836550","https://openalex.org/W2114696480","https://openalex.org/W3124660266","https://openalex.org/W3165531497"],"abstract_inverted_index":{"There":[0],"is":[1,392],"a":[2,43,255,269,384],"growing":[3],"interest":[4],"in":[5,29,54,216,238,305,383,406],"using":[6,147,170],"public":[7,59,116],"data":[8,27,48,51,60,121,129,141,165,180,188,200,206,219,240,244,263,300,319,337,355,361],"for":[9,90,291,315,320,398,403],"open":[10],"government":[11],"policy":[12],"involving":[13],"health":[14,30,37,125,149,158,316,363,407],"informatics":[15,31,150,159,364],"and":[16,42,105,160,211,223,229,231,253,289,312,326,349,365],"healthcare":[17,40,161,366],"systems.":[18],"This":[19],"paper":[20],"investigated":[21],"the":[22,77,148,155,173,178,204,217,227,262,277,381],"characteristics":[23],"of":[24,45,58,157,177,187,260,280,299,360,387],"publically":[25],"available":[26],"sets":[28,61,122,130,166,181,220,298,338,356],"that":[32,62,81,119,131,135,266],"were":[33,79,144,167,182,190,221,286,323,344],"derived":[34],"from":[35,137,183,276,324,345],"electronic":[36,310],"records":[38,311],"(EHRs),":[39],"systems,":[41,162],"variety":[44],"open-government":[46],"libraries,":[47],"marts,":[49],"or":[50],"catalogues.Data":[52],"used":[53,80,268,303],"this":[55],"study":[56],"consisted":[57],"did":[63],"not":[64],"require":[65],"any":[66,214],"registration":[67],"to":[68,124,192,251,264,333,341,379,394,400],"access":[69],"online.":[70],"In":[71],"total,":[72],"nine":[73,373],"web-based":[74],"platforms":[75,112,374],"on":[76,226],"Internet":[78],"included:":[82],"British":[83],"Columbia":[84],"(BC)":[85],"Data":[86,270,285,351],"Catalogue,":[87,352],"Canadian":[88],"Institute":[89],"Health":[91],"Information":[92],"(CIHI),":[93],"Harvard":[94],"Dataverse,":[95,347],"MIMIC-eICU,":[96,325],"FigShare,":[97,346],"GitHub,":[98],"Google":[99],"Dataset,":[100],"UCI":[101],"Machine":[102],"Learning":[103],"Repository,":[104],"Zenodo.":[106],"Our":[107],"initial":[108],"search":[109,133,151,377],"across":[110],"these":[111,242],"found":[113,127,146,168],"over":[114],"10,000":[115],"use":[117],"files":[118,402],"had":[120,203],"related":[123,362],"informatics.We":[126],"558":[128,218],"matched":[132],"criterion":[134],"ranged":[136],"years":[138],"2013-2022.":[139],"The":[140,185,194,336],"source":[142],"types":[143],"mostly":[145],"filters":[152],"followed":[153,208],"by":[154,197,209],"combination":[156],"but":[163],"fewer":[164],"when":[169],"EHR":[171],"as":[172],"criterion.":[174],"Almost":[175],"85%":[176],"total":[179],"2020-2022.":[184],"range":[186],"sizes":[189],"11KB":[191],"7.8MB.":[193],"eICU":[195],"(hosted":[196],"MIT\u2019s":[198],"MIMIC":[199],"mart)":[201],"platform":[202],"largest":[205],"set":[207],"Zenodo,":[210],"GitHub.":[212],"Additionally,":[213],"bioinformatics":[215],"excluded":[222],"further":[224,247],"classification":[225],"content":[228],"usability,":[230],"dashboard":[232,256,321],"visualization":[233,397],"towards":[234],"experiential":[235,404],"learning":[236,405],"resulted":[237],"117":[239,243],"sets.Of":[241],"sets,":[245],"we":[246],"tested":[248],"their":[249],"usability":[250,322,343,359],"graph":[252],"create":[254],"within":[257],"2-5":[258],"minutes":[259],"loading":[261],"Tableau\u00a9":[265],"then":[267],"Usability":[271,282],"Scale":[272,283],"(DUS)":[273],"scoring":[274],"developed":[275],"industry":[278],"standard":[279],"System":[281],"(SUS).":[284],"deemed":[287],"usable":[288],"useful":[290],">60%":[292],"average":[293],"DUS":[294],"scoring.":[295],"Finally,":[296],"25":[297,354],"could":[301],"be":[302],"effectively":[304],"classroom":[306],"exercises":[307],"dealing":[308],"with":[309,339,357],"decision":[313],"support":[314],"care.":[317],"Best":[318],"other":[327],"websites":[328],"like":[329],"Zenodo":[330],"produced":[331],"low":[332,340],"high":[334,358],"usability.":[335,370],"poor":[342],"CIHI,":[348],"BC":[350],"respectively.Overall,":[353],"systems":[367],"showed":[368,375],"60-85%":[369],"Moreover,":[371],"all":[372],"ease-of-use":[376],"patterns":[378],"establish":[380],"criteria":[382],"short":[385],"amount":[386],"time.":[388],"However,":[389],"more":[390],"investigation":[391],"needed":[393],"compare":[395],"data-to-dashboard":[396],"single":[399],"multiple":[401],"informatics.":[408]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2}],"updated_date":"2026-01-13T01:12:25.745995","created_date":"2025-10-10T00:00:00"}
