{"id":"https://openalex.org/W2775447293","doi":"https://doi.org/10.3390/informatics4040045","title":"A Data Quality Strategy to Enable FAIR, Programmatic Access across Large, Diverse Data Collections for High Performance Data Analysis","display_name":"A Data Quality Strategy to Enable FAIR, Programmatic Access across Large, Diverse Data Collections for High Performance Data Analysis","publication_year":2017,"publication_date":"2017-12-13","ids":{"openalex":"https://openalex.org/W2775447293","doi":"https://doi.org/10.3390/informatics4040045","mag":"2775447293"},"language":"en","primary_location":{"id":"doi:10.3390/informatics4040045","is_oa":true,"landing_page_url":"https://doi.org/10.3390/informatics4040045","pdf_url":"https://www.mdpi.com/2227-9709/4/4/45/pdf?version=1513178354","source":{"id":"https://openalex.org/S2738238905","display_name":"Informatics","issn_l":"2227-9709","issn":["2227-9709"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Informatics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.mdpi.com/2227-9709/4/4/45/pdf?version=1513178354","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101957110","display_name":"Ben Evans","orcid":"https://orcid.org/0000-0002-6719-2671"},"institutions":[{"id":"https://openalex.org/I118347636","display_name":"Australian National University","ror":"https://ror.org/019wvm592","country_code":"AU","type":"education","lineage":["https://openalex.org/I118347636"]},{"id":"https://openalex.org/I4210141271","display_name":"National Computational Infrastructure","ror":"https://ror.org/04yx6dh41","country_code":"AU","type":"facility","lineage":["https://openalex.org/I4210141271"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Ben Evans","raw_affiliation_strings":["National Computational Infrastructure, the Australian National University, Acton 2601, Australia"],"raw_orcid":"https://orcid.org/0000-0002-6719-2671","affiliations":[{"raw_affiliation_string":"National Computational Infrastructure, the Australian National University, Acton 2601, Australia","institution_ids":["https://openalex.org/I4210141271","https://openalex.org/I118347636"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042656956","display_name":"K. A. Druken","orcid":"https://orcid.org/0000-0002-9442-5709"},"institutions":[{"id":"https://openalex.org/I118347636","display_name":"Australian National University","ror":"https://ror.org/019wvm592","country_code":"AU","type":"education","lineage":["https://openalex.org/I118347636"]},{"id":"https://openalex.org/I4210141271","display_name":"National Computational Infrastructure","ror":"https://ror.org/04yx6dh41","country_code":"AU","type":"facility","lineage":["https://openalex.org/I4210141271"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Kelsey Druken","raw_affiliation_strings":["National Computational Infrastructure, the Australian National University, Acton 2601, Australia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National Computational Infrastructure, the Australian National University, Acton 2601, Australia","institution_ids":["https://openalex.org/I4210141271","https://openalex.org/I118347636"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017647405","display_name":"Jingbo Wang","orcid":"https://orcid.org/0000-0002-3594-1893"},"institutions":[{"id":"https://openalex.org/I118347636","display_name":"Australian National University","ror":"https://ror.org/019wvm592","country_code":"AU","type":"education","lineage":["https://openalex.org/I118347636"]},{"id":"https://openalex.org/I4210141271","display_name":"National Computational Infrastructure","ror":"https://ror.org/04yx6dh41","country_code":"AU","type":"facility","lineage":["https://openalex.org/I4210141271"]}],"countries":["AU"],"is_corresponding":true,"raw_author_name":"Jingbo Wang","raw_affiliation_strings":["National Computational Infrastructure, the Australian National University, Acton 2601, Australia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National Computational Infrastructure, the Australian National University, Acton 2601, Australia","institution_ids":["https://openalex.org/I4210141271","https://openalex.org/I118347636"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112337713","display_name":"Rui Yang","orcid":"https://orcid.org/0000-0001-8507-5631"},"institutions":[{"id":"https://openalex.org/I118347636","display_name":"Australian National University","ror":"https://ror.org/019wvm592","country_code":"AU","type":"education","lineage":["https://openalex.org/I118347636"]},{"id":"https://openalex.org/I4210141271","display_name":"National Computational Infrastructure","ror":"https://ror.org/04yx6dh41","country_code":"AU","type":"facility","lineage":["https://openalex.org/I4210141271"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Rui Yang","raw_affiliation_strings":["National Computational Infrastructure, the Australian National University, Acton 2601, Australia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National Computational Infrastructure, the Australian National University, Acton 2601, Australia","institution_ids":["https://openalex.org/I4210141271","https://openalex.org/I118347636"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110561873","display_name":"Clare Richards","orcid":null},"institutions":[{"id":"https://openalex.org/I118347636","display_name":"Australian National University","ror":"https://ror.org/019wvm592","country_code":"AU","type":"education","lineage":["https://openalex.org/I118347636"]},{"id":"https://openalex.org/I4210141271","display_name":"National Computational Infrastructure","ror":"https://ror.org/04yx6dh41","country_code":"AU","type":"facility","lineage":["https://openalex.org/I4210141271"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Clare Richards","raw_affiliation_strings":["National Computational Infrastructure, the Australian National University, Acton 2601, Australia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National Computational Infrastructure, the Australian National University, Acton 2601, Australia","institution_ids":["https://openalex.org/I4210141271","https://openalex.org/I118347636"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5004401344","display_name":"Lesley Wyborn","orcid":"https://orcid.org/0000-0001-5976-4943"},"institutions":[{"id":"https://openalex.org/I118347636","display_name":"Australian National University","ror":"https://ror.org/019wvm592","country_code":"AU","type":"education","lineage":["https://openalex.org/I118347636"]},{"id":"https://openalex.org/I4210141271","display_name":"National Computational Infrastructure","ror":"https://ror.org/04yx6dh41","country_code":"AU","type":"facility","lineage":["https://openalex.org/I4210141271"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Lesley Wyborn","raw_affiliation_strings":["National Computational Infrastructure, the Australian National University, Acton 2601, Australia"],"raw_orcid":"https://orcid.org/0000-0001-5976-4943","affiliations":[{"raw_affiliation_string":"National Computational Infrastructure, the Australian National University, Acton 2601, Australia","institution_ids":["https://openalex.org/I4210141271","https://openalex.org/I118347636"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5017647405"],"corresponding_institution_ids":["https://openalex.org/I118347636","https://openalex.org/I4210141271"],"apc_list":{"value":1600,"currency":"CHF","value_usd":1732},"apc_paid":{"value":1600,"currency":"CHF","value_usd":1732},"fwci":1.5188,"has_fulltext":true,"cited_by_count":8,"citation_normalized_percentile":{"value":0.88253307,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":"4","issue":"4","first_page":"45","last_page":"45"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11937","display_name":"Research Data Management Practices","score":0.984000027179718,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11937","display_name":"Research Data Management Practices","score":0.984000027179718,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12157","display_name":"Geochemistry and Geologic Mapping","score":0.9714999794960022,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10770","display_name":"Soil Geostatistics and Mapping","score":0.9408000111579895,"subfield":{"id":"https://openalex.org/subfields/2305","display_name":"Environmental Engineering"},"field":{"id":"https://openalex.org/fields/23","display_name":"Environmental Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/interoperability","display_name":"Interoperability","score":0.7498090863227844},{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.7437527775764465},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7268459796905518},{"id":"https://openalex.org/keywords/standardization","display_name":"Standardization","score":0.634223461151123},{"id":"https://openalex.org/keywords/data-quality","display_name":"Data quality","score":0.5755122900009155},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.522047758102417},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.5145937204360962},{"id":"https://openalex.org/keywords/data-access","display_name":"Data access","score":0.5046180486679077},{"id":"https://openalex.org/keywords/usability","display_name":"Usability","score":0.5022313594818115},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.41062843799591064},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.3228219747543335},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.23087233304977417},{"id":"https://openalex.org/keywords/service","display_name":"Service (business)","score":0.2146182656288147}],"concepts":[{"id":"https://openalex.org/C20136886","wikidata":"https://www.wikidata.org/wiki/Q749647","display_name":"Interoperability","level":2,"score":0.7498090863227844},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.7437527775764465},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7268459796905518},{"id":"https://openalex.org/C188087704","wikidata":"https://www.wikidata.org/wiki/Q369577","display_name":"Standardization","level":2,"score":0.634223461151123},{"id":"https://openalex.org/C24756922","wikidata":"https://www.wikidata.org/wiki/Q1757694","display_name":"Data quality","level":3,"score":0.5755122900009155},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.522047758102417},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.5145937204360962},{"id":"https://openalex.org/C47487241","wikidata":"https://www.wikidata.org/wiki/Q5227230","display_name":"Data access","level":2,"score":0.5046180486679077},{"id":"https://openalex.org/C170130773","wikidata":"https://www.wikidata.org/wiki/Q216378","display_name":"Usability","level":2,"score":0.5022313594818115},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.41062843799591064},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.3228219747543335},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.23087233304977417},{"id":"https://openalex.org/C2780378061","wikidata":"https://www.wikidata.org/wiki/Q25351891","display_name":"Service (business)","level":2,"score":0.2146182656288147},{"id":"https://openalex.org/C136264566","wikidata":"https://www.wikidata.org/wiki/Q159810","display_name":"Economy","level":1,"score":0.0},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C162853370","wikidata":"https://www.wikidata.org/wiki/Q39809","display_name":"Marketing","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.3390/informatics4040045","is_oa":true,"landing_page_url":"https://doi.org/10.3390/informatics4040045","pdf_url":"https://www.mdpi.com/2227-9709/4/4/45/pdf?version=1513178354","source":{"id":"https://openalex.org/S2738238905","display_name":"Informatics","issn_l":"2227-9709","issn":["2227-9709"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Informatics","raw_type":"journal-article"},{"id":"pmh:oai:openresearch-repository.anu.edu.au:1885/307399","is_oa":true,"landing_page_url":"http://hdl.handle.net/1885/307399","pdf_url":"https://openresearch-repository.anu.edu.au/bitstreams/643437bd-6da1-4442-85d1-81e4b4a98b04/download","source":{"id":"https://openalex.org/S4306402539","display_name":"ANU Open Research (Australian National University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I118347636","host_organization_name":"Australian National University","host_organization_lineage":["https://openalex.org/I118347636"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Informatics","raw_type":"Journal article"},{"id":"pmh:oai:doaj.org/article:731777df5b0e4616ba50e20d58921d63","is_oa":false,"landing_page_url":"https://doaj.org/article/731777df5b0e4616ba50e20d58921d63","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Informatics, Vol 4, Iss 4, p 45 (2017)","raw_type":"article"},{"id":"pmh:oai:mdpi.com:/2227-9709/4/4/45/","is_oa":true,"landing_page_url":"https://dx.doi.org/10.3390/informatics4040045","pdf_url":null,"source":{"id":"https://openalex.org/S4306400947","display_name":"MDPI (MDPI AG)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210097602","host_organization_name":"Multidisciplinary Digital Publishing Institute (Switzerland)","host_organization_lineage":["https://openalex.org/I4210097602"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Informatics; Volume 4; Issue 4; Pages: 45","raw_type":"Text"}],"best_oa_location":{"id":"doi:10.3390/informatics4040045","is_oa":true,"landing_page_url":"https://doi.org/10.3390/informatics4040045","pdf_url":"https://www.mdpi.com/2227-9709/4/4/45/pdf?version=1513178354","source":{"id":"https://openalex.org/S2738238905","display_name":"Informatics","issn_l":"2227-9709","issn":["2227-9709"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Informatics","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure","score":0.6000000238418579}],"awards":[],"funders":[{"id":"https://openalex.org/F4320315885","display_name":"Australian Government","ror":"https://ror.org/0314h5y94"},{"id":"https://openalex.org/F4320320386","display_name":"Commonwealth Scientific and Industrial Research Organisation","ror":"https://ror.org/03qn8fb07"},{"id":"https://openalex.org/F4320320431","display_name":"Australian National University","ror":"https://ror.org/019wvm592"},{"id":"https://openalex.org/F4320337351","display_name":"National Cancer Institute","ror":"https://ror.org/040gcmg81"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2775447293.pdf","grobid_xml":"https://content.openalex.org/works/W2775447293.grobid-xml"},"referenced_works_count":6,"referenced_works":["https://openalex.org/W2513244281","https://openalex.org/W2534495653","https://openalex.org/W2559901458","https://openalex.org/W2735983859","https://openalex.org/W2989903325","https://openalex.org/W3012514476"],"related_works":["https://openalex.org/W4238897586","https://openalex.org/W435179959","https://openalex.org/W2619091065","https://openalex.org/W2059640416","https://openalex.org/W1490753184","https://openalex.org/W2284465472","https://openalex.org/W2291782699","https://openalex.org/W1993948687","https://openalex.org/W2011676020","https://openalex.org/W2000169967"],"abstract_inverted_index":{"To":[0,160],"ensure":[1],"seamless,":[2],"programmatic":[3,130,193],"access":[4,136],"to":[5,21,135,155,178,185],"data":[6,29,55,88,163],"for":[7,25,58,147,182,190],"High":[8,60],"Performance":[9,61],"Computing":[10],"(HPC)":[11],"and":[12,30,82,92,98,113,123,146],"analysis":[13,152],"across":[14,94,118],"multiple":[15],"research":[16],"domains,":[17,122],"it":[18],"is":[19,175],"vital":[20],"have":[22,40,106],"a":[23,42,59],"methodology":[24],"standardization":[26],"of":[27,54,78,87,115],"both":[28],"services.":[31,99],"At":[32],"the":[33,102,111,116,119,125,137,173,180,186],"Australian":[34],"National":[35],"Computational":[36],"Infrastructure":[37],"(NCI)":[38],"we":[39,105],"developed":[41],"Data":[43,62],"Quality":[44,66,84],"Strategy":[45],"(DQS)":[46],"that":[47],"currently":[48],"provides":[49],"processes":[50],"for:":[51],"(1)":[52],"Consistency":[53],"structures":[56],"needed":[57],"(HPD)":[63],"platform;":[64],"(2)":[65],"Control":[67],"(QC)":[68],"through":[69,89,154],"compliance":[70],"with":[71],"recognized":[72],"community":[73],"standards;":[74],"(3)":[75],"Benchmarking":[76],"cases":[77],"operational":[79],"performance":[80,93,171],"tests;":[81],"(4)":[83],"Assurance":[85],"(QA)":[86],"demonstrated":[90,124],"functionality":[91],"common":[95],"platforms,":[96],"tools":[97],"By":[100],"implementing":[101],"NCI":[103],"DQS,":[104],"seen":[107],"progressive":[108],"improvement":[109],"in":[110,140,169],"quality":[112],"usefulness":[114],"datasets":[117],"different":[120],"subject":[121],"ease":[126],"by":[127,165],"which":[128],"modern":[129],"methods":[131,153],"can":[132],"be":[133],"used":[134,177],"data,":[138],"either":[139],"situ":[141],"or":[142],"via":[143],"web":[144],"services,":[145],"uses":[148],"ranging":[149],"from":[150],"traditional":[151],"emerging":[156],"machine":[157],"learning":[158],"techniques.":[159],"help":[161],"increase":[162],"re-usability":[164],"broader":[166],"communities,":[167],"particularly":[168],"high":[170],"environments,":[172],"DQS":[174],"also":[176],"identify":[179],"need":[181],"any":[183],"extensions":[184],"relevant":[187],"international":[188],"standards":[189],"interoperability":[191],"and/or":[192],"access.":[194]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":1}],"updated_date":"2026-05-21T06:26:12.895304","created_date":"2025-10-10T00:00:00"}
