{"id":"https://openalex.org/W4409647700","doi":"https://doi.org/10.5334/dsj-2025-013","title":"A Lightweight File System Based Approach to Getting Data Ready for Data Management Solutions","display_name":"A Lightweight File System Based Approach to Getting Data Ready for Data Management Solutions","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4409647700","doi":"https://doi.org/10.5334/dsj-2025-013"},"language":"en","primary_location":{"id":"doi:10.5334/dsj-2025-013","is_oa":true,"landing_page_url":"https://doi.org/10.5334/dsj-2025-013","pdf_url":"https://datascience.codata.org/articles/1853/files/680623a9e70d6.pdf","source":{"id":"https://openalex.org/S62969111","display_name":"Data Science Journal","issn_l":"1683-1470","issn":["1683-1470"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320511","host_organization_name":"Ubiquity Press","host_organization_lineage":["https://openalex.org/P4310320511"],"host_organization_lineage_names":["Ubiquity Press"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Data Science Journal","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://datascience.codata.org/articles/1853/files/680623a9e70d6.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5036797365","display_name":"Albert K. Engstfeld","orcid":"https://orcid.org/0000-0002-9686-3948"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Albert K. Engstfeld","raw_affiliation_strings":[],"raw_orcid":"https://orcid.org/0000-0002-9686-3948","affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082409898","display_name":"Johannes M. Hermann","orcid":"https://orcid.org/0000-0001-7119-1295"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Johannes M. Hermann","raw_affiliation_strings":[],"raw_orcid":"https://orcid.org/0000-0001-7119-1295","affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058877196","display_name":"Nicolas G. H\u00f6rmann","orcid":"https://orcid.org/0000-0001-6944-5575"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nicolas G. H\u00f6rmann","raw_affiliation_strings":[],"raw_orcid":"https://orcid.org/0000-0001-6944-5575","affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5114353305","display_name":"Julian R\u00fcth","orcid":"https://orcid.org/0000-0002-3930-9107"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Julian R\u00fcth","raw_affiliation_strings":[],"raw_orcid":"https://orcid.org/0000-0002-3930-9107","affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5036797365"],"corresponding_institution_ids":[],"apc_list":{"value":350,"currency":"GBP","value_usd":429},"apc_paid":{"value":350,"currency":"GBP","value_usd":429},"fwci":7.1238,"has_fulltext":true,"cited_by_count":2,"citation_normalized_percentile":{"value":0.96200924,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":95,"max":96},"biblio":{"volume":"24","issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11937","display_name":"Research Data Management Practices","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9970999956130981,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7785240411758423},{"id":"https://openalex.org/keywords/data-management","display_name":"Data management","score":0.6073065996170044},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.5697636008262634},{"id":"https://openalex.org/keywords/file-system","display_name":"File system","score":0.47566550970077515},{"id":"https://openalex.org/keywords/data-file","display_name":"Data file","score":0.45244520902633667},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.3545692563056946},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.354171484708786},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.3335392475128174}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7785240411758423},{"id":"https://openalex.org/C1668388","wikidata":"https://www.wikidata.org/wiki/Q1149776","display_name":"Data management","level":2,"score":0.6073065996170044},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.5697636008262634},{"id":"https://openalex.org/C2780940931","wikidata":"https://www.wikidata.org/wiki/Q174989","display_name":"File system","level":2,"score":0.47566550970077515},{"id":"https://openalex.org/C171730128","wikidata":"https://www.wikidata.org/wiki/Q5227290","display_name":"Data file","level":2,"score":0.45244520902633667},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.3545692563056946},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.354171484708786},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.3335392475128174}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.5334/dsj-2025-013","is_oa":true,"landing_page_url":"https://doi.org/10.5334/dsj-2025-013","pdf_url":"https://datascience.codata.org/articles/1853/files/680623a9e70d6.pdf","source":{"id":"https://openalex.org/S62969111","display_name":"Data Science Journal","issn_l":"1683-1470","issn":["1683-1470"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320511","host_organization_name":"Ubiquity Press","host_organization_lineage":["https://openalex.org/P4310320511"],"host_organization_lineage_names":["Ubiquity Press"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Data Science Journal","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:2b3bd5382dc04b1f8f772549e91197bc","is_oa":true,"landing_page_url":"https://doaj.org/article/2b3bd5382dc04b1f8f772549e91197bc","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Data Science Journal, Vol 24, Pp 13-13 (2025)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.5334/dsj-2025-013","is_oa":true,"landing_page_url":"https://doi.org/10.5334/dsj-2025-013","pdf_url":"https://datascience.codata.org/articles/1853/files/680623a9e70d6.pdf","source":{"id":"https://openalex.org/S62969111","display_name":"Data Science Journal","issn_l":"1683-1470","issn":["1683-1470"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320511","host_organization_name":"Ubiquity Press","host_organization_lineage":["https://openalex.org/P4310320511"],"host_organization_lineage_names":["Ubiquity Press"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Data Science Journal","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.5099999904632568,"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4409647700.pdf","grobid_xml":"https://content.openalex.org/works/W4409647700.grobid-xml"},"referenced_works_count":32,"referenced_works":["https://openalex.org/W1895982116","https://openalex.org/W1922832738","https://openalex.org/W2011301426","https://openalex.org/W2063116701","https://openalex.org/W2097398335","https://openalex.org/W2134865903","https://openalex.org/W2135625048","https://openalex.org/W2155354890","https://openalex.org/W2302501749","https://openalex.org/W2342249984","https://openalex.org/W2480733761","https://openalex.org/W2619484455","https://openalex.org/W2737733838","https://openalex.org/W2900930447","https://openalex.org/W2902696364","https://openalex.org/W2994728765","https://openalex.org/W3021229045","https://openalex.org/W3095449883","https://openalex.org/W3099161928","https://openalex.org/W3111427379","https://openalex.org/W3200572611","https://openalex.org/W3209575515","https://openalex.org/W4200089625","https://openalex.org/W4200223120","https://openalex.org/W4205228445","https://openalex.org/W4205738517","https://openalex.org/W4224286679","https://openalex.org/W4293212596","https://openalex.org/W4293768436","https://openalex.org/W4377096557","https://openalex.org/W4386740911","https://openalex.org/W4399849805"],"related_works":["https://openalex.org/W753420207","https://openalex.org/W2353896575","https://openalex.org/W2379000728","https://openalex.org/W2368354671","https://openalex.org/W2389631998","https://openalex.org/W2362483455","https://openalex.org/W2355113374","https://openalex.org/W2391476234","https://openalex.org/W37549629","https://openalex.org/W2113429681"],"abstract_inverted_index":{"According":[0],"to":[1,22,115],"the":[2,53,70,86,111,116,120,140,165,170,177,183,200],"FAIR":[3,99],"(findability,":[4],"accessibility,":[5],"interoperability,":[6],"and":[7,59,62,82,137,150,160,189],"reusability)":[8],"principles,":[9],"scientific":[10],"data":[11,24,61,100,147,153,178,181,195],"should":[12],"always":[13],"be":[14,80],"stored":[15],"with":[16,25,94,148,196],"machine-readable":[17,151],"descriptive":[18],"metadata.":[19,63],"Existing":[20],"solutions":[21],"store":[23],"metadata,":[26,152],"such":[27],"as":[28],"electronic":[29],"lab":[30],"notebooks":[31],"(ELN),":[32],"are":[33,204],"often":[34],"not":[35,39],"readily":[36],"available":[37],"or":[38,45],"sufficiently":[40],"generic":[41],"for":[42,57,163],"arbitrary":[43],"experimental":[44],"computational":[46],"results.":[47],"In":[48],"this":[49],"work,":[50],"we":[51],"present":[52],"open-source":[54],"echemdb":[55],"toolkit":[56,65,112],"creating":[58],"handling":[60],"The":[64,90,191],"is":[66,131],"running":[67],"entirely":[68],"on":[69,85,199],"file":[71,201],"system":[72,202],"level":[73,203],"using":[74,179],"a":[75,98,104,173],"file-based":[76],"approach,":[77],"which":[78],"can":[79],"adopted":[81],"adapted":[83],"locally":[84],"individual":[87],"user&rsquo;s":[88],"workstation.":[89],"approach":[91],"facilitates":[92],"integration":[93],"other":[95],"tools":[96],"in":[97,119],"life":[101],"cycle,":[102],"avoiding":[103],"complicated":[105],"server":[106],"setup.":[107],"This":[108],"also":[109,168],"makes":[110],"more":[113,127],"accessible":[114],"broader":[117],"audience":[118],"research":[121,146,184],"sector":[122],"since":[123],"no":[124],"understanding":[125],"of":[126,139,144,172,186,193],"sophisticated":[128],"database":[129],"technologies":[130],"required.":[132],"We":[133,167],"showcase":[134],"several":[135],"aspects":[136],"applications":[138],"toolkit:":[141],"automatic":[142],"annotation":[143],"raw":[145],"human-":[149],"conversion":[154,188],"into":[155],"standardised":[156],"frictionless":[157],"Data":[158],"Packages,":[159],"an":[161],"API":[162],"exploring":[164],"data.":[166],"illustrate":[169],"creation":[171],"web":[174],"framework":[175],"displaying":[176],"example":[180],"from":[182],"area":[185],"energy":[187],"storage.":[190],"benefits":[192],"storing":[194],"annotations":[197],"already":[198],"discussed.":[205]},"counts_by_year":[{"year":2025,"cited_by_count":2}],"updated_date":"2026-05-06T08:25:59.206177","created_date":"2025-10-10T00:00:00"}
