{"id":"https://openalex.org/W7140279896","doi":"https://doi.org/10.48550/arxiv.2603.22726","title":"A Study of Scientific Computational Notebook Quality","display_name":"A Study of Scientific Computational Notebook Quality","publication_year":2026,"publication_date":"2026-03-24","ids":{"openalex":"https://openalex.org/W7140279896","doi":"https://doi.org/10.48550/arxiv.2603.22726"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.22726","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.22726","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.22726","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5048781214","display_name":"Shun Kashiwa","orcid":"https://orcid.org/0009-0001-3665-0182"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Kashiwa, Shun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130558725","display_name":"Ayla Kurdak","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kurdak, Ayla","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130608537","display_name":"Savitha Ravi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ravi, Savitha","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130581811","display_name":"Ridhi Srikanth","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Srikanth, Ridhi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130563513","display_name":"Angel Thakur","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Thakur, Angel","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130612953","display_name":"Sonia Chandra","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chandra, Sonia","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130590132","display_name":"Jonathan Truong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Truong, Jonathan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5044646652","display_name":"Michael Coblenz","orcid":"https://orcid.org/0000-0002-9369-4069"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Coblenz, Michael","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5048781214"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.904699981212616,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.904699981212616,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.049800001084804535,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11937","display_name":"Research Data Management Practices","score":0.00559999980032444,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.6858999729156494},{"id":"https://openalex.org/keywords/documentation","display_name":"Documentation","score":0.6743999719619751},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.5361999869346619},{"id":"https://openalex.org/keywords/dependency","display_name":"Dependency (UML)","score":0.4819999933242798},{"id":"https://openalex.org/keywords/source-code","display_name":"Source code","score":0.4438000023365021},{"id":"https://openalex.org/keywords/program-comprehension","display_name":"Program comprehension","score":0.43849998712539673},{"id":"https://openalex.org/keywords/comprehension","display_name":"Comprehension","score":0.3968999981880188}],"concepts":[{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.6858999729156494},{"id":"https://openalex.org/C56666940","wikidata":"https://www.wikidata.org/wiki/Q788790","display_name":"Documentation","level":2,"score":0.6743999719619751},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6661999821662903},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.5361999869346619},{"id":"https://openalex.org/C19768560","wikidata":"https://www.wikidata.org/wiki/Q320727","display_name":"Dependency (UML)","level":2,"score":0.4819999933242798},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.4438000023365021},{"id":"https://openalex.org/C2777561058","wikidata":"https://www.wikidata.org/wiki/Q2652119","display_name":"Program comprehension","level":4,"score":0.43849998712539673},{"id":"https://openalex.org/C511192102","wikidata":"https://www.wikidata.org/wiki/Q5156948","display_name":"Comprehension","level":2,"score":0.3968999981880188},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.3887999951839447},{"id":"https://openalex.org/C81089528","wikidata":"https://www.wikidata.org/wiki/Q5134986","display_name":"clone (Java method)","level":3,"score":0.3628999888896942},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.3596999943256378},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.35929998755455017},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.334199994802475},{"id":"https://openalex.org/C2781083858","wikidata":"https://www.wikidata.org/wiki/Q17327049","display_name":"Scientific literature","level":2,"score":0.3206999897956848},{"id":"https://openalex.org/C150292731","wikidata":"https://www.wikidata.org/wiki/Q1342704","display_name":"Code review","level":5,"score":0.3125999867916107},{"id":"https://openalex.org/C24756922","wikidata":"https://www.wikidata.org/wiki/Q1757694","display_name":"Data quality","level":3,"score":0.302700012922287},{"id":"https://openalex.org/C117447612","wikidata":"https://www.wikidata.org/wiki/Q1412670","display_name":"Software quality","level":4,"score":0.29670000076293945},{"id":"https://openalex.org/C51929080","wikidata":"https://www.wikidata.org/wiki/Q2425187","display_name":"Codebase","level":3,"score":0.2720000147819519},{"id":"https://openalex.org/C140396857","wikidata":"https://www.wikidata.org/wiki/Q16934771","display_name":"Internal documentation","level":5,"score":0.27090001106262207},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2644999921321869}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.22726","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.22726","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.22726","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.22726","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"The":[0,174],"quality":[1,34],"of":[2,46,81,126,137,176],"scientific":[3,25,32,93,163],"code":[4,15,33,48,64,82,94],"is":[5],"a":[6,44],"critical":[7],"concern":[8],"for":[9,192],"the":[10,97,138,190],"research":[11],"community.":[12],"Poorly":[13],"written":[14],"can":[16],"result":[17],"in":[18,60,92,141],"irreproducible":[19],"results,":[20],"incorrect":[21],"findings,":[22],"and":[23,40,79,84,114,131,154,172,184,195,203],"slower":[24],"progress.":[26],"In":[27],"this":[28],"study,":[29],"we":[30,66,100],"evaluate":[31],"across":[35],"three":[36,132],"dimensions:":[37],"reproducibility,":[38],"readability,":[39],"reusability.":[41],"We":[42],"curated":[43],"corpus":[45],"518":[47],"repositories":[49],"by":[50],"analyzing":[51],"Code":[52,117],"Availability":[53],"statements":[54],"from":[55],"all":[56],"1239":[57],"Nature":[58],"publications":[59],"2024.":[61],"To":[62],"assess":[63],"quality,":[65],"employed":[67],"multiple":[68],"methods,":[69],"including":[70],"manual":[71],"attempts":[72],"to":[73,102,110,197],"reproduce":[74],"Jupyter":[75],"notebooks,":[76],"documentation":[77],"reviews,":[78],"analyses":[80],"clones":[83],"mutation":[85,159],"patterns.":[86],"Our":[87],"results":[88],"reveal":[89],"major":[90],"challenges":[91],"quality.":[95],"Of":[96],"19":[98],"notebooks":[99,140,164],"attempted":[101],"execute,":[103],"only":[104],"two":[105],"were":[106],"reproducible,":[107,201],"primarily":[108],"due":[109],"missing":[111],"data":[112,152],"files":[113],"dependency":[115],"issues.":[116],"duplication":[118],"was":[119],"also":[120],"common,":[121],"with":[122],"326":[123],"clone":[124],"classes":[125],"at":[127],"least":[128],"10":[129],"lines":[130],"instances":[133],"found":[134],"among":[135],"637":[136],"1510":[139],"our":[142,158],"corpus.":[143],"These":[144],"duplications":[145],"frequently":[146],"involved":[147],"tasks":[148],"such":[149],"as":[150],"visualization,":[151],"processing,":[153],"statistical":[155],"analysis.":[156],"Moreover,":[157],"analysis":[160],"showed":[161],"that":[162],"often":[165],"exhibit":[166],"tangled":[167,185],"state":[168,186],"changes,":[169],"complicating":[170],"comprehension":[171],"reasoning.":[173],"prevalence":[175],"these":[177],"issues":[178],"--":[179,188],"unreproducible":[180],"code,":[181],"widespread":[182],"duplication,":[183],"management":[187],"underscores":[189],"need":[191],"improved":[193],"tools":[194],"abstractions":[196],"help":[198],"science":[199],"build":[200],"readable":[202],"reusable":[204],"software.":[205]},"counts_by_year":[],"updated_date":"2026-05-05T08:41:31.759640","created_date":"2026-03-26T00:00:00"}
