{"id":"https://openalex.org/W3116910183","doi":"https://doi.org/10.1145/3479575","title":"Enabling Collaborative Data Science Development with the Ballet Framework","display_name":"Enabling Collaborative Data Science Development with the Ballet Framework","publication_year":2021,"publication_date":"2021-10-13","ids":{"openalex":"https://openalex.org/W3116910183","doi":"https://doi.org/10.1145/3479575","mag":"3116910183"},"language":"en","primary_location":{"id":"doi:10.1145/3479575","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3479575","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3479575","source":{"id":"https://openalex.org/S4210183893","display_name":"Proceedings of the ACM on Human-Computer Interaction","issn_l":"2573-0142","issn":["2573-0142"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM on Human-Computer Interaction","raw_type":"journal-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3479575","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103970214","display_name":"Micah J. Smith","orcid":null},"institutions":[{"id":"https://openalex.org/I63966007","display_name":"Massachusetts Institute of Technology","ror":"https://ror.org/042nb2s44","country_code":"US","type":"education","lineage":["https://openalex.org/I63966007"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Micah J. Smith","raw_affiliation_strings":["Massachusetts Institute of Technology, Cambridge, MA, USA"],"affiliations":[{"raw_affiliation_string":"Massachusetts Institute of Technology, Cambridge, MA, USA","institution_ids":["https://openalex.org/I63966007"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033732305","display_name":"J\u00fcrgen Cito","orcid":"https://orcid.org/0000-0001-8619-1271"},"institutions":[{"id":"https://openalex.org/I145847075","display_name":"TU Wien","ror":"https://ror.org/04d836q62","country_code":"AT","type":"education","lineage":["https://openalex.org/I145847075"]}],"countries":["AT"],"is_corresponding":false,"raw_author_name":"J\u00fcrgen Cito","raw_affiliation_strings":["TU Wien, Vienna, Austria"],"affiliations":[{"raw_affiliation_string":"TU Wien, Vienna, Austria","institution_ids":["https://openalex.org/I145847075"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039251903","display_name":"Kelvin Lu","orcid":null},"institutions":[{"id":"https://openalex.org/I63966007","display_name":"Massachusetts Institute of Technology","ror":"https://ror.org/042nb2s44","country_code":"US","type":"education","lineage":["https://openalex.org/I63966007"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Kelvin Lu","raw_affiliation_strings":["Massachusetts Institute of Technology, Cambridge, MA, USA"],"affiliations":[{"raw_affiliation_string":"Massachusetts Institute of Technology, Cambridge, MA, USA","institution_ids":["https://openalex.org/I63966007"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5067352490","display_name":"Kalyan Veeramachaneni","orcid":null},"institutions":[{"id":"https://openalex.org/I63966007","display_name":"Massachusetts Institute of Technology","ror":"https://ror.org/042nb2s44","country_code":"US","type":"education","lineage":["https://openalex.org/I63966007"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Kalyan Veeramachaneni","raw_affiliation_strings":["Massachusetts Institute of Technology, Cambridge, MA, USA"],"affiliations":[{"raw_affiliation_string":"Massachusetts Institute of Technology, Cambridge, MA, USA","institution_ids":["https://openalex.org/I63966007"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5103970214"],"corresponding_institution_ids":["https://openalex.org/I63966007"],"apc_list":null,"apc_paid":null,"fwci":1.9871,"has_fulltext":true,"cited_by_count":8,"citation_normalized_percentile":{"value":0.88412919,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":"5","issue":"CSCW2","first_page":"1","last_page":"39"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.986299991607666,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6743251085281372},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.6645286083221436},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.5632505416870117},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.5593384504318237},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5091013312339783},{"id":"https://openalex.org/keywords/executable","display_name":"Executable","score":0.4977474510669708},{"id":"https://openalex.org/keywords/software-engineering","display_name":"Software engineering","score":0.4924798905849457},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.48674821853637695},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.4834502637386322},{"id":"https://openalex.org/keywords/software-development","display_name":"Software development","score":0.4639975428581238},{"id":"https://openalex.org/keywords/cloud-computing","display_name":"Cloud computing","score":0.42168253660202026},{"id":"https://openalex.org/keywords/automation","display_name":"Automation","score":0.4162721633911133},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.23507067561149597},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.15798380970954895},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.0980159342288971}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6743251085281372},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.6645286083221436},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.5632505416870117},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.5593384504318237},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5091013312339783},{"id":"https://openalex.org/C160145156","wikidata":"https://www.wikidata.org/wiki/Q778586","display_name":"Executable","level":2,"score":0.4977474510669708},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.4924798905849457},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.48674821853637695},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.4834502637386322},{"id":"https://openalex.org/C529173508","wikidata":"https://www.wikidata.org/wiki/Q638608","display_name":"Software development","level":3,"score":0.4639975428581238},{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.42168253660202026},{"id":"https://openalex.org/C115901376","wikidata":"https://www.wikidata.org/wiki/Q184199","display_name":"Automation","level":2,"score":0.4162721633911133},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.23507067561149597},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.15798380970954895},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0980159342288971},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C78519656","wikidata":"https://www.wikidata.org/wiki/Q101333","display_name":"Mechanical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3479575","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3479575","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3479575","source":{"id":"https://openalex.org/S4210183893","display_name":"Proceedings of the ACM on Human-Computer Interaction","issn_l":"2573-0142","issn":["2573-0142"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM on Human-Computer Interaction","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:2012.07816","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2012.07816","pdf_url":"https://arxiv.org/pdf/2012.07816","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"doi:10.1145/3479575","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3479575","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3479575","source":{"id":"https://openalex.org/S4210183893","display_name":"Proceedings of the ACM on Human-Computer Interaction","issn_l":"2573-0142","issn":["2573-0142"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM on Human-Computer Interaction","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1726388308","display_name":null,"funder_award_id":"1761812","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3116910183.pdf","grobid_xml":"https://content.openalex.org/works/W3116910183.grobid-xml"},"referenced_works_count":109,"referenced_works":["https://openalex.org/W959575565","https://openalex.org/W1559060276","https://openalex.org/W1592081868","https://openalex.org/W1612277053","https://openalex.org/W1646083338","https://openalex.org/W1728842521","https://openalex.org/W1745177676","https://openalex.org/W1754293002","https://openalex.org/W1978623209","https://openalex.org/W2036398651","https://openalex.org/W2040915209","https://openalex.org/W2048499643","https://openalex.org/W2066305262","https://openalex.org/W2092939357","https://openalex.org/W2094485533","https://openalex.org/W2096547436","https://openalex.org/W2109306884","https://openalex.org/W2109426455","https://openalex.org/W2120314896","https://openalex.org/W2132862423","https://openalex.org/W2139092060","https://openalex.org/W2144160189","https://openalex.org/W2151245650","https://openalex.org/W2153338628","https://openalex.org/W2157289187","https://openalex.org/W2158685692","https://openalex.org/W2160175301","https://openalex.org/W2161336914","https://openalex.org/W2162565205","https://openalex.org/W2162739315","https://openalex.org/W2182353144","https://openalex.org/W2185914977","https://openalex.org/W2189162242","https://openalex.org/W2257550357","https://openalex.org/W2267596186","https://openalex.org/W2326713822","https://openalex.org/W2341535507","https://openalex.org/W2404161646","https://openalex.org/W2406996511","https://openalex.org/W2460952518","https://openalex.org/W2472803348","https://openalex.org/W2514277889","https://openalex.org/W2559997609","https://openalex.org/W2565167788","https://openalex.org/W2565788456","https://openalex.org/W2584335703","https://openalex.org/W2584781382","https://openalex.org/W2589015465","https://openalex.org/W2736977076","https://openalex.org/W2738647029","https://openalex.org/W2768067395","https://openalex.org/W2771189628","https://openalex.org/W2782471262","https://openalex.org/W2784179836","https://openalex.org/W2784241156","https://openalex.org/W2796040126","https://openalex.org/W2802314367","https://openalex.org/W2804908284","https://openalex.org/W2805836090","https://openalex.org/W2807910285","https://openalex.org/W2898162267","https://openalex.org/W2898457785","https://openalex.org/W2899457449","https://openalex.org/W2913615284","https://openalex.org/W2941766203","https://openalex.org/W2945172243","https://openalex.org/W2946595616","https://openalex.org/W2947593054","https://openalex.org/W2950018712","https://openalex.org/W2963809228","https://openalex.org/W2970533824","https://openalex.org/W2971867419","https://openalex.org/W2972788276","https://openalex.org/W2983901715","https://openalex.org/W2983970366","https://openalex.org/W2983995785","https://openalex.org/W2998216295","https://openalex.org/W3005977564","https://openalex.org/W3009065172","https://openalex.org/W3011307848","https://openalex.org/W3012094108","https://openalex.org/W3013182397","https://openalex.org/W3022734214","https://openalex.org/W3026514254","https://openalex.org/W3029504795","https://openalex.org/W3035597669","https://openalex.org/W3037118121","https://openalex.org/W3037887271","https://openalex.org/W3042177439","https://openalex.org/W3043282784","https://openalex.org/W3085621369","https://openalex.org/W3100055683","https://openalex.org/W3100535899","https://openalex.org/W3104332093","https://openalex.org/W3105704032","https://openalex.org/W3106372104","https://openalex.org/W3120370895","https://openalex.org/W3123489069","https://openalex.org/W3124072882","https://openalex.org/W3125798375","https://openalex.org/W3133702157","https://openalex.org/W3149590808","https://openalex.org/W3160033795","https://openalex.org/W4240935443","https://openalex.org/W4285719527","https://openalex.org/W4287826698","https://openalex.org/W4288086169","https://openalex.org/W4288296172","https://openalex.org/W4392271976"],"related_works":["https://openalex.org/W2350278424","https://openalex.org/W2071432835","https://openalex.org/W4239401009","https://openalex.org/W4234371507","https://openalex.org/W1628824497","https://openalex.org/W4299534542","https://openalex.org/W2053441600","https://openalex.org/W1990401748","https://openalex.org/W2047586841","https://openalex.org/W2141018266"],"abstract_inverted_index":{"While":[0],"the":[1,53],"open-source":[2,59],"software":[3,14,90],"development":[4,72],"model":[5,43],"has":[6],"led":[7],"to":[8,30,44,82,89,109],"successful":[9],"large-scale":[10],"collaborations":[11,34],"in":[12,51],"building":[13],"systems,":[15],"data":[16,32,60],"science":[17,33,61],"projects":[18],"are":[19,86],"frequently":[20],"developed":[21],"by":[22],"individuals":[23],"or":[24],"small":[25],"teams.":[26],"We":[27,47,106],"describe":[28],"challenges":[29],"scaling":[31],"and":[35,40,68,91,95,123],"present":[36],"a":[37,63,83,111],"conceptual":[38],"framework":[39,56],"ML":[41,92],"programming":[42],"address":[45],"them.":[46],"instantiate":[48],"these":[49],"ideas":[50],"Ballet,":[52],"first":[54],"lightweight":[55],"for":[57,126],"collaborative,":[58],"through":[62],"focus":[64],"on":[65],"feature":[66,80,103],"engineering,":[67],"an":[69,101,116],"accompanying":[70],"cloud-based":[71],"environment.":[73],"Using":[74],"our":[75],"framework,":[76],"collaborators":[77],"incrementally":[78],"propose":[79],"definitions":[81],"repository":[84],"which":[85],"each":[87],"subjected":[88],"performance":[93],"validation":[94],"can":[96],"be":[97],"automatically":[98],"merged":[99],"into":[100],"executable":[102],"engineering":[104],"pipeline.":[105],"leverage":[107],"Ballet":[108],"conduct":[110],"case":[112],"study":[113],"analysis":[114],"of":[115,129],"income":[117],"prediction":[118],"problem":[119],"with":[120],"27":[121],"collaborators,":[122],"discuss":[124],"implications":[125],"future":[127],"designers":[128],"collaborative":[130],"projects.":[131]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":4},{"year":2021,"cited_by_count":1}],"updated_date":"2026-03-27T14:29:43.386196","created_date":"2021-01-05T00:00:00"}
