{"id":"https://openalex.org/W3135371071","doi":"https://doi.org/10.1145/3442188.3445918","title":"Towards Accountability for Machine Learning Datasets: Practices from Software Engineering and Infrastructure","display_name":"Towards Accountability for Machine Learning Datasets: Practices from Software Engineering and Infrastructure","publication_year":2021,"publication_date":"2021-03-01","ids":{"openalex":"https://openalex.org/W3135371071","doi":"https://doi.org/10.1145/3442188.3445918","mag":"3135371071"},"language":"en","primary_location":{"id":"doi:10.1145/3442188.3445918","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3442188.3445918","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3442188.3445918","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2021 ACM Conference on Fairness, Accountability, and Transparency","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3442188.3445918","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5071599724","display_name":"Ben Hutchinson","orcid":"https://orcid.org/0000-0003-2253-6204"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Ben Hutchinson","raw_affiliation_strings":[""],"affiliations":[{"raw_affiliation_string":"","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077833261","display_name":"Andrew Smart","orcid":"https://orcid.org/0000-0002-9816-7348"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Andrew Smart","raw_affiliation_strings":[""],"affiliations":[{"raw_affiliation_string":"","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025947434","display_name":"Alex Hanna","orcid":"https://orcid.org/0000-0002-8957-0813"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Alex Hanna","raw_affiliation_strings":[""],"affiliations":[{"raw_affiliation_string":"","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045383831","display_name":"Emily Denton","orcid":"https://orcid.org/0000-0003-4915-0512"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Remi Denton","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041666220","display_name":"Christina Greer","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Christina Greer","raw_affiliation_strings":[""],"affiliations":[{"raw_affiliation_string":"","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024402566","display_name":"Oddur Kjartansson","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Oddur Kjartansson","raw_affiliation_strings":[""],"affiliations":[{"raw_affiliation_string":"","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001087250","display_name":"Parker Barnes","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Parker Barnes","raw_affiliation_strings":[""],"affiliations":[{"raw_affiliation_string":"","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5046235098","display_name":"Margaret Mitchell","orcid":"https://orcid.org/0000-0001-7043-6545"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Margaret Mitchell","raw_affiliation_strings":[""],"affiliations":[{"raw_affiliation_string":"","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5071599724"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":35.346,"has_fulltext":true,"cited_by_count":230,"citation_normalized_percentile":{"value":0.99915141,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"560","last_page":"575"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.9957000017166138,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11891","display_name":"Big Data and Business Intelligence","score":0.9951000213623047,"subfield":{"id":"https://openalex.org/subfields/1404","display_name":"Management Information Systems"},"field":{"id":"https://openalex.org/fields/14","display_name":"Business, Management and Accounting"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/accountability","display_name":"Accountability","score":0.8310607075691223},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7108843922615051},{"id":"https://openalex.org/keywords/transparency","display_name":"Transparency (behavior)","score":0.7011008858680725},{"id":"https://openalex.org/keywords/software-deployment","display_name":"Software deployment","score":0.5412963628768921},{"id":"https://openalex.org/keywords/deliberation","display_name":"Deliberation","score":0.5046032667160034},{"id":"https://openalex.org/keywords/knowledge-management","display_name":"Knowledge management","score":0.4946725070476532},{"id":"https://openalex.org/keywords/process-management","display_name":"Process management","score":0.4852299690246582},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.443929523229599},{"id":"https://openalex.org/keywords/audit","display_name":"Audit","score":0.43655189871788025},{"id":"https://openalex.org/keywords/risk-analysis","display_name":"Risk analysis (engineering)","score":0.3324708342552185},{"id":"https://openalex.org/keywords/software-engineering","display_name":"Software engineering","score":0.2988021969795227},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.19762268662452698},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.13212618231773376},{"id":"https://openalex.org/keywords/business","display_name":"Business","score":0.11121487617492676}],"concepts":[{"id":"https://openalex.org/C2776007630","wikidata":"https://www.wikidata.org/wiki/Q2798912","display_name":"Accountability","level":2,"score":0.8310607075691223},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7108843922615051},{"id":"https://openalex.org/C2780233690","wikidata":"https://www.wikidata.org/wiki/Q535347","display_name":"Transparency (behavior)","level":2,"score":0.7011008858680725},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.5412963628768921},{"id":"https://openalex.org/C2776946740","wikidata":"https://www.wikidata.org/wiki/Q358652","display_name":"Deliberation","level":3,"score":0.5046032667160034},{"id":"https://openalex.org/C56739046","wikidata":"https://www.wikidata.org/wiki/Q192060","display_name":"Knowledge management","level":1,"score":0.4946725070476532},{"id":"https://openalex.org/C195094911","wikidata":"https://www.wikidata.org/wiki/Q14167904","display_name":"Process management","level":1,"score":0.4852299690246582},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.443929523229599},{"id":"https://openalex.org/C199521495","wikidata":"https://www.wikidata.org/wiki/Q181487","display_name":"Audit","level":2,"score":0.43655189871788025},{"id":"https://openalex.org/C112930515","wikidata":"https://www.wikidata.org/wiki/Q4389547","display_name":"Risk analysis (engineering)","level":1,"score":0.3324708342552185},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.2988021969795227},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.19762268662452698},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.13212618231773376},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.11121487617492676},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C121955636","wikidata":"https://www.wikidata.org/wiki/Q4116214","display_name":"Accounting","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3442188.3445918","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3442188.3445918","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3442188.3445918","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2021 ACM Conference on Fairness, Accountability, and Transparency","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3442188.3445918","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3442188.3445918","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3442188.3445918","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2021 ACM Conference on Fairness, Accountability, and Transparency","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3135371071.pdf","grobid_xml":"https://content.openalex.org/works/W3135371071.grobid-xml"},"referenced_works_count":130,"referenced_works":["https://openalex.org/W13846533","https://openalex.org/W14162785","https://openalex.org/W49673716","https://openalex.org/W380289026","https://openalex.org/W386536775","https://openalex.org/W632553690","https://openalex.org/W774135413","https://openalex.org/W1482657684","https://openalex.org/W1490781083","https://openalex.org/W1498112155","https://openalex.org/W1509880128","https://openalex.org/W1562037863","https://openalex.org/W1578561991","https://openalex.org/W1601300738","https://openalex.org/W1808244176","https://openalex.org/W1819662813","https://openalex.org/W1898560071","https://openalex.org/W1963547174","https://openalex.org/W1963574588","https://openalex.org/W1964477621","https://openalex.org/W1974219838","https://openalex.org/W1978743011","https://openalex.org/W1990921190","https://openalex.org/W1996934409","https://openalex.org/W2003823216","https://openalex.org/W2004052545","https://openalex.org/W2010793828","https://openalex.org/W2013561467","https://openalex.org/W2014516359","https://openalex.org/W2034110087","https://openalex.org/W2035495373","https://openalex.org/W2042349004","https://openalex.org/W2045657963","https://openalex.org/W2099057120","https://openalex.org/W2103018059","https://openalex.org/W2103107119","https://openalex.org/W2125436846","https://openalex.org/W2126644472","https://openalex.org/W2147603330","https://openalex.org/W2148259819","https://openalex.org/W2156926624","https://openalex.org/W2185308952","https://openalex.org/W2189162242","https://openalex.org/W2251818205","https://openalex.org/W2291288208","https://openalex.org/W2317672285","https://openalex.org/W2334930053","https://openalex.org/W2399925489","https://openalex.org/W2463528414","https://openalex.org/W2477591003","https://openalex.org/W2510954301","https://openalex.org/W2513125375","https://openalex.org/W2527889223","https://openalex.org/W2553317877","https://openalex.org/W2554886295","https://openalex.org/W2557671501","https://openalex.org/W2576379123","https://openalex.org/W2598446296","https://openalex.org/W2605847787","https://openalex.org/W2607302851","https://openalex.org/W2610778097","https://openalex.org/W2623360248","https://openalex.org/W2716311441","https://openalex.org/W2739349903","https://openalex.org/W2743948853","https://openalex.org/W2769358515","https://openalex.org/W2770618123","https://openalex.org/W2782864149","https://openalex.org/W2791094827","https://openalex.org/W2794583223","https://openalex.org/W2804897457","https://openalex.org/W2807760453","https://openalex.org/W2897042519","https://openalex.org/W2897154134","https://openalex.org/W2897702578","https://openalex.org/W2903995489","https://openalex.org/W2905588001","https://openalex.org/W2910548926","https://openalex.org/W2911227954","https://openalex.org/W2912876187","https://openalex.org/W2913700606","https://openalex.org/W2914228034","https://openalex.org/W2922234936","https://openalex.org/W2944221325","https://openalex.org/W2944420931","https://openalex.org/W2948917818","https://openalex.org/W2952616728","https://openalex.org/W2962741697","https://openalex.org/W2962843773","https://openalex.org/W2963846996","https://openalex.org/W2970116058","https://openalex.org/W2974071289","https://openalex.org/W2979417040","https://openalex.org/W2995140942","https://openalex.org/W2996346140","https://openalex.org/W2996355630","https://openalex.org/W2999380901","https://openalex.org/W3001363766","https://openalex.org/W3001807593","https://openalex.org/W3004923758","https://openalex.org/W3013451997","https://openalex.org/W3019130148","https://openalex.org/W3023547440","https://openalex.org/W3026320104","https://openalex.org/W3029264758","https://openalex.org/W3034599929","https://openalex.org/W3035296331","https://openalex.org/W3042309366","https://openalex.org/W3044798755","https://openalex.org/W3099361686","https://openalex.org/W3100279624","https://openalex.org/W3101243562","https://openalex.org/W3105462247","https://openalex.org/W3118813946","https://openalex.org/W3121991495","https://openalex.org/W3123374861","https://openalex.org/W3123868826","https://openalex.org/W3125602241","https://openalex.org/W3125978365","https://openalex.org/W3159332253","https://openalex.org/W3162439866","https://openalex.org/W4232867745","https://openalex.org/W4239176442","https://openalex.org/W4285719527","https://openalex.org/W4288083800","https://openalex.org/W4288083802","https://openalex.org/W4288359825","https://openalex.org/W4300649495","https://openalex.org/W6638208828","https://openalex.org/W6777842384"],"related_works":["https://openalex.org/W2753773138","https://openalex.org/W3204354834","https://openalex.org/W6292469","https://openalex.org/W2801092833","https://openalex.org/W2901193592","https://openalex.org/W2118566385","https://openalex.org/W156167186","https://openalex.org/W2223796429","https://openalex.org/W3199802296","https://openalex.org/W2535465504"],"abstract_inverted_index":{"Datasets":[0],"that":[1,19,85,121,152],"power":[2],"machine":[3],"learning":[4],"are":[5,28],"often":[6,147],"used,":[7],"shared,":[8],"and":[9,36,55,65,88,96,125,135,150,168],"reused":[10],"with":[11,173],"little":[12],"visibility":[13],"into":[14,154],"the":[15,44,93,108,115,133,146,162],"processes":[16],"of":[17,48,99,114,137],"deliberation":[18],"led":[20],"to":[21,42,102,132],"their":[22],"creation.":[23],"As":[24],"artificial":[25,166],"intelligence":[26,167],"systems":[27],"increasingly":[29],"used":[30,56],"in":[31,57,160,165],"high-stakes":[32],"tasks,":[33],"system":[34],"development":[35,51,83,101,110,117],"deployment":[37],"practices":[38,106],"must":[39],"be":[40],"adapted":[41],"address":[43],"very":[45],"real":[46],"consequences":[47],"how":[49],"model":[50],"data":[52,116,139],"is":[53],"constructed":[54],"practice.":[58],"This":[59],"includes":[60],"greater":[61],"transparency":[62,84],"about":[63],"data,":[64],"accountability":[66,163],"for":[67,81],"decisions":[68,151],"made":[69],"when":[70],"developing":[71],"it.":[72],"In":[73],"this":[74],"paper,":[75],"we":[76],"introduce":[77],"a":[78,157,169],"rigorous":[79],"framework":[80,91,143],"dataset":[82,100,155],"supports":[86],"decision-making":[87],"accountability.":[89],"The":[90,141],"uses":[92],"cyclical,":[94],"infrastructural":[95],"engineering":[97],"nature":[98],"draw":[103],"on":[104,176],"best":[105],"from":[107],"software":[109],"lifecycle.":[111],"Each":[112],"stage":[113],"lifecycle":[118],"yields":[119],"documents":[120],"facilitate":[122],"improved":[123],"communication":[124],"decision-making,":[126],"as":[127,129],"well":[128],"drawing":[130],"attention":[131],"value":[134],"necessity":[136],"careful":[138],"work.":[140],"proposed":[142],"makes":[144],"visible":[145],"overlooked":[148],"work":[149,175],"go":[153],"creation,":[156],"critical":[158],"step":[159],"closing":[161],"gap":[164],"critical/necessary":[170],"resource":[171],"aligned":[172],"recent":[174],"auditing":[177],"processes.":[178]},"counts_by_year":[{"year":2026,"cited_by_count":5},{"year":2025,"cited_by_count":27},{"year":2024,"cited_by_count":47},{"year":2023,"cited_by_count":62},{"year":2022,"cited_by_count":56},{"year":2021,"cited_by_count":32},{"year":2020,"cited_by_count":1}],"updated_date":"2026-04-16T08:26:57.006410","created_date":"2021-03-15T00:00:00"}
