{"id":"https://openalex.org/W3163078977","doi":"https://doi.org/10.1145/3411764.3445423","title":"The Disagreement Deconvolution: Bringing Machine Learning Performance Metrics In Line With Reality","display_name":"The Disagreement Deconvolution: Bringing Machine Learning Performance Metrics In Line With Reality","publication_year":2021,"publication_date":"2021-05-06","ids":{"openalex":"https://openalex.org/W3163078977","doi":"https://doi.org/10.1145/3411764.3445423","mag":"3163078977"},"language":"en","primary_location":{"id":"doi:10.1145/3411764.3445423","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3411764.3445423","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2021 CHI Conference on Human Factors in Computing Systems","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5026198819","display_name":"Mitchell Gordon","orcid":"https://orcid.org/0000-0003-1008-2321"},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Mitchell L. Gordon","raw_affiliation_strings":["Computer Science Department, Stanford University, United States"],"affiliations":[{"raw_affiliation_string":"Computer Science Department, Stanford University, United States","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031278789","display_name":"Kaitlyn Zhou","orcid":"https://orcid.org/0000-0001-8804-8161"},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Kaitlyn Zhou","raw_affiliation_strings":["Computer Science Department, Stanford University, United States"],"affiliations":[{"raw_affiliation_string":"Computer Science Department, Stanford University, United States","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011076157","display_name":"Kayur Patel","orcid":"https://orcid.org/0009-0009-5294-0727"},"institutions":[{"id":"https://openalex.org/I4210153776","display_name":"Apple (United States)","ror":"https://ror.org/059hsda18","country_code":"US","type":"company","lineage":["https://openalex.org/I4210153776"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Kayur Patel","raw_affiliation_strings":["Apple Inc., United States"],"affiliations":[{"raw_affiliation_string":"Apple Inc., United States","institution_ids":["https://openalex.org/I4210153776"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5015518638","display_name":"Tatsunori Hashimoto","orcid":"https://orcid.org/0000-0003-0521-5855"},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Tatsunori Hashimoto","raw_affiliation_strings":["Computer Science Department, Stanford University, United States"],"affiliations":[{"raw_affiliation_string":"Computer Science Department, Stanford University, United States","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5076189854","display_name":"Michael S. Bernstein","orcid":"https://orcid.org/0000-0001-8020-9434"},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Michael S. Bernstein","raw_affiliation_strings":["Computer Science Department, Stanford University, United States"],"affiliations":[{"raw_affiliation_string":"Computer Science Department, Stanford University, United States","institution_ids":["https://openalex.org/I97018004"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5026198819"],"corresponding_institution_ids":["https://openalex.org/I97018004"],"apc_list":null,"apc_paid":null,"fwci":11.3391,"has_fulltext":false,"cited_by_count":97,"citation_normalized_percentile":{"value":0.9874209,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"14"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11704","display_name":"Mobile Crowdsensing and Crowdsourcing","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1706","display_name":"Computer Science Applications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.9951000213623047,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/deconvolution","display_name":"Deconvolution","score":0.7718034982681274},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.688517689704895},{"id":"https://openalex.org/keywords/line","display_name":"Line (geometry)","score":0.5446991920471191},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5291160941123962},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.49464842677116394},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.20844361186027527},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1611766517162323}],"concepts":[{"id":"https://openalex.org/C174576160","wikidata":"https://www.wikidata.org/wiki/Q1183700","display_name":"Deconvolution","level":2,"score":0.7718034982681274},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.688517689704895},{"id":"https://openalex.org/C198352243","wikidata":"https://www.wikidata.org/wiki/Q37105","display_name":"Line (geometry)","level":2,"score":0.5446991920471191},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5291160941123962},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.49464842677116394},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.20844361186027527},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1611766517162323},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3411764.3445423","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3411764.3445423","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2021 CHI Conference on Human Factors in Computing Systems","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","score":0.47999998927116394,"display_name":"Reduced inequalities"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":68,"referenced_works":["https://openalex.org/W621249151","https://openalex.org/W1501005121","https://openalex.org/W1517046895","https://openalex.org/W1565765697","https://openalex.org/W1702329404","https://openalex.org/W1967815273","https://openalex.org/W1977975426","https://openalex.org/W1989630473","https://openalex.org/W1992984099","https://openalex.org/W2003238113","https://openalex.org/W2018260704","https://openalex.org/W2049947514","https://openalex.org/W2059216172","https://openalex.org/W2097248932","https://openalex.org/W2108598243","https://openalex.org/W2125943921","https://openalex.org/W2143244606","https://openalex.org/W2143539737","https://openalex.org/W2158880898","https://openalex.org/W2187291759","https://openalex.org/W2290009368","https://openalex.org/W2292070666","https://openalex.org/W2560674852","https://openalex.org/W2563826943","https://openalex.org/W2574781439","https://openalex.org/W2585712495","https://openalex.org/W2607311634","https://openalex.org/W2730390070","https://openalex.org/W2741620441","https://openalex.org/W2742330194","https://openalex.org/W2767546953","https://openalex.org/W2769041395","https://openalex.org/W2795959033","https://openalex.org/W2796239588","https://openalex.org/W2798706400","https://openalex.org/W2804228850","https://openalex.org/W2809806295","https://openalex.org/W2896881735","https://openalex.org/W2899134503","https://openalex.org/W2902799923","https://openalex.org/W2902998547","https://openalex.org/W2912457762","https://openalex.org/W2916904544","https://openalex.org/W2920807444","https://openalex.org/W2922234936","https://openalex.org/W2936750472","https://openalex.org/W2938086271","https://openalex.org/W2942399136","https://openalex.org/W2945599316","https://openalex.org/W2954992865","https://openalex.org/W2959716049","https://openalex.org/W2963748066","https://openalex.org/W2969896603","https://openalex.org/W2985347336","https://openalex.org/W2987755095","https://openalex.org/W2991138171","https://openalex.org/W2991771198","https://openalex.org/W2993013587","https://openalex.org/W2994507840","https://openalex.org/W3005295611","https://openalex.org/W3036998917","https://openalex.org/W3080732897","https://openalex.org/W3080883390","https://openalex.org/W3099917429","https://openalex.org/W3114228236","https://openalex.org/W3121499412","https://openalex.org/W3160042174","https://openalex.org/W4243695588"],"related_works":["https://openalex.org/W2961085424","https://openalex.org/W4306674287","https://openalex.org/W3046775127","https://openalex.org/W4394896187","https://openalex.org/W3170094116","https://openalex.org/W4386462264","https://openalex.org/W3107602296","https://openalex.org/W4364306694","https://openalex.org/W4312192474","https://openalex.org/W4283697347"],"abstract_inverted_index":{"Machine":[0],"learning":[1,74,141],"classifiers":[2],"for":[3,56,143],"human-facing":[4,52,139],"tasks":[5],"such":[6,17,32],"as":[7,18,33],"comment":[8,148],"toxicity":[9,149],"and":[10,37,80,105],"misinformation":[11],"often":[12],"score":[13],"highly":[14],"on":[15,146],"metrics":[16,31,76,132],"ROC":[19,34,157],"AUC":[20],"but":[21],"are":[22,39],"received":[23],"poorly":[24],"in":[25,90],"practice.":[26],"Why":[27],"this":[28,63],"gap?":[29],"Today,":[30],"AUC,":[35],"precision,":[36],"recall":[38],"used":[40],"to":[41,59,111,123,155],"measure":[42],"technical":[43],"performance;":[44],"however,":[45],"human-computer":[46],"interaction":[47],"observes":[48],"that":[49,69,130],"evaluation":[50],"of":[51,82,137],"systems":[53],"should":[54],"account":[55],"people\u2019s":[57],"reactions":[58],"the":[60,78,112,120,135],"system.":[61],"In":[62],"paper,":[64],"we":[65,128],"introduce":[66],"a":[67,147],"transformation":[68],"more":[70],"closely":[71],"aligns":[72],"machine":[73,140],"classification":[75],"with":[77],"values":[79],"methods":[81],"user-facing":[83],"performance":[84,136,145],"measures.":[85],"The":[86],"disagreement":[87,121],"deconvolution":[88,122],"takes":[89],"any":[91],"multi-annotator":[92],"(e.g.,":[93],"crowdsourced)":[94],"dataset,":[95],"disentangles":[96],"stable":[97,114],"opinions":[98,115],"from":[99,116,153],"noise":[100],"by":[101],"estimating":[102],"intra-annotator":[103],"consistency,":[104],"compares":[106],"each":[107,117],"test":[108],"set":[109],"prediction":[110],"individual":[113],"annotator.":[118],"Applying":[119],"existing":[124],"social":[125],"computing":[126],"datasets,":[127],"find":[129],"current":[131],"dramatically":[133],"overstate":[134],"many":[138],"tasks:":[142],"example,":[144],"task":[150],"is":[151],"corrected":[152],".95":[154],".73":[156],"AUC.":[158]},"counts_by_year":[{"year":2025,"cited_by_count":16},{"year":2024,"cited_by_count":17},{"year":2023,"cited_by_count":29},{"year":2022,"cited_by_count":24},{"year":2021,"cited_by_count":11}],"updated_date":"2026-04-14T08:04:32.555800","created_date":"2025-10-10T00:00:00"}
