{"id":"https://openalex.org/W4385474267","doi":"https://doi.org/10.48550/arxiv.2307.16526","title":"No Fair Lunch: A Causal Perspective on Dataset Bias in Machine Learning for Medical Imaging","display_name":"No Fair Lunch: A Causal Perspective on Dataset Bias in Machine Learning for Medical Imaging","publication_year":2023,"publication_date":"2023-07-31","ids":{"openalex":"https://openalex.org/W4385474267","doi":"https://doi.org/10.48550/arxiv.2307.16526"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2307.16526","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2307.16526","pdf_url":"https://arxiv.org/pdf/2307.16526","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2307.16526","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5046046780","display_name":"Charles Jones","orcid":"https://orcid.org/0000-0001-5884-6760"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Jones, Charles","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037843387","display_name":"Daniel C. Castro","orcid":"https://orcid.org/0000-0002-6829-7045"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Castro, Daniel C.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028172491","display_name":"Fabio De Sousa Ribeiro","orcid":"https://orcid.org/0000-0002-6195-5658"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ribeiro, Fabio De Sousa","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038400548","display_name":"Ozan Oktay","orcid":"https://orcid.org/0000-0003-2976-0874"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Oktay, Ozan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063981686","display_name":"Melissa D. McCradden","orcid":"https://orcid.org/0000-0002-6476-2165"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"McCradden, Melissa","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5007222325","display_name":"Ben Glocker","orcid":"https://orcid.org/0000-0002-4897-9356"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Glocker, Ben","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5046046780"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":3,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11636","display_name":"Artificial Intelligence in Healthcare and Education","score":0.9868999719619751,"subfield":{"id":"https://openalex.org/subfields/2718","display_name":"Health Informatics"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},"topics":[{"id":"https://openalex.org/T11636","display_name":"Artificial Intelligence in Healthcare and Education","score":0.9868999719619751,"subfield":{"id":"https://openalex.org/subfields/2718","display_name":"Health Informatics"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.9825000166893005,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10804","display_name":"Health Systems, Economic Evaluations, Quality of Life","score":0.9768000245094299,"subfield":{"id":"https://openalex.org/subfields/2002","display_name":"Economics and Econometrics"},"field":{"id":"https://openalex.org/fields/20","display_name":"Economics, Econometrics and Finance"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/perspective","display_name":"Perspective (graphical)","score":0.8280602097511292},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6278625130653381},{"id":"https://openalex.org/keywords/presentation","display_name":"Presentation (obstetrics)","score":0.5386443138122559},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5289179086685181},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.5066776871681213},{"id":"https://openalex.org/keywords/debiasing","display_name":"Debiasing","score":0.48553869128227234},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.46548524498939514},{"id":"https://openalex.org/keywords/confirmation-bias","display_name":"Confirmation bias","score":0.4304213523864746},{"id":"https://openalex.org/keywords/risk-analysis","display_name":"Risk analysis (engineering)","score":0.3569442927837372},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.23986852169036865},{"id":"https://openalex.org/keywords/medicine","display_name":"Medicine","score":0.14861220121383667},{"id":"https://openalex.org/keywords/social-psychology","display_name":"Social psychology","score":0.11466255784034729}],"concepts":[{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.8280602097511292},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6278625130653381},{"id":"https://openalex.org/C2777601897","wikidata":"https://www.wikidata.org/wiki/Q3409113","display_name":"Presentation (obstetrics)","level":2,"score":0.5386443138122559},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5289179086685181},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.5066776871681213},{"id":"https://openalex.org/C2779458634","wikidata":"https://www.wikidata.org/wiki/Q24963715","display_name":"Debiasing","level":2,"score":0.48553869128227234},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.46548524498939514},{"id":"https://openalex.org/C79585631","wikidata":"https://www.wikidata.org/wiki/Q431498","display_name":"Confirmation bias","level":2,"score":0.4304213523864746},{"id":"https://openalex.org/C112930515","wikidata":"https://www.wikidata.org/wiki/Q4389547","display_name":"Risk analysis (engineering)","level":1,"score":0.3569442927837372},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.23986852169036865},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.14861220121383667},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.11466255784034729},{"id":"https://openalex.org/C126838900","wikidata":"https://www.wikidata.org/wiki/Q77604","display_name":"Radiology","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2307.16526","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2307.16526","pdf_url":"https://arxiv.org/pdf/2307.16526","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2307.16526","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2307.16526","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2307.16526","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2307.16526","pdf_url":"https://arxiv.org/pdf/2307.16526","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.8199999928474426,"id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320308943","display_name":"Microsoft Research","ror":"https://ror.org/00d0nc645"},{"id":"https://openalex.org/F4320320005","display_name":"Royal Academy of Engineering","ror":"https://ror.org/0526snb40"},{"id":"https://openalex.org/F4320334627","display_name":"Engineering and Physical Sciences Research Council","ror":"https://ror.org/0439y7842"}],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4385474267.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W3135024063","https://openalex.org/W2733554571","https://openalex.org/W4383620860","https://openalex.org/W2797318137","https://openalex.org/W3125546169","https://openalex.org/W4292260720","https://openalex.org/W2549718520","https://openalex.org/W2982921892","https://openalex.org/W1993548098","https://openalex.org/W4377021792"],"abstract_inverted_index":{"As":[0],"machine":[1],"learning":[2],"methods":[3,26,81],"gain":[4],"prominence":[5],"within":[6],"clinical":[7],"decision-making,":[8],"addressing":[9],"fairness":[10,101],"concerns":[11],"becomes":[12],"increasingly":[13],"urgent.":[14],"Despite":[15],"considerable":[16],"work":[17],"dedicated":[18],"to":[19],"detecting":[20],"and":[21,72,86,110],"ameliorating":[22],"algorithmic":[23,40],"bias,":[24,41],"today's":[25],"are":[27],"deficient":[28],"with":[29],"potentially":[30],"harmful":[31],"consequences.":[32],"Our":[33,74],"causal":[34,63,75],"perspective":[35],"sheds":[36],"new":[37],"light":[38],"on":[39],"highlighting":[42],"how":[43,78],"different":[44,55],"sources":[45],"of":[46,62,90,108],"dataset":[47],"bias":[48,64],"may":[49],"appear":[50],"indistinguishable":[51],"yet":[52],"require":[53],"substantially":[54],"mitigation":[56,80],"strategies.":[57],"We":[58,92],"introduce":[59],"three":[60],"families":[61],"mechanisms":[65],"stemming":[66],"from":[67],"disparities":[68],"in":[69,102],"prevalence,":[70],"presentation,":[71],"annotation.":[73],"analysis":[76],"underscores":[77],"current":[79],"tackle":[82],"only":[83],"a":[84,94],"narrow":[85],"often":[87],"unrealistic":[88],"subset":[89],"scenarios.":[91],"provide":[93],"practical":[95],"three-step":[96],"framework":[97],"for":[98],"reasoning":[99],"about":[100],"medical":[103],"imaging,":[104],"supporting":[105],"the":[106],"development":[107],"safe":[109],"equitable":[111],"AI":[112],"prediction":[113],"models.":[114]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2023-08-02T00:00:00"}
