{"id":"https://openalex.org/W4405656930","doi":"https://doi.org/10.48550/arxiv.2408.12055","title":"Aligning (Medical) LLMs for (Counterfactual) Fairness","display_name":"Aligning (Medical) LLMs for (Counterfactual) Fairness","publication_year":2024,"publication_date":"2024-08-22","ids":{"openalex":"https://openalex.org/W4405656930","doi":"https://doi.org/10.48550/arxiv.2408.12055"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2408.12055","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2408.12055","pdf_url":"https://arxiv.org/pdf/2408.12055","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2408.12055","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5080077033","display_name":"Raphael Poulain","orcid":"https://orcid.org/0000-0001-9893-5469"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Poulain, Raphael","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087143174","display_name":"Hamed Fayyaz","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fayyaz, Hamed","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5044208559","display_name":"Rahmatollah Beheshti","orcid":"https://orcid.org/0000-0001-8912-3063"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Beheshti, Rahmatollah","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10883","display_name":"Ethics and Social Impacts of AI","score":0.8787000179290771,"subfield":{"id":"https://openalex.org/subfields/3311","display_name":"Safety Research"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10883","display_name":"Ethics and Social Impacts of AI","score":0.8787000179290771,"subfield":{"id":"https://openalex.org/subfields/3311","display_name":"Safety Research"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T13417","display_name":"Biomedical Ethics and Regulation","score":0.777999997138977,"subfield":{"id":"https://openalex.org/subfields/2737","display_name":"Physiology"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/counterfactual-thinking","display_name":"Counterfactual thinking","score":0.8416744470596313},{"id":"https://openalex.org/keywords/medicine","display_name":"Medicine","score":0.3363155126571655},{"id":"https://openalex.org/keywords/business","display_name":"Business","score":0.3345280885696411},{"id":"https://openalex.org/keywords/actuarial-science","display_name":"Actuarial science","score":0.33142292499542236},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.20109230279922485},{"id":"https://openalex.org/keywords/social-psychology","display_name":"Social psychology","score":0.10168859362602234}],"concepts":[{"id":"https://openalex.org/C108650721","wikidata":"https://www.wikidata.org/wiki/Q1783253","display_name":"Counterfactual thinking","level":2,"score":0.8416744470596313},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.3363155126571655},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.3345280885696411},{"id":"https://openalex.org/C162118730","wikidata":"https://www.wikidata.org/wiki/Q1128453","display_name":"Actuarial science","level":1,"score":0.33142292499542236},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.20109230279922485},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.10168859362602234}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2408.12055","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2408.12055","pdf_url":"https://arxiv.org/pdf/2408.12055","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2408.12055","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2408.12055","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2408.12055","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2408.12055","pdf_url":"https://arxiv.org/pdf/2408.12055","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4965281027","display_name":null,"funder_award_id":"U54-GM104941","funder_id":"https://openalex.org/F4320332161","funder_display_name":"National Institutes of Health"},{"id":"https://openalex.org/G6576323535","display_name":null,"funder_award_id":"GM104941","funder_id":"https://openalex.org/F4320332161","funder_display_name":"National Institutes of Health"}],"funders":[{"id":"https://openalex.org/F4320310598","display_name":"Amazon Web Services","ror":"https://ror.org/04mv4n011"},{"id":"https://openalex.org/F4320332161","display_name":"National Institutes of Health","ror":"https://ror.org/01cwqze88"}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4405656930.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W3031052312","https://openalex.org/W4389568370","https://openalex.org/W3201448254","https://openalex.org/W3032375762","https://openalex.org/W4286970243","https://openalex.org/W1995515455","https://openalex.org/W2080531066"],"abstract_inverted_index":{"Large":[0],"Language":[1],"Models":[2],"(LLMs)":[3],"have":[4],"emerged":[5],"as":[6],"promising":[7],"solutions":[8],"for":[9,63,110],"a":[10,58,67,72,90,116],"variety":[11],"of":[12,27,35,104],"medical":[13,45,111],"and":[14,40,102],"clinical":[15],"decision":[16],"support":[17],"applications.":[18,112],"However,":[19],"LLMs":[20,65,108],"are":[21],"often":[22],"subject":[23],"to":[24,32,48,77,88,93,98,120],"different":[25,129],"types":[26],"biases,":[28],"which":[29],"can":[30],"lead":[31],"unfair":[33,123],"treatment":[34],"individuals,":[36],"worsening":[37],"health":[38],"disparities,":[39],"reducing":[41,146],"trust":[42],"in":[43,53,107,125,144],"AI-augmented":[44],"tools.":[46],"Aiming":[47],"address":[49],"this":[50,54],"important":[51],"issue,":[52],"study,":[55],"we":[56,82],"present":[57],"new":[59],"model":[60],"alignment":[61],"approach":[62],"aligning":[64],"using":[66],"preference":[68],"optimization":[69],"method":[70,141],"within":[71],"knowledge":[73],"distillation":[74],"framework.":[75],"Prior":[76],"presenting":[78],"our":[79,94,139],"proposed":[80],"method,":[81],"first":[83],"use":[84],"an":[85],"evaluation":[86,97],"framework":[87],"conduct":[89],"comprehensive":[91],"(largest":[92],"knowledge)":[95],"empirical":[96],"reveal":[99],"the":[100,122,133],"type":[101],"nature":[103],"existing":[105],"biases":[106],"used":[109],"We":[113,136],"then":[114],"offer":[115],"bias":[117],"mitigation":[118,140],"technique":[119],"reduce":[121],"patterns":[124],"LLM":[126],"outputs":[127],"across":[128],"subgroups":[130],"identified":[131],"by":[132],"protected":[134],"attributes.":[135],"show":[137],"that":[138],"is":[142,152],"effective":[143],"significantly":[145],"observed":[147],"biased":[148],"patterns.":[149],"Our":[150],"code":[151],"publicly":[153],"available":[154],"at":[155],"\\url{https://github.com/healthylaife/FairAlignmentLLM}.":[156]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
