{"id":"https://openalex.org/W7161573609","doi":"https://doi.org/10.48550/arxiv.2605.16113","title":"DebiasRAG: A Tuning-Free Path to Fair Generation in Large Language Models through Retrieval-Augmented Generation","display_name":"DebiasRAG: A Tuning-Free Path to Fair Generation in Large Language Models through Retrieval-Augmented Generation","publication_year":2026,"publication_date":"2026-05-15","ids":{"openalex":"https://openalex.org/W7161573609","doi":"https://doi.org/10.48550/arxiv.2605.16113"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.16113","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.16113","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.16113","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5086748292","display_name":"Rui Chu","orcid":"https://orcid.org/0009-0002-4094-659X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chu, Rui","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085461777","display_name":"Bingyin Zhao","orcid":"https://orcid.org/0000-0003-0372-8198"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Bingyin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130406679","display_name":"Thanh Quoc Hung Le","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Le, Thanh Quoc Hung","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076982723","display_name":"Duy C. Hoang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hoang, Duy Cao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136361469","display_name":"Huawei Lin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lin, Huawei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136364815","display_name":"Ping Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Ping","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136361965","display_name":"Weijie Zhao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Weijie","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080642445","display_name":"Khoa D. Doan","orcid":"https://orcid.org/0000-0002-1610-8206"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Doan, Khoa D","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5071172709","display_name":"Yingjie Lao","orcid":"https://orcid.org/0000-0002-9413-2455"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lao, Yingjie","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.37209999561309814,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.37209999561309814,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13910","display_name":"Computational and Text Analysis Methods","score":0.12430000305175781,"subfield":{"id":"https://openalex.org/subfields/3300","display_name":"General Social Sciences"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11636","display_name":"Artificial Intelligence in Healthcare and Education","score":0.07980000227689743,"subfield":{"id":"https://openalex.org/subfields/2718","display_name":"Health Informatics"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/debiasing","display_name":"Debiasing","score":0.9933000206947327},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.659500002861023},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.5512999892234802},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.535099983215332},{"id":"https://openalex.org/keywords/path","display_name":"Path (computing)","score":0.47350001335144043},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.4320000112056732},{"id":"https://openalex.org/keywords/natural-language-generation","display_name":"Natural language generation","score":0.36970001459121704}],"concepts":[{"id":"https://openalex.org/C2779458634","wikidata":"https://www.wikidata.org/wiki/Q24963715","display_name":"Debiasing","level":2,"score":0.9933000206947327},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7476000189781189},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.659500002861023},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.5512999892234802},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.535099983215332},{"id":"https://openalex.org/C2777735758","wikidata":"https://www.wikidata.org/wiki/Q817765","display_name":"Path (computing)","level":2,"score":0.47350001335144043},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.4320000112056732},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.37700000405311584},{"id":"https://openalex.org/C2776187449","wikidata":"https://www.wikidata.org/wiki/Q1513879","display_name":"Natural language generation","level":3,"score":0.36970001459121704},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3546000123023987},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.3165000081062317},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.3098999857902527},{"id":"https://openalex.org/C2779456664","wikidata":"https://www.wikidata.org/wiki/Q972162","display_name":"Specularity","level":3,"score":0.30410000681877136},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3034000098705292},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.2809000015258789},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.28049999475479126},{"id":"https://openalex.org/C77660490","wikidata":"https://www.wikidata.org/wiki/Q244916","display_name":"Intermediate language","level":3,"score":0.26980000734329224},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.26330000162124634},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.25920000672340393}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.16113","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.16113","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.16113","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.16113","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.5351596474647522}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"language":[1],"models":[2],"(LLMs)":[3],"have":[4,56],"achieved":[5],"unprecedented":[6],"success":[7],"due":[8],"to":[9,38,50,62,78,165],"their":[10],"exceptional":[11],"generative":[12],"capabilities.":[13],"However,":[14],"because":[15],"they":[16,24,83],"depend":[17],"on":[18,118],"knowledge":[19,77],"encapsulated":[20],"from":[21,211],"training":[22,73],"corpora,":[23],"may":[25,84],"produce":[26],"hallucinations,":[27],"stereotypes,":[28],"and":[29,44,59,91,112,151],"socially":[30],"biased":[31],"content.":[32],"In":[33,103],"particular,":[34],"LLMs":[35,90],"are":[36,47,175,193],"prone":[37],"prejudiced":[39],"responses":[40],"involving":[41],"race,":[42],"gender,":[43],"age,":[45],"which":[46,192],"collectively":[48],"referred":[49],"as":[51,133,195,218],"social":[52],"biases.":[53],"Prior":[54],"studies":[55],"used":[57],"fine-tuning":[58],"prompt":[60],"engineering":[61],"mitigate":[63],"such":[64,132,217],"biases":[65],"in":[66],"LLMs,":[67,131],"but":[68],"these":[69],"methods":[70],"require":[71],"additional":[72,196],"resources":[74],"or":[75],"domain":[76],"design":[79],"the":[80,86,94,127,166,172,179,183,212],"framework.":[81],"Moreover,":[82],"degrade":[85],"original":[87],"capabilities":[88],"of":[89,130,138],"often":[92],"overlook":[93],"need":[95],"for":[96,100,199],"dynamic":[97,113],"debiasing":[98,115,143,190],"contexts":[99,163,174,210],"fairer":[101],"inference.":[102],"this":[104],"paper,":[105],"we":[106],"propose":[107],"DebiasRAG,":[108],"a":[109,203,219],"novel":[110],"tuning-free":[111],"query-specific":[114,142,184],"framework":[116],"based":[117],"retrieval-augmented":[119],"generation":[120],"(RAG).":[121],"DebiasRAG":[122,136,159,180,187],"improves":[123],"fairness":[124,197],"while":[125],"preserving":[126],"intrinsic":[128],"properties":[129],"representation":[134],"ability.":[135],"consists":[137],"three":[139],"stages:":[140],"(1)":[141],"candidate":[144,148],"generation;":[145],"(2)":[146],"context":[147,155],"pool":[149],"construction;":[150],"(3)":[152],"gradient-updated":[153],"debiasing-guided":[154],"piece":[156],"reranking.":[157],"First,":[158],"leverages":[160],"self-diagnosed":[161],"bias":[162,173,185],"relevant":[164],"query":[167],"through":[168],"regular":[169,204,213],"retrieval,":[170],"where":[171],"prepared":[176],"offline":[177],"by":[178],"provider.":[181],"Given":[182],"contexts,":[186,191],"reversely":[188],"produces":[189,208],"provided":[194],"constraints":[198],"LLM":[200],"outputs.":[201],"Second,":[202],"RAG":[205,214],"retrieval":[206],"process":[207],"query-related":[209],"document":[215],"database,":[216],"chunked":[220],"Wikipedia":[221],"dataset.":[222]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-19T00:00:00"}
