{"id":"https://openalex.org/W4403758888","doi":"https://doi.org/10.48550/arxiv.2409.13474","title":"Alternate Preference Optimization for Unlearning Factual Knowledge in Large Language Models","display_name":"Alternate Preference Optimization for Unlearning Factual Knowledge in Large Language Models","publication_year":2024,"publication_date":"2024-09-20","ids":{"openalex":"https://openalex.org/W4403758888","doi":"https://doi.org/10.48550/arxiv.2409.13474"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2409.13474","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2409.13474","pdf_url":"https://arxiv.org/pdf/2409.13474","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2409.13474","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5009720858","display_name":"Anmol Mekala","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Mekala, Anmol","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066026232","display_name":"Vineeth Dorna","orcid":"https://orcid.org/0009-0003-1050-9521"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dorna, Vineeth","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017694321","display_name":"Shreya Dubey","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dubey, Shreya","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069691792","display_name":"Abhishek Lalwani","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lalwani, Abhishek","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037073689","display_name":"David Koleczek","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Koleczek, David","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013555130","display_name":"Mukund Rungta","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rungta, Mukund","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103789387","display_name":"Sadid A. Hasan","orcid":"https://orcid.org/0000-0002-5665-7752"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hasan, Sadid","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5050874143","display_name":"Elita Lobo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lobo, Elita","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5009720858"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9932000041007996,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9932000041007996,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9923999905586243,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9323999881744385,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/preference","display_name":"Preference","score":0.6895338892936707},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5823435187339783},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.37416720390319824},{"id":"https://openalex.org/keywords/cognitive-science","display_name":"Cognitive science","score":0.3395799398422241},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.33955830335617065},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.27433085441589355},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.14081764221191406},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.05532008409500122}],"concepts":[{"id":"https://openalex.org/C2781249084","wikidata":"https://www.wikidata.org/wiki/Q908656","display_name":"Preference","level":2,"score":0.6895338892936707},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5823435187339783},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.37416720390319824},{"id":"https://openalex.org/C188147891","wikidata":"https://www.wikidata.org/wiki/Q147638","display_name":"Cognitive science","level":1,"score":0.3395799398422241},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.33955830335617065},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.27433085441589355},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.14081764221191406},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.05532008409500122}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2409.13474","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2409.13474","pdf_url":"https://arxiv.org/pdf/2409.13474","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2409.13474","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2409.13474","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article-journal"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2409.13474","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2409.13474","pdf_url":"https://arxiv.org/pdf/2409.13474","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320332749","display_name":"University of Massachusetts Amherst","ror":"https://ror.org/0072zz521"}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4403758888.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W3204019825"],"abstract_inverted_index":{"Machine":[0],"unlearning":[1,22,116],"aims":[2],"to":[3,39,43,95,102],"efficiently":[4],"eliminate":[5],"the":[6,14,18,44,86,97,103],"influence":[7],"of":[8,99],"specific":[9],"training":[10],"data,":[11],"known":[12],"as":[13],"forget":[15,45,87,104],"set,":[16,46],"from":[17],"model.":[19],"However,":[20],"existing":[21],"methods":[23],"for":[24],"Large":[25],"Language":[26],"Models":[27],"(LLMs)":[28],"face":[29],"a":[30,69],"critical":[31],"challenge:":[32],"they":[33],"rely":[34],"solely":[35],"on":[36,85],"negative":[37,79],"feedback":[38,80,84],"suppress":[40],"responses":[41,100],"related":[42,101],"which":[47,77],"often":[48],"results":[49],"in":[50],"nonsensical":[51],"or":[52],"inconsistent":[53],"outputs,":[54],"diminishing":[55],"model":[56,121,126],"utility":[57],"and":[58],"posing":[59],"potential":[60],"privacy":[61],"risks.":[62],"To":[63],"address":[64],"this":[65],"limitation,":[66],"we":[67,90],"propose":[68],"novel":[70],"approach":[71,111],"called":[72],"Alternate":[73],"Preference":[74],"Optimization":[75],"(AltPO),":[76],"combines":[78],"with":[81],"in-domain":[82],"positive":[83],"set.":[88,105],"Additionally,":[89],"introduce":[91],"new":[92],"evaluation":[93],"metrics":[94],"assess":[96],"quality":[98],"Extensive":[106],"experiments":[107],"show":[108],"that":[109],"our":[110],"not":[112],"only":[113],"enables":[114],"effective":[115],"but":[117],"also":[118],"avoids":[119],"undesirable":[120],"behaviors":[122],"while":[123],"maintaining":[124],"overall":[125],"performance.":[127],"Our":[128],"implementation":[129],"can":[130],"be":[131],"found":[132],"at":[133],"https://github.com/molereddy/Alternate-Preference-Optimization.":[134]},"counts_by_year":[],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
