{"id":"https://openalex.org/W4416036809","doi":"https://doi.org/10.18653/v1/2025.emnlp-main.265","title":"R-TOFU: Unlearning in Large Reasoning Models","display_name":"R-TOFU: Unlearning in Large Reasoning Models","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4416036809","doi":"https://doi.org/10.18653/v1/2025.emnlp-main.265"},"language":null,"primary_location":{"id":"doi:10.18653/v1/2025.emnlp-main.265","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.emnlp-main.265","pdf_url":"https://aclanthology.org/2025.emnlp-main.265.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 Conference on Empirical Methods in Natural Language Processing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://aclanthology.org/2025.emnlp-main.265.pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5007040475","display_name":"Sangyeon Yoon","orcid":null},"institutions":[{"id":"https://openalex.org/I193775966","display_name":"Yonsei University","ror":"https://ror.org/01wjejq96","country_code":"KR","type":"education","lineage":["https://openalex.org/I193775966"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Sangyeon Yoon","raw_affiliation_strings":["Department of Artificial Intelligence Yonsei University Seoul , Korea"],"affiliations":[{"raw_affiliation_string":"Department of Artificial Intelligence Yonsei University Seoul , Korea","institution_ids":["https://openalex.org/I193775966"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5119934311","display_name":"Wonje Jeung","orcid":null},"institutions":[{"id":"https://openalex.org/I193775966","display_name":"Yonsei University","ror":"https://ror.org/01wjejq96","country_code":"KR","type":"education","lineage":["https://openalex.org/I193775966"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Wonje Jeung","raw_affiliation_strings":["Department of Artificial Intelligence Yonsei University Seoul , Korea"],"affiliations":[{"raw_affiliation_string":"Department of Artificial Intelligence Yonsei University Seoul , Korea","institution_ids":["https://openalex.org/I193775966"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5049196468","display_name":"Albert No","orcid":"https://orcid.org/0000-0002-6346-4182"},"institutions":[{"id":"https://openalex.org/I193775966","display_name":"Yonsei University","ror":"https://ror.org/01wjejq96","country_code":"KR","type":"education","lineage":["https://openalex.org/I193775966"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Albert No","raw_affiliation_strings":["Department of Artificial Intelligence Yonsei University Seoul , Korea"],"affiliations":[{"raw_affiliation_string":"Department of Artificial Intelligence Yonsei University Seoul , Korea","institution_ids":["https://openalex.org/I193775966"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5007040475"],"corresponding_institution_ids":["https://openalex.org/I193775966"],"apc_list":null,"apc_paid":null,"fwci":2.3169,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.91645898,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"5239","last_page":"5258"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.4677000045776367,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.4677000045776367,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.07400000095367432,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11303","display_name":"Bayesian Modeling and Causal Inference","score":0.05550000071525574,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/forgetting","display_name":"Forgetting","score":0.6345999836921692},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6287000179290771},{"id":"https://openalex.org/keywords/decoding-methods","display_name":"Decoding methods","score":0.5430999994277954},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.45840001106262207},{"id":"https://openalex.org/keywords/baseline","display_name":"Baseline (sea)","score":0.36959999799728394},{"id":"https://openalex.org/keywords/foundation","display_name":"Foundation (evidence)","score":0.3472999930381775}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7099999785423279},{"id":"https://openalex.org/C7149132","wikidata":"https://www.wikidata.org/wiki/Q1377840","display_name":"Forgetting","level":2,"score":0.6345999836921692},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6287000179290771},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.5430999994277954},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5084999799728394},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.45840001106262207},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.36959999799728394},{"id":"https://openalex.org/C2780966255","wikidata":"https://www.wikidata.org/wiki/Q5474306","display_name":"Foundation (evidence)","level":2,"score":0.3472999930381775},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.3003999888896942},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.29750001430511475},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.2888999879360199},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.27649998664855957},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.2687999904155731},{"id":"https://openalex.org/C188147891","wikidata":"https://www.wikidata.org/wiki/Q147638","display_name":"Cognitive science","level":1,"score":0.26019999384880066},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.2597000002861023}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.18653/v1/2025.emnlp-main.265","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.emnlp-main.265","pdf_url":"https://aclanthology.org/2025.emnlp-main.265.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 Conference on Empirical Methods in Natural Language Processing","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.18653/v1/2025.emnlp-main.265","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.emnlp-main.265","pdf_url":"https://aclanthology.org/2025.emnlp-main.265.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 Conference on Empirical Methods in Natural Language Processing","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2257911995","display_name":null,"funder_award_id":"RS-2020-II201361","funder_id":"https://openalex.org/F4320328359","funder_display_name":"Ministry of Science and ICT, South Korea"},{"id":"https://openalex.org/G6072120315","display_name":null,"funder_award_id":"funded","funder_id":"https://openalex.org/F4320335489","funder_display_name":"Institute for Information and Communications Technology Promotion"},{"id":"https://openalex.org/G8582691448","display_name":null,"funder_award_id":"MOTIE, Korea","funder_id":"https://openalex.org/F4320321681","funder_display_name":"Ministry of Trade, Industry and Energy"},{"id":"https://openalex.org/G992484961","display_name":null,"funder_award_id":"Korea","funder_id":"https://openalex.org/F4320321681","funder_display_name":"Ministry of Trade, Industry and Energy"}],"funders":[{"id":"https://openalex.org/F4320321314","display_name":"Yonsei University","ror":"https://ror.org/01wjejq96"},{"id":"https://openalex.org/F4320321681","display_name":"Ministry of Trade, Industry and Energy","ror":"https://ror.org/008nkqk13"},{"id":"https://openalex.org/F4320328359","display_name":"Ministry of Science and ICT, South Korea","ror":"https://ror.org/01wpjm123"},{"id":"https://openalex.org/F4320335489","display_name":"Institute for Information and Communications Technology Promotion","ror":"https://ror.org/01g0hqq23"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4416036809.pdf","grobid_xml":"https://content.openalex.org/works/W4416036809.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"Reasoning":[1],"Models":[2],"(LRMs)":[3],"embed":[4],"private":[5],"or":[6],"copyrighted":[7],"information":[8],"not":[9],"only":[10],"in":[11,29,84,159],"their":[12,163],"final":[13],"answers":[14],"but":[15],"also":[16],"throughout":[17],"multistep":[18],"chain-of-thought":[19],"(CoT)":[20],"traces,":[21],"making":[22],"reliable":[23],"unlearning":[24,44,158],"far":[25],"more":[26],"demanding":[27],"than":[28,109],"standard":[30],"LLMs.We":[31],"introduce":[32],"Reasoning-TOFU":[33],"(R-TOFU),":[34],"the":[35,135,144],"first":[36],"benchmark":[37],"tailored":[38],"to":[39,59,137],"this":[40],"setting.R-TOFU":[41],"augments":[42],"existing":[43],"tasks":[45],"with":[46],"realistic":[47],"CoT":[48],"annotations":[49],"and":[50,71,74,106,123,147,156,168],"provides":[51],"step-wise":[52],"metrics":[53],"that":[54,76,93],"expose":[55],"residual":[56],"knowledge":[57],"invisible":[58],"answer-level":[60],"checks.Using":[61],"R-TOFU,":[62],"we":[63,113],"carry":[64],"out":[65],"a":[66,90,100,115,151],"comprehensive":[67],"comparison":[68],"of":[69],"gradient-based":[70],"preference-optimization":[72],"baselines":[73],"show":[75],"conventional":[77],"answer-only":[78],"objectives":[79],"leave":[80],"substantial":[81],"forget":[82],"traces":[83],"reasoning.We":[85],"further":[86],"propose":[87],"Reasoned":[88],"IDK,":[89],"preferenceoptimization":[91],"variant":[92],"preserves":[94],"coherent":[95],"yet":[96],"inconclusive":[97],"reasoning,":[98],"achieving":[99],"stronger":[101],"balance":[102],"between":[103],"forgetting":[104],"efficacy":[105],"model":[107],"utility":[108],"earlier":[110],"refusal":[111],"styles.Finally,":[112],"identify":[114],"failure":[116],"mode:":[117],"decoding":[118,142],"variants":[119],"such":[120],"as":[121],"ZeroThink":[122],"LessThink":[124],"can":[125],"still":[126],"reveal":[127],"forgotten":[128],"content":[129],"despite":[130],"seemingly":[131],"successful":[132],"unlearning,":[133],"emphasizing":[134],"need":[136],"evaluate":[138],"models":[139],"under":[140],"diverse":[141],"settings.Together,":[143],"benchmark,":[145],"analysis,":[146],"new":[148],"baseline":[149],"establish":[150],"systematic":[152],"foundation":[153],"for":[154],"studying":[155],"improving":[157],"LRMs":[160],"while":[161],"preserving":[162],"reasoning":[164],"capabilities.We":[165],"release":[166],"R-TOFU":[167],"code":[169],"at":[170],"https://ai-isl.github.io/r-tofu.":[171]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-04-13T07:58:08.660418","created_date":"2025-11-08T00:00:00"}
