{"id":"https://openalex.org/W7151931987","doi":"https://doi.org/10.48550/arxiv.2604.05643","title":"Graph-Based Chain-of-Thought Pruning for Reducing Redundant Reflections in Reasoning LLMs","display_name":"Graph-Based Chain-of-Thought Pruning for Reducing Redundant Reflections in Reasoning LLMs","publication_year":2026,"publication_date":"2026-04-07","ids":{"openalex":"https://openalex.org/W7151931987","doi":"https://doi.org/10.48550/arxiv.2604.05643"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.05643","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.05643","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.05643","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5114214614","display_name":"Hongyuan Yuan","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Yuan, Hongyuan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133176841","display_name":"Xinran He","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"He, Xinran","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111334880","display_name":"Run Shao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shao, Run","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058177086","display_name":"Bolei He","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"He, Bolei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109636384","display_name":"Xianwei Xue","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xue, Xianwei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133189216","display_name":"Mengke Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Mengke","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133192321","display_name":"Qiutong Pan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pan, Qiutong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130110993","display_name":"Haiwei Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Haiwei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5133217266","display_name":"Haifeng Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Haifeng","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5114214614"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.4359999895095825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.4359999895095825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.16269999742507935,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10906","display_name":"AI-based Problem Solving and Planning","score":0.10660000145435333,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pruning","display_name":"Pruning","score":0.7078999876976013},{"id":"https://openalex.org/keywords/correctness","display_name":"Correctness","score":0.7056000232696533},{"id":"https://openalex.org/keywords/redundancy","display_name":"Redundancy (engineering)","score":0.67330002784729},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.4447999894618988},{"id":"https://openalex.org/keywords/dependency","display_name":"Dependency (UML)","score":0.4447000026702881},{"id":"https://openalex.org/keywords/dual","display_name":"Dual (grammatical number)","score":0.361299991607666}],"concepts":[{"id":"https://openalex.org/C108010975","wikidata":"https://www.wikidata.org/wiki/Q500094","display_name":"Pruning","level":2,"score":0.7078999876976013},{"id":"https://openalex.org/C55439883","wikidata":"https://www.wikidata.org/wiki/Q360812","display_name":"Correctness","level":2,"score":0.7056000232696533},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6901999711990356},{"id":"https://openalex.org/C152124472","wikidata":"https://www.wikidata.org/wiki/Q1204361","display_name":"Redundancy (engineering)","level":2,"score":0.67330002784729},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5077999830245972},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.4447999894618988},{"id":"https://openalex.org/C19768560","wikidata":"https://www.wikidata.org/wiki/Q320727","display_name":"Dependency (UML)","level":2,"score":0.4447000026702881},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4212000072002411},{"id":"https://openalex.org/C2780980858","wikidata":"https://www.wikidata.org/wiki/Q110022","display_name":"Dual (grammatical number)","level":2,"score":0.361299991607666},{"id":"https://openalex.org/C159032336","wikidata":"https://www.wikidata.org/wiki/Q2488768","display_name":"Non-monotonic logic","level":2,"score":0.33809998631477356},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3231000006198883},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.29510000348091125},{"id":"https://openalex.org/C74197172","wikidata":"https://www.wikidata.org/wiki/Q1195339","display_name":"Directed acyclic graph","level":2,"score":0.2930000126361847},{"id":"https://openalex.org/C65682993","wikidata":"https://www.wikidata.org/wiki/Q1056451","display_name":"Reflection (computer programming)","level":2,"score":0.2867000102996826},{"id":"https://openalex.org/C146380142","wikidata":"https://www.wikidata.org/wiki/Q1137726","display_name":"Directed graph","level":2,"score":0.2637999951839447},{"id":"https://openalex.org/C2777508537","wikidata":"https://www.wikidata.org/wiki/Q7936620","display_name":"Visual reasoning","level":2,"score":0.2599000036716461},{"id":"https://openalex.org/C2776330181","wikidata":"https://www.wikidata.org/wiki/Q18358244","display_name":"Maximization","level":2,"score":0.2524000108242035}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.05643","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.05643","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.05643","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.05643","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.5497830510139465,"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Extending":[0],"CoT":[1,90,98],"through":[2],"RL":[3],"has":[4],"been":[5],"widely":[6],"used":[7],"to":[8,17,138,148,161],"enhance":[9],"the":[10,18,64,140,174],"reasoning":[11,37,176],"capabilities":[12],"of":[13,20,48],"LLMs.":[14],"However,":[15],"due":[16],"sparsity":[19],"reward":[21],"signals,":[22],"it":[23,76],"can":[24],"also":[25],"induce":[26],"undesirable":[27],"thinking":[28],"patterns":[29],"such":[30,49],"as":[31],"overthinking,":[32],"i.e.,":[33],"generating":[34],"redundant":[35,153],"intermediate":[36],"content.":[38],"In":[39],"this":[40,130],"work,":[41],"we":[42,86,94],"argue":[43],"that":[44,170],"a":[45,88,100,111,133],"major":[46],"source":[47],"redundancy":[50],"is":[51],"inefficient":[52],"reflection,":[53],"which":[54],"often":[55],"manifests":[56],"in":[57],"two":[58],"problematic":[59],"patterns:":[60],"Indiscriminate":[61],"Reflection,":[62,74],"where":[63,75],"model":[65],"performs":[66],"broad,":[67],"low-impact":[68],"checks":[69],"throughout":[70],"reasoning,":[71],"and":[72,109,155,166],"Repetitive":[73],"repeatedly":[77],"re-verifies":[78],"an":[79],"already":[80],"established":[81],"conclusion.":[82],"To":[83],"address":[84],"this,":[85],"introduce":[87],"graph-based":[89],"optimization":[91],"framework.":[92],"Specifically,":[93],"convert":[95],"each":[96],"linear":[97],"into":[99],"directed":[101],"acyclic":[102],"graph":[103],"(DAG)":[104],"with":[105,158],"explicit":[106],"dependency":[107],"edges,":[108],"design":[110],"dual":[112],"pruning":[113,116,124],"strategy:":[114],"branch-level":[115],"removes":[117],"weakly":[118],"contributing":[119],"reflection":[120],"branches,":[121],"while":[122,180],"depth-level":[123],"eliminates":[125],"late-stage":[126],"re-verification.":[127],"We":[128],"distill":[129],"behavior":[131],"via":[132],"three-stage":[134],"pipeline:":[135],"(1)":[136],"SFT":[137],"initialize":[139],"policy":[141],"on":[142],"pruned":[143],"concise":[144],"traces,":[145],"(2)":[146],"DPO":[147],"prefer":[149],"correct":[150],"but":[151],"less":[152],"trajectories,":[154],"(3)":[156],"GRPO":[157],"length":[159],"penalty":[160],"jointly":[162],"optimize":[163],"answer":[164],"correctness":[165],"efficiency.":[167],"Experiments":[168],"show":[169],"our":[171],"approach":[172],"reduces":[173],"average":[175],"tokens":[177],"by":[178],"42\\%":[179],"maintaining":[181],"or":[182],"improving":[183],"accuracy.":[184]},"counts_by_year":[],"updated_date":"2026-04-09T06:13:59.934233","created_date":"2026-04-09T00:00:00"}
