{"id":"https://openalex.org/W7162411513","doi":"https://doi.org/10.48550/arxiv.2605.24005","title":"LC-ERD: Mining Latent Logic for Self-Evolving Reasoning via Consistency-Regulated Reward Decomposition","display_name":"LC-ERD: Mining Latent Logic for Self-Evolving Reasoning via Consistency-Regulated Reward Decomposition","publication_year":2026,"publication_date":"2026-05-19","ids":{"openalex":"https://openalex.org/W7162411513","doi":"https://doi.org/10.48550/arxiv.2605.24005"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.24005","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.24005","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.24005","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5137065814","display_name":"Yanyu Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Yanyu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137067945","display_name":"Jiyue Jiang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jiang, Jiyue","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137029212","display_name":"Dianzhi Yu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yu, Dianzhi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137050528","display_name":"Zheng Wu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Zheng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137035443","display_name":"Jiahong Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Jiahong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137051472","display_name":"Jiaming Han","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Han, Jiaming","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137023337","display_name":"Xiao Guo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Guo, Xiao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5095747638","display_name":"Jinhu Qi","orcid":"https://orcid.org/0009-0006-5544-4786"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qi, Jinhu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137050013","display_name":"Yu Li","orcid":"https://orcid.org/0000-0002-4993-7377"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Yu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137064748","display_name":"Yifei Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Yifei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5137019436","display_name":"Irwin King","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"King, Irwin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":11,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.29319998621940613,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.29319998621940613,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.18709999322891235,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.12999999523162842,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/non-monotonic-logic","display_name":"Non-monotonic logic","score":0.6194999814033508},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.5019999742507935},{"id":"https://openalex.org/keywords/frame-problem","display_name":"Frame problem","score":0.3555000126361847},{"id":"https://openalex.org/keywords/subjective-logic","display_name":"Subjective logic","score":0.3440000116825104},{"id":"https://openalex.org/keywords/framing","display_name":"Framing (construction)","score":0.3321000039577484},{"id":"https://openalex.org/keywords/deductive-reasoning","display_name":"Deductive reasoning","score":0.3310999870300293},{"id":"https://openalex.org/keywords/encoding","display_name":"Encoding (memory)","score":0.3188000023365021},{"id":"https://openalex.org/keywords/mixture-model","display_name":"Mixture model","score":0.31189998984336853}],"concepts":[{"id":"https://openalex.org/C159032336","wikidata":"https://www.wikidata.org/wiki/Q2488768","display_name":"Non-monotonic logic","level":2,"score":0.6194999814033508},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6126999855041504},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6075999736785889},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.5019999742507935},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.44200000166893005},{"id":"https://openalex.org/C5065155","wikidata":"https://www.wikidata.org/wiki/Q1185775","display_name":"Frame problem","level":2,"score":0.3555000126361847},{"id":"https://openalex.org/C113839178","wikidata":"https://www.wikidata.org/wiki/Q7631418","display_name":"Subjective logic","level":3,"score":0.3440000116825104},{"id":"https://openalex.org/C169087156","wikidata":"https://www.wikidata.org/wiki/Q2131593","display_name":"Framing (construction)","level":2,"score":0.3321000039577484},{"id":"https://openalex.org/C97364631","wikidata":"https://www.wikidata.org/wiki/Q484284","display_name":"Deductive reasoning","level":2,"score":0.3310999870300293},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.3188000023365021},{"id":"https://openalex.org/C61224824","wikidata":"https://www.wikidata.org/wiki/Q2260434","display_name":"Mixture model","level":2,"score":0.31189998984336853},{"id":"https://openalex.org/C32241873","wikidata":"https://www.wikidata.org/wiki/Q236975","display_name":"Classical logic","level":2,"score":0.30469998717308044},{"id":"https://openalex.org/C19768560","wikidata":"https://www.wikidata.org/wiki/Q320727","display_name":"Dependency (UML)","level":2,"score":0.30070000886917114},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.3003000020980835},{"id":"https://openalex.org/C124681953","wikidata":"https://www.wikidata.org/wiki/Q339062","display_name":"Decomposition","level":2,"score":0.3001999855041504},{"id":"https://openalex.org/C51167844","wikidata":"https://www.wikidata.org/wiki/Q4422623","display_name":"Latent variable","level":2,"score":0.28049999475479126},{"id":"https://openalex.org/C89288958","wikidata":"https://www.wikidata.org/wiki/Q7301504","display_name":"Reasoning system","level":2,"score":0.2754000127315521},{"id":"https://openalex.org/C160920958","wikidata":"https://www.wikidata.org/wiki/Q7662746","display_name":"Synthetic data","level":2,"score":0.271699994802475},{"id":"https://openalex.org/C195344581","wikidata":"https://www.wikidata.org/wiki/Q2555318","display_name":"Automated reasoning","level":2,"score":0.27140000462532043},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2703999876976013},{"id":"https://openalex.org/C160236029","wikidata":"https://www.wikidata.org/wiki/Q842421","display_name":"Default logic","level":5,"score":0.2700999975204468},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.26170000433921814},{"id":"https://openalex.org/C2164484","wikidata":"https://www.wikidata.org/wiki/Q5170150","display_name":"Core (optical fiber)","level":2,"score":0.2565999925136566},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.25119999051094055}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.24005","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.24005","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.24005","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.24005","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"The":[0],"evolution":[1],"of":[2,13],"Large":[3],"Language":[4],"Model":[5],"(LLM)":[6],"reasoning":[7,69,123,160],"is":[8,168],"bottlenecked":[9],"by":[10,110,163],"the":[11,114,122,134],"scarcity":[12],"high-quality":[14],"process":[15],"data.":[16],"While":[17],"self-alignment":[18,99],"via":[19,34],"endogenous":[20],"rewards":[21,38],"offers":[22],"a":[23,46,96,106,127,146],"solution,":[24],"mining":[25],"valid":[26],"supervision":[27],"faces":[28],"three":[29],"challenges:":[30],"(1)":[31],"Label":[32],"Noise":[33],"Mimetic":[35],"Bias,":[36],"where":[37,56,77],"prioritize":[39],"statistical":[40],"likelihood":[41],"over":[42],"logical":[43],"truth,":[44],"creating":[45],"\"correctness":[47],"illusion\"":[48],"that":[49],"masks":[50],"compounding":[51],"errors;":[52],"(2)":[53],"Coarse-Grained":[54],"Supervision,":[55],"sparse":[57],"global":[58],"outcomes":[59],"(e.g.,":[60],"in":[61],"GRPO)":[62],"fail":[63,79],"to":[64,80,120,137],"provide":[65],"granular":[66],"guidance,":[67],"treating":[68],"chains":[70],"as":[71,100],"monolithic;":[72],"and":[73,125,155],"(3)":[74],"Distributional":[75],"Collapse,":[76],"signals":[78],"generalize":[81],"without":[82],"amplifying":[83],"pre-training":[84],"biases.":[85],"To":[86],"address":[87],"these,":[88],"we":[89],"introduce":[90,126],"LC-ERD":[91,144],"(Logic-Consistent":[92],"Endogenous":[93],"Reward":[94],"Decomposition),":[95],"framework":[97],"framing":[98],"latent":[101],"structure":[102],"mining.":[103],"We":[104],"derive":[105],"Variational":[107],"Logic":[108,117],"Potential":[109],"aggregating":[111],"consensus":[112],"from":[113],"model's":[115],"Latent":[116],"Expertise":[118],"(LLE)":[119],"denoise":[121],"manifold,":[124],"Multi-Agent":[128],"Value":[129],"Decomposition":[130],"protocol":[131],"based":[132],"on":[133],"IGM":[135],"principle":[136],"quantify":[138],"individual":[139],"step":[140],"utility.":[141],"Experiments":[142],"show":[143],"delivers":[145],"robust":[147],"self-evolution":[148],"path,":[149],"uncovering":[150],"trade-offs":[151],"between":[152],"logic":[153],"consistency":[154],"accuracy":[156],"while":[157],"identifying":[158],"high-value":[159],"patterns":[161],"missed":[162],"standard":[164],"rewards.":[165],"Our":[166],"code":[167],"available":[169],"at":[170],"https://github.com/LC-ERD-repo/LC-ERD.":[171]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-27T00:00:00"}
