{"id":"https://openalex.org/W7162645286","doi":"https://doi.org/10.48550/arxiv.2605.27375","title":"LCO: LLM-based Constraint Optimization for Safer Agentic LLMs in Real-world Tasks","display_name":"LCO: LLM-based Constraint Optimization for Safer Agentic LLMs in Real-world Tasks","publication_year":2026,"publication_date":"2026-04-08","ids":{"openalex":"https://openalex.org/W7162645286","doi":"https://doi.org/10.48550/arxiv.2605.27375"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.27375","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.27375","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.27375","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5137195034","display_name":"Jiayong Wan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wan, Jiayong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137221117","display_name":"Jiawei Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Jiawei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137290194","display_name":"Zhaoxia Yin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yin, Zhaoxia","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137255999","display_name":"Liu Shuyuan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shuyuan, Liu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5137281086","display_name":"Hang Su","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Su, Hang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.17550000548362732,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.17550000548362732,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11636","display_name":"Artificial Intelligence in Healthcare and Education","score":0.15320000052452087,"subfield":{"id":"https://openalex.org/subfields/2718","display_name":"Health Informatics"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.12269999831914902,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.640999972820282},{"id":"https://openalex.org/keywords/safer","display_name":"SAFER","score":0.593999981880188},{"id":"https://openalex.org/keywords/adversarial-system","display_name":"Adversarial system","score":0.5856999754905701},{"id":"https://openalex.org/keywords/constraint","display_name":"Constraint (computer-aided design)","score":0.5799999833106995},{"id":"https://openalex.org/keywords/crossover","display_name":"Crossover","score":0.5608000159263611},{"id":"https://openalex.org/keywords/mutation","display_name":"Mutation","score":0.4153999984264374},{"id":"https://openalex.org/keywords/optimization-problem","display_name":"Optimization problem","score":0.3903999924659729}],"concepts":[{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.640999972820282},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6022999882698059},{"id":"https://openalex.org/C2776654903","wikidata":"https://www.wikidata.org/wiki/Q2601463","display_name":"SAFER","level":2,"score":0.593999981880188},{"id":"https://openalex.org/C37736160","wikidata":"https://www.wikidata.org/wiki/Q1801315","display_name":"Adversarial system","level":2,"score":0.5856999754905701},{"id":"https://openalex.org/C2776036281","wikidata":"https://www.wikidata.org/wiki/Q48769818","display_name":"Constraint (computer-aided design)","level":2,"score":0.5799999833106995},{"id":"https://openalex.org/C122507166","wikidata":"https://www.wikidata.org/wiki/Q628906","display_name":"Crossover","level":2,"score":0.5608000159263611},{"id":"https://openalex.org/C501734568","wikidata":"https://www.wikidata.org/wiki/Q42918","display_name":"Mutation","level":3,"score":0.4153999984264374},{"id":"https://openalex.org/C137836250","wikidata":"https://www.wikidata.org/wiki/Q984063","display_name":"Optimization problem","level":2,"score":0.3903999924659729},{"id":"https://openalex.org/C55660270","wikidata":"https://www.wikidata.org/wiki/Q5164377","display_name":"Constrained optimization","level":2,"score":0.3521000146865845},{"id":"https://openalex.org/C112930515","wikidata":"https://www.wikidata.org/wiki/Q4389547","display_name":"Risk analysis (engineering)","level":1,"score":0.3517000079154968},{"id":"https://openalex.org/C2780148112","wikidata":"https://www.wikidata.org/wiki/Q1432581","display_name":"Proxy (statistics)","level":2,"score":0.3422999978065491},{"id":"https://openalex.org/C2777615720","wikidata":"https://www.wikidata.org/wiki/Q11888847","display_name":"Prioritization","level":2,"score":0.3156999945640564},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.3075000047683716},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.30730000138282776},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.30309998989105225},{"id":"https://openalex.org/C68781425","wikidata":"https://www.wikidata.org/wiki/Q2052203","display_name":"Multi-objective optimization","level":2,"score":0.2953000068664551},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.2842999994754791},{"id":"https://openalex.org/C2778068216","wikidata":"https://www.wikidata.org/wiki/Q55019500","display_name":"Malice","level":2,"score":0.2619999945163727},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.25609999895095825}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.27375","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.27375","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.27375","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.27375","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"sustainable_development_goals":[{"score":0.5415792465209961,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"Language":[1],"Models":[2],"(LLMs)":[3],"are":[4,44],"increasingly":[5],"acting":[6],"as":[7,50],"autonomous":[8],"agents,":[9],"but":[10,57],"their":[11,30],"continuous":[12],"interaction":[13],"with":[14],"the":[15,59,91,115,144,155,164,170],"environment":[16],"can":[17],"lead":[18],"to":[19,32,46,93,113],"in-context":[20],"reward":[21],"hacking":[22],"(ICRH),":[23],"a":[24,73,119,151],"phenomenon":[25],"where":[26],"LLMs":[27],"iteratively":[28],"optimize":[29],"behavior":[31],"maximize":[33],"proxy":[34],"objectives,":[35],"inadvertently":[36],"producing":[37],"harmful":[38],"side":[39],"effects.":[40],"Existing":[41],"defense":[42],"methods":[43],"insufficient":[45],"address":[47],"this":[48,65],"risk,":[49],"ICRH":[51,78,134,171],"arises":[52],"not":[53],"from":[54,58],"adversarial":[55],"inputs":[56],"model's":[60,116],"own":[61],"over-optimization.":[62],"To":[63],"mitigate":[64],"issue,":[66],"we":[67],"propose":[68],"\\textbf{LLM-based":[69],"Constraint":[70],"Optimization":[71],"(LCO)},":[72],"framework":[74],"that":[75,130],"effectively":[76],"reduces":[77,169],"without":[79,179],"model":[80],"fine-tuning.":[81],"LCO":[82,131,149],"consists":[83],"of":[84],"two":[85],"modules:":[86],"\\textit{self-thought":[87],"module},":[88,106],"which":[89,107],"guides":[90],"LLM":[92],"proactively":[94],"deliberate":[95],"and":[96,103,111,138],"integrate":[97],"potential":[98],"safety":[99,177],"constraints":[100],"before":[101],"execution;":[102],"\\textit{evolutionary":[104],"sampling":[105],"employs":[108],"LLM-based":[109],"crossover":[110],"mutation":[112],"constrain":[114],"actions":[117],"within":[118],"safe":[120],"solution":[121],"space":[122],"while":[123,162],"maintaining":[124],"task":[125,181],"performance.":[126,182],"Experimental":[127],"results":[128],"demonstrate":[129],"substantially":[132],"alleviates":[133],"in":[135,154],"both":[136],"output-refine":[137],"policy-refine":[139],"scenarios.":[140],"In":[141],"particular,":[142],"on":[143,160,163],"tweet":[145],"engagement":[146],"optimization":[147,166],"task,":[148],"achieves":[150],"39%":[152],"reduction":[153],"Toxicity":[156],"Growth":[157],"Rate":[158,173],"(TGR)":[159],"GPT-4,":[161],"policy":[165],"benchmark,":[167],"it":[168],"Occurrence":[172],"by":[174],"15.23%,":[175],"demonstrating":[176],"improvement":[178],"sacrificing":[180]},"counts_by_year":[],"updated_date":"2026-07-01T06:00:48.157686","created_date":"2026-05-29T00:00:00"}
