{"id":"https://openalex.org/W7134060452","doi":"https://doi.org/10.48550/arxiv.2603.04900","title":"EvoTool: Self-Evolving Tool-Use Policy Optimization in LLM Agents via Blame-Aware Mutation and Diversity-Aware Selection","display_name":"EvoTool: Self-Evolving Tool-Use Policy Optimization in LLM Agents via Blame-Aware Mutation and Diversity-Aware Selection","publication_year":2026,"publication_date":"2026-03-05","ids":{"openalex":"https://openalex.org/W7134060452","doi":"https://doi.org/10.48550/arxiv.2603.04900"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2603.04900","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5128253596","display_name":"Shuo Yang","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Yang, Shuo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084419965","display_name":"Soyeon Caren Han","orcid":"https://orcid.org/0000-0002-1948-6819"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Han, Soyeon Caren","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128233976","display_name":"Xueqi Ma","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ma, Xueqi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128220752","display_name":"Yan Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Yan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102590170","display_name":"Mohammad Reza Ghasemi Madani","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Madani, Mohammad Reza Ghasemi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5128276285","display_name":"Eduard Hovy","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hovy, Eduard","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5128253596"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.31679999828338623,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.31679999828338623,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10456","display_name":"Multi-Agent Systems and Negotiation","score":0.05979999899864197,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10639","display_name":"Advanced Software Engineering Methodologies","score":0.059300001710653305,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.6552000045776367},{"id":"https://openalex.org/keywords/blame","display_name":"Blame","score":0.5738999843597412},{"id":"https://openalex.org/keywords/mutation","display_name":"Mutation","score":0.5410000085830688},{"id":"https://openalex.org/keywords/modular-design","display_name":"Modular design","score":0.49790000915527344},{"id":"https://openalex.org/keywords/population","display_name":"Population","score":0.49410000443458557},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.3598000109195709}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.715399980545044},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.6552000045776367},{"id":"https://openalex.org/C2781466463","wikidata":"https://www.wikidata.org/wiki/Q621695","display_name":"Blame","level":2,"score":0.5738999843597412},{"id":"https://openalex.org/C501734568","wikidata":"https://www.wikidata.org/wiki/Q42918","display_name":"Mutation","level":3,"score":0.5410000085830688},{"id":"https://openalex.org/C101468663","wikidata":"https://www.wikidata.org/wiki/Q1620158","display_name":"Modular design","level":2,"score":0.49790000915527344},{"id":"https://openalex.org/C2908647359","wikidata":"https://www.wikidata.org/wiki/Q2625603","display_name":"Population","level":2,"score":0.49410000443458557},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.3598000109195709},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.34950000047683716},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3458000123500824},{"id":"https://openalex.org/C159149176","wikidata":"https://www.wikidata.org/wiki/Q14489129","display_name":"Evolutionary algorithm","level":2,"score":0.328000009059906},{"id":"https://openalex.org/C8880873","wikidata":"https://www.wikidata.org/wiki/Q187787","display_name":"Genetic algorithm","level":2,"score":0.32010000944137573},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.32010000944137573},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.28220000863075256},{"id":"https://openalex.org/C137836250","wikidata":"https://www.wikidata.org/wiki/Q984063","display_name":"Optimization problem","level":2,"score":0.2718000113964081},{"id":"https://openalex.org/C112930515","wikidata":"https://www.wikidata.org/wiki/Q4389547","display_name":"Risk analysis (engineering)","level":1,"score":0.2671999931335449},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.26249998807907104}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2603.04900","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2603.04900","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.04900","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2603.04900","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"LLM-based":[0],"agents":[1],"depend":[2],"on":[3,143],"effective":[4],"tool-use":[5,65,75],"policies":[6,14],"to":[7,18,34,41,104,107,128],"solve":[8],"complex":[9],"tasks,":[10],"yet":[11],"optimizing":[12],"these":[13,53],"remains":[15],"challenging":[16],"due":[17],"delayed":[19],"supervision":[20],"and":[21,84,86,146,152],"the":[22],"difficulty":[23],"of":[24],"credit":[25],"assignment":[26],"in":[27,90],"long-horizon":[28],"trajectories.":[29],"Existing":[30],"optimization":[31],"approaches":[32],"tend":[33],"be":[35,157],"either":[36],"monolithic,":[37],"which":[38,46],"are":[39],"prone":[40],"entangling":[42],"behaviors,":[43],"or":[44],"single-aspect,":[45],"ignore":[47],"cross-module":[48],"error":[49],"propagation.":[50],"To":[51],"address":[52],"limitations,":[54],"we":[55],"propose":[56],"EvoTool,":[57],"a":[58,63,68,91,108],"self-evolving":[59],"framework":[60],"that":[61,117],"optimizes":[62],"modular":[64],"policy":[66,76],"via":[67,119],"gradient-free":[69],"evolutionary":[70],"paradigm.":[71],"EvoTool":[72,135],"decomposes":[73],"agent's":[74],"into":[77],"four":[78,133],"modules,":[79],"including":[80],"Planner,":[81],"Selector,":[82],"Caller,":[83],"Synthesizer,":[85],"iteratively":[87],"improves":[88],"them":[89],"self-improving":[92],"loop":[93],"through":[94],"three":[95],"novel":[96],"mechanisms.":[97],"Trajectory-Grounded":[98],"Blame":[99],"Attribution":[100],"uses":[101],"diagnostic":[102],"traces":[103],"localize":[105],"failures":[106],"specific":[109],"module.":[110],"Feedback-Guided":[111],"Targeted":[112],"Mutation":[113],"then":[114],"edits":[115],"only":[116],"module":[118],"natural-language":[120],"critique.":[121],"Diversity-Aware":[122],"Population":[123],"Selection":[124],"preserves":[125],"complementary":[126],"candidates":[127],"ensure":[129],"solution":[130],"diversity.":[131],"Across":[132],"benchmarks,":[134],"outperforms":[136],"strong":[137],"baselines":[138],"by":[139],"over":[140],"5":[141],"points":[142],"both":[144],"GPT-4.1":[145],"Qwen3-8B,":[147],"while":[148],"achieving":[149],"superior":[150],"efficiency":[151],"transferability.":[153],"The":[154],"code":[155],"will":[156],"released":[158],"once":[159],"paper":[160],"is":[161],"accepted.":[162]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-03-07T00:00:00"}
