{"id":"https://openalex.org/W7133528385","doi":"https://doi.org/10.48550/arxiv.2603.02766","title":"EvoSkill: Automated Skill Discovery for Multi-Agent Systems","display_name":"EvoSkill: Automated Skill Discovery for Multi-Agent Systems","publication_year":2026,"publication_date":"2026-03-03","ids":{"openalex":"https://openalex.org/W7133528385","doi":"https://doi.org/10.48550/arxiv.2603.02766"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.02766","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.02766","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.02766","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5104631569","display_name":"Salaheddin Alzubi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Alzubi, Salaheddin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128101064","display_name":"Noah Provenzano","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Provenzano, Noah","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128041109","display_name":"Jaydon Bingham","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bingham, Jaydon","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128039729","display_name":"Weiyuan Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Weiyuan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5110616429","display_name":"Tu Vu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Vu, Tu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.1331000030040741,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.1331000030040741,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.0957999974489212,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11574","display_name":"Artificial Intelligence in Games","score":0.0786999985575676,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6565999984741211},{"id":"https://openalex.org/keywords/flexibility","display_name":"Flexibility (engineering)","score":0.6294000148773193},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.57669997215271},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.4609000086784363},{"id":"https://openalex.org/keywords/coding","display_name":"Coding (social sciences)","score":0.44119998812675476},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.3203999996185303},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.31360000371932983}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7620999813079834},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6565999984741211},{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.6294000148773193},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.57669997215271},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5361999869346619},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5293999910354614},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.4609000086784363},{"id":"https://openalex.org/C179518139","wikidata":"https://www.wikidata.org/wiki/Q5140297","display_name":"Coding (social sciences)","level":2,"score":0.44119998812675476},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.3368000090122223},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.3203999996185303},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.31360000371932983},{"id":"https://openalex.org/C137635306","wikidata":"https://www.wikidata.org/wiki/Q182667","display_name":"Pareto principle","level":2,"score":0.2946000099182129},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.28619998693466187},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.28349998593330383},{"id":"https://openalex.org/C150899416","wikidata":"https://www.wikidata.org/wiki/Q1820378","display_name":"Transfer of learning","level":2,"score":0.28060001134872437},{"id":"https://openalex.org/C207685749","wikidata":"https://www.wikidata.org/wiki/Q2088941","display_name":"Domain knowledge","level":2,"score":0.27549999952316284},{"id":"https://openalex.org/C169903001","wikidata":"https://www.wikidata.org/wiki/Q3264987","display_name":"Reciprocity (cultural anthropology)","level":2,"score":0.2745000123977661},{"id":"https://openalex.org/C2780889827","wikidata":"https://www.wikidata.org/wiki/Q10756188","display_name":"Treasury","level":2,"score":0.27090001106262207},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.25699999928474426},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.2506999969482422}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.02766","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.02766","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.02766","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.02766","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.8142126798629761,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Coding":[0],"agents":[1,37],"are":[2,44,58],"increasingly":[3],"used":[4],"as":[5],"general-purpose":[6],"problem":[7],"solvers,":[8],"but":[9],"their":[10],"flexibility":[11],"does":[12],"not":[13],"by":[14,145,196],"itself":[15],"confer":[16],"the":[17,120,171,182,208],"domain":[18],"expertise":[19],"needed":[20],"for":[21],"specialized":[22],"tasks.":[23,65],"Recent":[24],"work":[25],"addresses":[26],"this":[27],"through":[28,79],"\\textit{agent":[29],"skills}:":[30],"reusable":[31,100],"workflows,":[32],"and":[33,46,64,75,95,150],"code,":[34],"that":[35,57,72,114,201],"augment":[36],"with":[38,156],"domain-specific":[39],"capabilities.":[40],"Most":[41],"skills":[42,78,89,113,176,186],"today":[43],"hand-crafted,":[45],"existing":[47,93],"evolutionary":[48],"approaches":[49],"optimize":[50],"low-level":[51],"artifacts":[52],"(e.g.":[53],"prompts":[54],"\\&amp;":[55],"code)":[56],"tightly":[59],"coupled":[60],"to":[61,92,181,192],"specific":[62],"models":[63],"We":[66,125,168],"introduce":[67],"\\textbf{EvoSkill},":[68],"a":[69,132,152,162],"self-evolving":[70],"framework":[71],"automatically":[73],"discovers":[74],"refines":[76],"agent":[77,107],"iterative":[80],"failure":[81],"analysis.":[82],"EvoSkill":[83,127],"analyzes":[84],"execution":[85],"failures,":[86],"proposes":[87],"new":[88],"or":[90],"edits":[91],"ones,":[94],"materializes":[96],"them":[97],"into":[98],"structured,":[99],"skill":[101],"folders.":[102],"A":[103],"Pareto":[104],"frontier":[105],"of":[106,175],"programs":[108],"governs":[109],"selection,":[110],"retaining":[111],"only":[112],"improve":[115],"held-out":[116],"validation":[117],"performance":[118],"while":[119],"underlying":[121],"model":[122],"remains":[123],"frozen.":[124],"evaluate":[126],"on":[128,178],"two":[129],"benchmarks:":[130],"OfficeQA,":[131],"grounded":[133],"reasoning":[134],"benchmark":[135,155],"over":[136],"U.S.\\":[137],"Treasury":[138],"data,":[139],"where":[140,159],"it":[141,160],"improves":[142],"exact-match":[143],"accuracy":[144,195],"\\textbf{7.3\\%}":[146],"(60.6\\%":[147],"$\\to$":[148,166],"67.9\\%);":[149],"SealQA,":[151],"search-augmented":[153],"QA":[154],"noisy":[157],"retrieval,":[158],"yields":[161],"\\textbf{12.1\\%}":[163],"gain":[164],"(26.6\\%":[165],"38.7\\%).":[167],"also":[169],"investigate":[170],"zero-shot":[172,191],"transfer":[173],"capabilties":[174],"evolved":[177,187],"one":[179],"task":[180],"other;":[183],"in":[184],"particular:":[185],"from":[188],"SealQA":[189],"transfers":[190],"BrowseComp,":[193],"improving":[194],"\\textbf{5.3\\%}":[197],"without":[198],"modification":[199],"demonstrating":[200],"skill-level":[202],"optimization":[203],"produces":[204],"transferable":[205],"capabilities":[206],"beyond":[207],"training":[209],"task.":[210]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-05T00:00:00"}
