{"id":"https://openalex.org/W7160930518","doi":"https://doi.org/10.48550/arxiv.2605.08887","title":"Ace-Skill: Bootstrapping Multimodal Agents with Prioritized and Clustered Evolution","display_name":"Ace-Skill: Bootstrapping Multimodal Agents with Prioritized and Clustered Evolution","publication_year":2026,"publication_date":"2026-05-09","ids":{"openalex":"https://openalex.org/W7160930518","doi":"https://doi.org/10.48550/arxiv.2605.08887"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.08887","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.08887","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.08887","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5135983657","display_name":"Feng Xiong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiong, Feng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135948875","display_name":"Zengbin Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Zengbin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135979985","display_name":"Yong Wang","orcid":"https://orcid.org/0000-0001-7547-1542"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Yong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041762969","display_name":"Xuecai Hu","orcid":"https://orcid.org/0000-0003-0483-0418"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hu, Xuecai","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135984429","display_name":"Jinghan He","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"He, Jinghan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135954245","display_name":"Liang Lin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lin, Liang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135928490","display_name":"Yuan Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Yuan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5135969677","display_name":"Xiangxiang Chu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chu, Xiangxiang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11704","display_name":"Mobile Crowdsensing and Crowdsourcing","score":0.0746999979019165,"subfield":{"id":"https://openalex.org/subfields/1706","display_name":"Computer Science Applications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11704","display_name":"Mobile Crowdsensing and Crowdsourcing","score":0.0746999979019165,"subfield":{"id":"https://openalex.org/subfields/1706","display_name":"Computer Science Applications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12090","display_name":"Language and cultural evolution","score":0.07400000095367432,"subfield":{"id":"https://openalex.org/subfields/3316","display_name":"Cultural Studies"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.066600002348423,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5633999705314636},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.5092999935150146},{"id":"https://openalex.org/keywords/bootstrapping","display_name":"Bootstrapping (finance)","score":0.4918000102043152},{"id":"https://openalex.org/keywords/relevance","display_name":"Relevance (law)","score":0.450300008058548},{"id":"https://openalex.org/keywords/sampling","display_name":"Sampling (signal processing)","score":0.36329999566078186},{"id":"https://openalex.org/keywords/path","display_name":"Path (computing)","score":0.35429999232292175},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.34940001368522644},{"id":"https://openalex.org/keywords/workflow","display_name":"Workflow","score":0.34619998931884766},{"id":"https://openalex.org/keywords/thompson-sampling","display_name":"Thompson sampling","score":0.329800009727478}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.789900004863739},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5633999705314636},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.5092999935150146},{"id":"https://openalex.org/C207609745","wikidata":"https://www.wikidata.org/wiki/Q4944086","display_name":"Bootstrapping (finance)","level":2,"score":0.4918000102043152},{"id":"https://openalex.org/C158154518","wikidata":"https://www.wikidata.org/wiki/Q7310970","display_name":"Relevance (law)","level":2,"score":0.450300008058548},{"id":"https://openalex.org/C140779682","wikidata":"https://www.wikidata.org/wiki/Q210868","display_name":"Sampling (signal processing)","level":3,"score":0.36329999566078186},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.362199991941452},{"id":"https://openalex.org/C2777735758","wikidata":"https://www.wikidata.org/wiki/Q817765","display_name":"Path (computing)","level":2,"score":0.35429999232292175},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.34940001368522644},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.34619998931884766},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.33889999985694885},{"id":"https://openalex.org/C73602740","wikidata":"https://www.wikidata.org/wiki/Q7795822","display_name":"Thompson sampling","level":3,"score":0.329800009727478},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.31839999556541443},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.31690001487731934},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.30489999055862427},{"id":"https://openalex.org/C12590798","wikidata":"https://www.wikidata.org/wiki/Q3933199","display_name":"Replication (statistics)","level":2,"score":0.302700012922287},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.30250000953674316},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.2838999927043915},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.2784999907016754},{"id":"https://openalex.org/C134121241","wikidata":"https://www.wikidata.org/wiki/Q899301","display_name":"Yield (engineering)","level":2,"score":0.2773999869823456},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.27379998564720154},{"id":"https://openalex.org/C2987255567","wikidata":"https://www.wikidata.org/wiki/Q33002955","display_name":"Knowledge graph","level":2,"score":0.2667999863624573},{"id":"https://openalex.org/C46686674","wikidata":"https://www.wikidata.org/wiki/Q466303","display_name":"Boosting (machine learning)","level":2,"score":0.26350000500679016},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.25929999351501465},{"id":"https://openalex.org/C43214815","wikidata":"https://www.wikidata.org/wiki/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.25440001487731934}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.08887","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.08887","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.08887","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.08887","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Self-evolving":[0],"agents":[1,207],"present":[2],"a":[3,64,87,121,145,196],"promising":[4],"path":[5],"toward":[6],"continual":[7],"adaptation":[8],"by":[9,23],"distilling":[10],"task":[11],"interactions":[12],"into":[13,144],"reusable":[14],"knowledge":[15,44,48,96,127,155,191],"artifacts.":[16],"In":[17,81],"practice,":[18],"this":[19,82],"paradigm":[20],"remains":[21],"hindered":[22],"two":[24],"coupled":[25],"bottlenecks:":[26],"data":[27],"inefficiency,":[28],"where":[29,46],"costly":[30],"rollout":[31,93],"effort":[32],"is":[33],"disproportionately":[34],"spent":[35],"on":[36,114],"low-value":[37],"samples":[38],"rather":[39],"than":[40],"informative":[41,115,151],"ones,":[42],"and":[43,57,95,116,120,131,138,202],"interference,":[45],"heterogeneous":[47],"stored":[49],"in":[50,68,76,148,174,195],"shared":[51],"repositories":[52],"leads":[53],"to":[54,111,183,199,208],"noisy":[55,73],"retrieval":[56,130],"task-misaligned":[58],"guidance.":[59],"Together,":[60],"these":[61],"issues":[62],"form":[63],"self-reinforcing":[65],"failure":[66],"loop":[67],"which":[69,75,149],"uninformative":[70],"rollouts":[71,113,152],"yield":[72],"knowledge,":[74],"turn":[77],"degrades":[78],"subsequent":[79,159],"rollouts.":[80,160],"work,":[83],"we":[84],"introduce":[85],"Ace-Skill,":[86],"co-evolutionary":[88],"framework":[89],"that":[90,124,156],"jointly":[91],"optimizes":[92],"allocation":[94],"organization":[97,139],"for":[98,128],"self-evolving":[99],"multimodal":[100,163],"agents.":[101],"Specifically,":[102],"Ace-Skill":[103,141,166],"combines":[104],"aprioritized":[105],"sampler":[106],"with":[107],"lazy-decay":[108],"proficiency":[109],"tracking":[110],"focus":[112],"insufficiently":[117],"mastered":[118],"samples,":[119],"clustered":[122],"organizer":[123],"semantically":[125],"clusters":[126],"cleaner":[129],"more":[132,150],"reliable":[133],"adaptation.":[134],"By":[135],"improving":[136],"sampling":[137],"together,":[140],"turns":[142],"self-evolution":[143],"virtuous":[146],"cycle":[147],"produce":[153],"higher-quality":[154],"supports":[157],"stronger":[158],"Across":[161],"four":[162],"tool-use":[164],"benchmarks,":[165],"delivers":[167],"strong":[168],"gains":[169],"(e.g.,":[170],"+35.46%":[171],"relative":[172],"improvement":[173],"Avg@4":[175],"accuracy),":[176],"enabling":[177],"an":[178],"opensource":[179],"35B":[180],"MoE":[181],"model":[182],"match":[184],"or":[185],"surpass":[186],"proprietary":[187],"models.":[188],"The":[189,215],"acquired":[190],"also":[192],"transfers":[193],"effectively":[194],"zero-shot":[197],"manner":[198],"smaller":[200],"9B":[201],"4B":[203],"models,":[204],"allowing":[205],"resource-constrained":[206],"inherit":[209],"advanced":[210],"capabilities":[211],"without":[212],"additional":[213],"training.":[214],"code":[216],"has":[217],"been":[218],"publicly":[219],"available":[220],"at":[221],"https://github.com/AMAP-ML/Ace-Skill.":[222]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-13T00:00:00"}
