{"id":"https://openalex.org/W7135229300","doi":"https://doi.org/10.48550/arxiv.2603.11076","title":"DIVE: Scaling Diversity in Agentic Task Synthesis for Generalizable Tool Use","display_name":"DIVE: Scaling Diversity in Agentic Task Synthesis for Generalizable Tool Use","publication_year":2026,"publication_date":"2026-03-10","ids":{"openalex":"https://openalex.org/W7135229300","doi":"https://doi.org/10.48550/arxiv.2603.11076"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.11076","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.11076","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.11076","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5129026937","display_name":"Aili Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Aili","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128978507","display_name":"Chi Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Chi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129092383","display_name":"Junteng Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Junteng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129042288","display_name":"Jiangjie Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Jiangjie","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101932247","display_name":"Cong Du","orcid":"https://orcid.org/0000-0003-4179-2836"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Du, Chengyu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102753810","display_name":"Yunji Li","orcid":"https://orcid.org/0000-0002-1252-9601"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Yunji","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128932862","display_name":"Ming Zhong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhong, Ming","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128936046","display_name":"Qin Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Qin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129016392","display_name":"Zhengmao Zhu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhu, Zhengmao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128946196","display_name":"Jiayuan Song","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Song, Jiayuan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102635132","display_name":"Ke Ji","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ji, Ke","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129090537","display_name":"Junxian He","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"He, Junxian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043176786","display_name":"Pengyu Zhao","orcid":"https://orcid.org/0000-0002-0514-2548"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Pengyu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5128961850","display_name":"Yanghua Xiao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiao, Yanghua","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.15360000729560852,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.15360000729560852,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.13230000436306,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.07509999722242355,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.7657999992370605},{"id":"https://openalex.org/keywords/executable","display_name":"Executable","score":0.7537000179290771},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6990000009536743},{"id":"https://openalex.org/keywords/scaling","display_name":"Scaling","score":0.6766999959945679},{"id":"https://openalex.org/keywords/diversity","display_name":"Diversity (politics)","score":0.6704999804496765},{"id":"https://openalex.org/keywords/baseline","display_name":"Baseline (sea)","score":0.5871000289916992},{"id":"https://openalex.org/keywords/trace","display_name":"TRACE (psycholinguistics)","score":0.4587000012397766},{"id":"https://openalex.org/keywords/task-analysis","display_name":"Task analysis","score":0.39340001344680786},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.3847000002861023}],"concepts":[{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.7657999992370605},{"id":"https://openalex.org/C160145156","wikidata":"https://www.wikidata.org/wiki/Q778586","display_name":"Executable","level":2,"score":0.7537000179290771},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7265999913215637},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6990000009536743},{"id":"https://openalex.org/C99844830","wikidata":"https://www.wikidata.org/wiki/Q102441924","display_name":"Scaling","level":2,"score":0.6766999959945679},{"id":"https://openalex.org/C2781316041","wikidata":"https://www.wikidata.org/wiki/Q1230584","display_name":"Diversity (politics)","level":2,"score":0.6704999804496765},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.5871000289916992},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4823000133037567},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.47350001335144043},{"id":"https://openalex.org/C75291252","wikidata":"https://www.wikidata.org/wiki/Q1315756","display_name":"TRACE (psycholinguistics)","level":2,"score":0.4587000012397766},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.39340001344680786},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.3847000002861023},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.3808000087738037},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.3776000142097473},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.36980000138282776},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3564999997615814},{"id":"https://openalex.org/C2778334786","wikidata":"https://www.wikidata.org/wiki/Q1586270","display_name":"Variation (astronomy)","level":2,"score":0.35249999165534973},{"id":"https://openalex.org/C2778166243","wikidata":"https://www.wikidata.org/wiki/Q5283969","display_name":"Diversity training","level":3,"score":0.2922999858856201},{"id":"https://openalex.org/C91682802","wikidata":"https://www.wikidata.org/wiki/Q620538","display_name":"Multidimensional scaling","level":2,"score":0.29109999537467957},{"id":"https://openalex.org/C112313634","wikidata":"https://www.wikidata.org/wiki/Q7886648","display_name":"Complement (music)","level":5,"score":0.27880001068115234},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.27709999680519104},{"id":"https://openalex.org/C198647972","wikidata":"https://www.wikidata.org/wiki/Q44475","display_name":"Spear","level":2,"score":0.2750999927520752},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.2736000120639801},{"id":"https://openalex.org/C18762648","wikidata":"https://www.wikidata.org/wiki/Q42213","display_name":"Work (physics)","level":2,"score":0.2734000086784363},{"id":"https://openalex.org/C88626702","wikidata":"https://www.wikidata.org/wiki/Q1128903","display_name":"Continuation","level":2,"score":0.2702000141143799},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2644999921321869},{"id":"https://openalex.org/C130440534","wikidata":"https://www.wikidata.org/wiki/Q14946528","display_name":"Conflation","level":2,"score":0.26249998807907104},{"id":"https://openalex.org/C171268870","wikidata":"https://www.wikidata.org/wiki/Q1486676","display_name":"GRASP","level":2,"score":0.25589999556541443},{"id":"https://openalex.org/C2777211547","wikidata":"https://www.wikidata.org/wiki/Q17141490","display_name":"Training (meteorology)","level":2,"score":0.25459998846054077},{"id":"https://openalex.org/C151201525","wikidata":"https://www.wikidata.org/wiki/Q177239","display_name":"Limit (mathematics)","level":2,"score":0.2540000081062317}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.11076","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.11076","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.11076","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.11076","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Recent":[0],"work":[1],"synthesizes":[2],"agentic":[3],"tasks":[4,15,39,76],"for":[5,159],"post-training":[6],"tool-using":[7],"LLMs,":[8],"yet":[9],"robust":[10],"generalization":[11,46],"under":[12],"shifts":[13],"in":[14,29,117],"and":[16,43,55,74,98,102,139],"toolsets":[17],"remains":[18],"an":[19,62,103],"open":[20],"challenge.":[21],"We":[22,59],"trace":[23],"this":[24],"brittleness":[25],"to":[26,40],"insufficient":[27],"diversity":[28,33,91,153],"synthesized":[30],"tasks.":[31],"Scaling":[32],"is":[34],"difficult":[35],"because":[36],"training":[37],"requires":[38],"remain":[41],"executable":[42],"verifiable,":[44],"while":[45],"demands":[47],"coverage":[48,97],"of":[49],"diverse":[50],"tool":[51],"types,":[52],"toolset":[53,100],"combinations,":[54],"heterogeneous":[56],"tool-use":[57,112],"patterns.":[58],"propose":[60],"DIVE,":[61],"evidence-driven":[63],"recipe":[64],"that":[65,152],"inverts":[66],"synthesis":[67],"order,":[68],"executing":[69],"diverse,":[70],"real-world":[71],"tools":[72,116],"first":[73],"reverse-deriving":[75],"strictly":[77],"entailed":[78],"by":[79,86,131,145],"the":[80,141],"resulting":[81],"traces,":[82],"thereby":[83],"providing":[84],"grounding":[85],"construction.":[87],"DIVE":[88,123],"scales":[89],"structural":[90],"along":[92],"two":[93],"controllable":[94],"axes,":[95],"tool-pool":[96],"per-task":[99],"variety,":[101],"Evidence":[104],"Collection--Task":[105],"Derivation":[106],"loop":[107],"further":[108],"induces":[109],"rich":[110],"multi-step":[111],"patterns":[113],"across":[114,135],"373":[115],"five":[118],"domains.":[119],"Training":[120],"Qwen3-8B":[121],"on":[122],"data":[124],"(48k":[125],"SFT":[126],"+":[127],"3.2k":[128],"RL)":[129],"improves":[130],"+22":[132],"average":[133],"points":[134],"9":[136],"OOD":[137,160],"benchmarks":[138],"outperforms":[140,156],"strongest":[142],"8B":[143],"baseline":[144],"+68.":[146],"Remarkably,":[147],"controlled":[148],"scaling":[149,154,158],"analysis":[150],"reveals":[151],"consistently":[155],"quantity":[157],"generalization,":[161],"even":[162],"with":[163],"4x":[164],"less":[165],"data.":[166]},"counts_by_year":[],"updated_date":"2026-07-01T06:00:48.157686","created_date":"2026-03-14T00:00:00"}
