{"id":"https://openalex.org/W4405714780","doi":"https://doi.org/10.48550/arxiv.2412.15495","title":"TL-Training: A Task-Feature-Based Framework for Training Large Language Models in Tool Use","display_name":"TL-Training: A Task-Feature-Based Framework for Training Large Language Models in Tool Use","publication_year":2024,"publication_date":"2024-12-20","ids":{"openalex":"https://openalex.org/W4405714780","doi":"https://doi.org/10.48550/arxiv.2412.15495"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2412.15495","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2412.15495","pdf_url":"https://arxiv.org/pdf/2412.15495","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2412.15495","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100777718","display_name":"Junjie Ye","orcid":"https://orcid.org/0009-0004-0921-6323"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Ye, Junjie","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100864237","display_name":"Yilong Wu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Yilong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000525969","display_name":"Sixian Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Sixian","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100958962","display_name":"Yuming Yang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Yuming","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Xi, Zhiheng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xi, Zhiheng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058353652","display_name":"Tao Gui","orcid":"https://orcid.org/0000-0002-6154-0751"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gui, Tao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100360407","display_name":"Qi Zhang","orcid":"https://orcid.org/0000-0003-0947-4942"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Qi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000409439","display_name":"Jimmy Xiangji Huang","orcid":"https://orcid.org/0000-0003-1292-1491"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huang, Xuanjing","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100395978","display_name":"Peng Wang","orcid":"https://orcid.org/0000-0002-1328-5784"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Peng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101873354","display_name":"Zhongchao Shi","orcid":"https://orcid.org/0000-0002-5216-3827"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shi, Zhongchao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Fan, Jianping","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fan, Jianping","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5079606191","display_name":"Zhengyin Du","orcid":"https://orcid.org/0000-0002-7124-8754"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Du, Zhengyin","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":12,"corresponding_author_ids":["https://openalex.org/A5100777718"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9666000008583069,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9666000008583069,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/training","display_name":"Training (meteorology)","score":0.8525463342666626},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.7738330364227295},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.7392485737800598},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6675598621368408},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.47585269808769226},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4162237048149109},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.39277368783950806},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.15853747725486755},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.12692248821258545},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.06646785140037537},{"id":"https://openalex.org/keywords/systems-engineering","display_name":"Systems engineering","score":0.05729717016220093}],"concepts":[{"id":"https://openalex.org/C2777211547","wikidata":"https://www.wikidata.org/wiki/Q17141490","display_name":"Training (meteorology)","level":2,"score":0.8525463342666626},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.7738330364227295},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.7392485737800598},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6675598621368408},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.47585269808769226},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4162237048149109},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.39277368783950806},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.15853747725486755},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.12692248821258545},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.06646785140037537},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.05729717016220093},{"id":"https://openalex.org/C153294291","wikidata":"https://www.wikidata.org/wiki/Q25261","display_name":"Meteorology","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2412.15495","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2412.15495","pdf_url":"https://arxiv.org/pdf/2412.15495","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2412.15495","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2412.15495","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2412.15495","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2412.15495","pdf_url":"https://arxiv.org/pdf/2412.15495","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1121271761","display_name":null,"funder_award_id":"Program","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2087396116","display_name":null,"funder_award_id":"China","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3317480652","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5994120800","display_name":null,"funder_award_id":"Natural","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320309612","display_name":"Natural Science Foundation of Shanghai","ror":null},{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320327803","display_name":"Shanghai Rising-Star Program","ror":null}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4405714780.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W230091440","https://openalex.org/W2233261550","https://openalex.org/W2810751659","https://openalex.org/W258997015","https://openalex.org/W2997094352","https://openalex.org/W3216976533","https://openalex.org/W100620283","https://openalex.org/W4394050964","https://openalex.org/W2551249631","https://openalex.org/W3098003361"],"abstract_inverted_index":{"Large":[0],"language":[1],"models":[2],"(LLMs)":[3],"achieve":[4],"remarkable":[5],"advancements":[6],"by":[7,125,143],"leveraging":[8],"tools":[9],"to":[10,40,101,114],"interact":[11],"with":[12],"environments,":[13],"a":[14,75,86,109,177],"critical":[15],"step":[16],"toward":[17],"generalized":[18],"AI.":[19],"However,":[20],"the":[21,91,140],"standard":[22],"supervised":[23],"fine-tuning":[24],"(SFT)":[25],"approach,":[26],"which":[27],"relies":[28],"on":[29,81,131],"large-scale":[30],"datasets,":[31],"often":[32],"overlooks":[33],"task-specific":[34],"characteristics":[35],"in":[36,70,154,168,185],"tool":[37,71],"use,":[38],"leading":[39],"performance":[41,156],"bottlenecks.":[42],"To":[43],"address":[44],"this":[45],"issue,":[46],"we":[47,84],"analyze":[48],"three":[49],"existing":[50],"LLMs":[51,153],"and":[52,68,107,128,151,171,179,188],"uncover":[53],"key":[54,103],"insights:":[55],"training":[56,95,126,160,184],"data":[57,161,189],"can":[58],"inadvertently":[59],"impede":[60],"tool-use":[61,155,183],"behavior,":[62],"token":[63,99],"importance":[64],"is":[65],"distributed":[66],"unevenly,":[67],"errors":[69],"calls":[72],"fall":[73],"into":[74],"small":[76],"set":[77],"of":[78,93],"categories.":[79],"Building":[80],"these":[82],"findings,":[83],"propose~\\emph{TL-Training},":[85],"task-feature-based":[87],"framework":[88],"that":[89,139],"mitigates":[90],"effects":[92],"suboptimal":[94],"data,":[96],"dynamically":[97],"adjusts":[98],"weights":[100],"prioritize":[102],"tokens":[104],"during":[105],"SFT,":[106],"incorporates":[108],"robust":[110],"reward":[111],"mechanism":[112],"tailored":[113],"error":[115],"categories,":[116],"optimized":[117],"through":[118],"proximal":[119],"policy":[120],"optimization.":[121],"We":[122],"validate":[123],"TL-Training":[124],"CodeLLaMA-2-7B":[127],"evaluating":[129],"it":[130],"four":[132],"open-source":[133],"test":[134],"sets.":[135],"Our":[136],"results":[137],"demonstrate":[138],"LLM":[141],"trained":[142],"our":[144,164],"method":[145,165],"matches":[146],"or":[147],"surpasses":[148],"both":[149],"open-":[150],"closed-source":[152],"using":[157],"only":[158],"1,217":[159],"points.":[162],"Additionally,":[163],"enhances":[166],"robustness":[167],"noisy":[169],"environments":[170],"improves":[172],"general":[173],"task":[174],"performance,":[175],"offering":[176],"scalable":[178],"efficient":[180],"paradigm":[181],"for":[182],"LLMs.":[186],"Code":[187],"are":[190],"available":[191],"at":[192],"https://github.com/Junjie-Ye/TL-Training.":[193]},"counts_by_year":[],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
