{"id":"https://openalex.org/W4404570764","doi":"https://doi.org/10.48550/arxiv.2411.11266","title":"VersaTune: An Efficient Data Composition Framework for Training Multi-Capability LLMs","display_name":"VersaTune: An Efficient Data Composition Framework for Training Multi-Capability LLMs","publication_year":2024,"publication_date":"2024-11-18","ids":{"openalex":"https://openalex.org/W4404570764","doi":"https://doi.org/10.48550/arxiv.2411.11266"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2411.11266","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2411.11266","pdf_url":"https://arxiv.org/pdf/2411.11266","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2411.11266","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5113407835","display_name":"Keer Lu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lu, Keer","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113407836","display_name":"Keshi Zhao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Keshi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Zhang, Zhuoran","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Zhuoran","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Liang, Zheng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liang, Zheng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004427460","display_name":"Da Pan","orcid":"https://orcid.org/0000-0002-1618-7389"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pan, Da","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053410380","display_name":"Shusen Zhang","orcid":"https://orcid.org/0009-0002-1721-3865"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Shusen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108167595","display_name":"X. Wu","orcid":"https://orcid.org/0000-0001-7655-389X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Xin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112223588","display_name":"Guosheng Dong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dong, Guosheng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062357883","display_name":"Bin Cui","orcid":"https://orcid.org/0000-0003-1681-4677"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cui, Bin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Wang, Tengjiao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Tengjiao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5100459875","display_name":"Wentao Zhang","orcid":"https://orcid.org/0000-0003-4087-7280"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Wentao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":11,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9958999752998352,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9958999752998352,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/fine-tuning","display_name":"Fine-tuning","score":0.4903245270252228},{"id":"https://openalex.org/keywords/business","display_name":"Business","score":0.37504661083221436},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.10111764073371887}],"concepts":[{"id":"https://openalex.org/C157524613","wikidata":"https://www.wikidata.org/wiki/Q2828883","display_name":"Fine-tuning","level":2,"score":0.4903245270252228},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.37504661083221436},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.10111764073371887},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2411.11266","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2411.11266","pdf_url":"https://arxiv.org/pdf/2411.11266","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2411.11266","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2411.11266","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2411.11266","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2411.11266","pdf_url":"https://arxiv.org/pdf/2411.11266","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W4390306690","https://openalex.org/W1969209172","https://openalex.org/W4385572141","https://openalex.org/W4281997472","https://openalex.org/W3046366884","https://openalex.org/W1729894570","https://openalex.org/W4221149036","https://openalex.org/W4385570168","https://openalex.org/W2957565634"],"abstract_inverted_index":{"As":[0],"demonstrated":[1],"by":[2,111,183,208],"the":[3,17,47,64,101,107,112,119,125,158,202,212,216],"proprietary":[4],"Large":[5],"Language":[6],"Models":[7],"(LLMs)":[8],"such":[9],"as":[10],"GPT":[11],"and":[12,139,181,186],"Claude":[13],"series,":[14],"LLMs":[15],"have":[16],"potential":[18,138],"to":[19,163],"achieve":[20],"remarkable":[21],"proficiency":[22],"across":[23,74],"a":[24,38,83,195],"wide":[25],"range":[26],"of":[27,66,72,103,155,194,215],"domains,":[28],"including":[29,178],"law,":[30],"medicine,":[31],"finance,":[32],"science,":[33],"code,":[34],"etc.,":[35],"all":[36],"within":[37,106],"single":[39],"model.":[40],"These":[41],"capabilities":[42,94],"are":[43,131],"further":[44],"augmented":[45],"during":[46,62,95],"Supervised":[48],"Fine-Tuning":[49],"(SFT)":[50],"phase.":[51],"Despite":[52],"their":[53,136],"potential,":[54],"existing":[55,121],"work":[56],"mainly":[57],"focuses":[58],"on":[59,135],"domain-specific":[60,104],"enhancements":[61],"fine-tuning,":[63],"challenge":[65],"which":[67],"lies":[68],"in":[69,149,157,189,205],"catastrophic":[70],"forgetting":[71,140],"knowledge":[73,105,122],"other":[75,206],"domains.":[76],"In":[77],"this":[78],"study,":[79],"we":[80,168],"introduce":[81],"**VersaTune**,":[82],"novel":[84],"data":[85,114],"composition":[86,115],"framework":[87],"designed":[88],"for":[89],"enhancing":[90],"LLMs'":[91],"overall":[92,159],"multi-domain":[93,150],"training.":[96],"We":[97],"begin":[98],"with":[99,118,152],"detecting":[100],"distribution":[102],"base":[108],"model,":[109],"followed":[110],"training":[113,127,213],"that":[116,145,170],"aligns":[117],"model's":[120],"distribution.":[123],"During":[124],"subsequent":[126],"process,":[128],"domain":[129,165,197],"weights":[130],"dynamically":[132],"adjusted":[133],"based":[134],"learnable":[137],"degree.":[141],"Experimental":[142],"results":[143],"indicate":[144],"VersaTune":[146,173,200],"is":[147,198],"effective":[148],"fostering,":[151],"an":[153],"improvement":[154],"35.21\\%":[156],"multi-ability":[160],"performances":[161],"compared":[162],"uniform":[164],"weights.":[166],"Furthermore,":[167],"find":[169],"Qwen-2.5-32B":[171],"+":[172],"even":[174],"surpasses":[175],"frontier":[176],"models,":[177],"GPT-4o,":[179],"Claude3.5-Sonnet":[180],"DeepSeek-V3":[182],"0.86\\%,":[184],"4.76\\%":[185],"4.60\\%.":[187],"Additionally,":[188],"scenarios":[190],"where":[191],"flexible":[192],"expansion":[193],"specific":[196],"required,":[199],"reduces":[201],"performance":[203],"degradation":[204],"domains":[207],"38.77\\%,":[209],"while":[210],"preserving":[211],"efficacy":[214],"target":[217],"domain.":[218]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2024-11-21T00:00:00"}
