{"id":"https://openalex.org/W4414760872","doi":"https://doi.org/10.1145/3711875.3729128","title":"CrossLM: A Data-Free Collaborative Fine-Tuning Framework for Large and Small Language Models","display_name":"CrossLM: A Data-Free Collaborative Fine-Tuning Framework for Large and Small Language Models","publication_year":2025,"publication_date":"2025-06-23","ids":{"openalex":"https://openalex.org/W4414760872","doi":"https://doi.org/10.1145/3711875.3729128"},"language":"en","primary_location":{"id":"doi:10.1145/3711875.3729128","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3711875.3729128","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3711875.3729128","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 23rd Annual International Conference on Mobile Systems, Applications and Services","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3711875.3729128","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5037386169","display_name":"Yongheng Deng","orcid":"https://orcid.org/0000-0003-3010-3812"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yongheng Deng","raw_affiliation_strings":["Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101278717","display_name":"Ziqing Qiao","orcid":null},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ziqing Qiao","raw_affiliation_strings":["Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100449357","display_name":"Ye Zhang","orcid":"https://orcid.org/0000-0003-3038-9259"},"institutions":[{"id":"https://openalex.org/I78675632","display_name":"Beijing Information Science & Technology University","ror":"https://ror.org/04xnqep60","country_code":"CN","type":"education","lineage":["https://openalex.org/I78675632"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ye Zhang","raw_affiliation_strings":["Beijing Information Science and Technology University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Beijing Information Science and Technology University, Beijing, China","institution_ids":["https://openalex.org/I78675632"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064212646","display_name":"Zhenya Ma","orcid":null},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhenya Ma","raw_affiliation_strings":["Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100356161","display_name":"Yang Liu","orcid":"https://orcid.org/0000-0003-3800-3533"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yang Liu","raw_affiliation_strings":["Institute for AI Industry Research, Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Institute for AI Industry Research, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5015419107","display_name":"Ju Ren","orcid":"https://orcid.org/0000-0003-2782-183X"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ju Ren","raw_affiliation_strings":["Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5037386169"],"corresponding_institution_ids":["https://openalex.org/I99065089"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.14308715,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"124","last_page":"137"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9801999926567078,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.5766000151634216},{"id":"https://openalex.org/keywords/resource","display_name":"Resource (disambiguation)","score":0.45820000767707825},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.43369999527931213},{"id":"https://openalex.org/keywords/upload","display_name":"Upload","score":0.43369999527931213},{"id":"https://openalex.org/keywords/natural-language","display_name":"Natural language","score":0.4239000082015991},{"id":"https://openalex.org/keywords/shared-resource","display_name":"Shared resource","score":0.34689998626708984},{"id":"https://openalex.org/keywords/data-sharing","display_name":"Data sharing","score":0.3407999873161316}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7037000060081482},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.5766000151634216},{"id":"https://openalex.org/C206345919","wikidata":"https://www.wikidata.org/wiki/Q20380951","display_name":"Resource (disambiguation)","level":2,"score":0.45820000767707825},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.45590001344680786},{"id":"https://openalex.org/C71901391","wikidata":"https://www.wikidata.org/wiki/Q7126699","display_name":"Upload","level":2,"score":0.43369999527931213},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.43369999527931213},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.4239000082015991},{"id":"https://openalex.org/C51332947","wikidata":"https://www.wikidata.org/wiki/Q1172305","display_name":"Shared resource","level":2,"score":0.34689998626708984},{"id":"https://openalex.org/C2779965156","wikidata":"https://www.wikidata.org/wiki/Q5227350","display_name":"Data sharing","level":3,"score":0.3407999873161316},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.3249000012874603},{"id":"https://openalex.org/C109359841","wikidata":"https://www.wikidata.org/wiki/Q728944","display_name":"Inclusion (mineral)","level":2,"score":0.28439998626708984},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.27970001101493835},{"id":"https://openalex.org/C2780609101","wikidata":"https://www.wikidata.org/wiki/Q17156588","display_name":"Resource management (computing)","level":2,"score":0.27810001373291016},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.26649999618530273},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.26589998602867126},{"id":"https://openalex.org/C2776187449","wikidata":"https://www.wikidata.org/wiki/Q1513879","display_name":"Natural language generation","level":3,"score":0.2612000107765198},{"id":"https://openalex.org/C2777319359","wikidata":"https://www.wikidata.org/wiki/Q6664444","display_name":"Local language","level":2,"score":0.26010000705718994},{"id":"https://openalex.org/C56739046","wikidata":"https://www.wikidata.org/wiki/Q192060","display_name":"Knowledge management","level":1,"score":0.2590000033378601},{"id":"https://openalex.org/C179603123","wikidata":"https://www.wikidata.org/wiki/Q1941921","display_name":"Modeling language","level":3,"score":0.25270000100135803}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3711875.3729128","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3711875.3729128","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3711875.3729128","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 23rd Annual International Conference on Mobile Systems, Applications and Services","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3711875.3729128","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3711875.3729128","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3711875.3729128","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 23rd Annual International Conference on Mobile Systems, Applications and Services","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4414760872.pdf","grobid_xml":"https://content.openalex.org/works/W4414760872.grobid-xml"},"referenced_works_count":20,"referenced_works":["https://openalex.org/W2251939518","https://openalex.org/W2978670439","https://openalex.org/W3034238904","https://openalex.org/W3085873903","https://openalex.org/W3094163844","https://openalex.org/W3176828726","https://openalex.org/W3210103168","https://openalex.org/W4205991051","https://openalex.org/W4214607237","https://openalex.org/W4226101686","https://openalex.org/W4226480431","https://openalex.org/W4292779060","https://openalex.org/W4317926941","https://openalex.org/W4372260089","https://openalex.org/W4382618460","https://openalex.org/W4384026508","https://openalex.org/W4385572634","https://openalex.org/W4386245189","https://openalex.org/W4402684073","https://openalex.org/W4404237407"],"related_works":[],"abstract_inverted_index":{"While":[0],"large":[1,101],"language":[2,104,113,131,182],"models":[3,114],"(LLMs)":[4],"are":[5,67,123],"endowed":[6],"with":[7,18,53],"broad":[8],"knowledge,":[9],"their":[10,54,117],"task-specific":[11,19,119,129,191],"performance":[12,192],"is":[13,24,29],"often":[14,59],"suboptimal.":[15],"Fine-tuning":[16],"LLMs":[17,62,79,195],"data":[20,28,159],"from":[21,146],"diverse":[22],"nodes":[23,45,109,143],"necessary,":[25],"but":[26],"this":[27,91,153],"typically":[30],"safeguarded":[31],"and":[32,50,66,102,133,160,163,180,196],"not":[33],"shared":[34],"publicly":[35],"due":[36],"to":[37,69,110,126],"privacy":[38],"concerns.":[39],"A":[40],"common":[41],"solution":[42],"involves":[43],"downstream":[44],"downloading":[46],"the":[47,73,128,137,140,149,166,190,200],"LLM":[48],"locally":[49],"fine-tuning":[51,82,98],"it":[52],"proprietary":[55,161],"data.":[56,120],"However,":[57],"owners":[58],"regard":[60],"pre-trained":[61],"as":[63],"valuable":[64],"assets":[65],"reluctant":[68],"share":[70],"them.":[71],"Additionally,":[72],"significant":[74],"computational":[75],"resources":[76],"required":[77],"by":[78,148],"make":[80],"local":[81],"impractical":[83],"for":[84,100],"many":[85],"nodes.":[86,170],"To":[87],"mitigate":[88],"these":[89],"problems,":[90],"paper":[92],"proposes":[93],"CrossLM,":[94],"a":[95,175],"data-free":[96],"collaborative":[97],"framework":[99],"small":[103],"models.":[105],"CrossLM":[106,155,187],"enables":[107],"resource-constrained":[108],"train":[111],"smaller":[112],"(SLMs)":[115],"using":[116],"private":[118,158],"These":[121],"SLMs":[122,141,197],"subsequently":[124],"leveraged":[125],"promote":[127],"natural":[130],"generation":[132],"understanding":[134],"capabilities":[135,202],"of":[136,142,169,177,193,203],"LLMs.":[138,151,204],"Simultaneously,":[139],"also":[144,164],"benefit":[145],"enhancement":[147],"fine-tuned":[150],"In":[152],"way,":[154],"avoids":[156],"sharing":[157],"LLMs,":[162],"reduces":[165],"resource":[167],"requirements":[168],"Through":[171],"extensive":[172],"experiments":[173],"across":[174],"range":[176],"benchmark":[178],"tasks":[179],"popular":[181],"models,":[183],"we":[184],"demonstrate":[185],"that":[186],"significantly":[188],"boosts":[189],"both":[194],"while":[198],"preserving":[199],"generalization":[201]},"counts_by_year":[],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
