{"id":"https://openalex.org/W4416286402","doi":"https://doi.org/10.1109/jstsp.2025.3633550","title":"MobiLLM: Enabling On-Device Fine-Tuning of Billion-Sized LLMs via Server-Assisted Side-Tuning","display_name":"MobiLLM: Enabling On-Device Fine-Tuning of Billion-Sized LLMs via Server-Assisted Side-Tuning","publication_year":2025,"publication_date":"2025-10-01","ids":{"openalex":"https://openalex.org/W4416286402","doi":"https://doi.org/10.1109/jstsp.2025.3633550"},"language":null,"primary_location":{"id":"doi:10.1109/jstsp.2025.3633550","is_oa":false,"landing_page_url":"https://doi.org/10.1109/jstsp.2025.3633550","pdf_url":null,"source":{"id":"https://openalex.org/S42167783","display_name":"IEEE Journal of Selected Topics in Signal Processing","issn_l":"1932-4553","issn":["1932-4553","1941-0484"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Journal of Selected Topics in Signal Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Liang Li","orcid":"https://orcid.org/0000-0003-3369-3571"},"institutions":[{"id":"https://openalex.org/I4210136793","display_name":"Peng Cheng Laboratory","ror":"https://ror.org/03qdqbt06","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210136793"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Liang Li","raw_affiliation_strings":["Frontier Research Center, Pengcheng Laboratory, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Frontier Research Center, Pengcheng Laboratory, Shenzhen, China","institution_ids":["https://openalex.org/I4210136793"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Xingke Yang","orcid":"https://orcid.org/0009-0005-1243-0029"},"institutions":[{"id":"https://openalex.org/I44461941","display_name":"University of Houston","ror":"https://ror.org/048sx0r50","country_code":"US","type":"education","lineage":["https://openalex.org/I44461941"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xingke Yang","raw_affiliation_strings":["Department of Electrical and Computer Engineering, University of Houston, Houston, TX, USA","Department of Electrical and Computer Engineering, University of Houston, Houston, USA"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, University of Houston, Houston, TX, USA","institution_ids":["https://openalex.org/I44461941"]},{"raw_affiliation_string":"Department of Electrical and Computer Engineering, University of Houston, Houston, USA","institution_ids":["https://openalex.org/I44461941"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074854979","display_name":"Wen Wu","orcid":"https://orcid.org/0000-0002-0458-1282"},"institutions":[{"id":"https://openalex.org/I4210136793","display_name":"Peng Cheng Laboratory","ror":"https://ror.org/03qdqbt06","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210136793"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wen Wu","raw_affiliation_strings":["Frontier Research Center, Pengcheng Laboratory, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Frontier Research Center, Pengcheng Laboratory, Shenzhen, China","institution_ids":["https://openalex.org/I4210136793"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100769481","display_name":"Hao Wang","orcid":"https://orcid.org/0000-0002-1444-2657"},"institutions":[{"id":"https://openalex.org/I108468826","display_name":"Stevens Institute of Technology","ror":"https://ror.org/02z43xh36","country_code":"US","type":"education","lineage":["https://openalex.org/I108468826"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Hao Wang","raw_affiliation_strings":["Department of Electrical and Computer Engineering, Stevens Institue of Technology, Hoboken, NJ, USA","Department of Electrical and Computer Engineering, Stevens Institue of Technology, Hoboken, USA"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, Stevens Institue of Technology, Hoboken, NJ, USA","institution_ids":["https://openalex.org/I108468826"]},{"raw_affiliation_string":"Department of Electrical and Computer Engineering, Stevens Institue of Technology, Hoboken, USA","institution_ids":["https://openalex.org/I108468826"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016337773","display_name":"Tomoaki Ohtsuki","orcid":null},"institutions":[{"id":"https://openalex.org/I203951103","display_name":"Keio University","ror":"https://ror.org/02kn6nx58","country_code":"JP","type":"education","lineage":["https://openalex.org/I203951103"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Tomoaki Ohtsuki","raw_affiliation_strings":["Department of Information and Computer Science, Keio University, Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"Department of Information and Computer Science, Keio University, Tokyo, Japan","institution_ids":["https://openalex.org/I203951103"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Xin Fu","orcid":"https://orcid.org/0000-0002-9458-4769"},"institutions":[{"id":"https://openalex.org/I44461941","display_name":"University of Houston","ror":"https://ror.org/048sx0r50","country_code":"US","type":"education","lineage":["https://openalex.org/I44461941"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xin Fu","raw_affiliation_strings":["Department of Electrical and Computer Engineering, University of Houston, Houston, TX, USA","Department of Electrical and Computer Engineering, University of Houston, Houston, USA"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, University of Houston, Houston, TX, USA","institution_ids":["https://openalex.org/I44461941"]},{"raw_affiliation_string":"Department of Electrical and Computer Engineering, University of Houston, Houston, USA","institution_ids":["https://openalex.org/I44461941"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047722991","display_name":"Miao Pan","orcid":"https://orcid.org/0000-0003-2138-4413"},"institutions":[{"id":"https://openalex.org/I44461941","display_name":"University of Houston","ror":"https://ror.org/048sx0r50","country_code":"US","type":"education","lineage":["https://openalex.org/I44461941"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Miao Pan","raw_affiliation_strings":["Department of Electrical and Computer Engineering, University of Houston, Houston, TX, USA","Department of Electrical and Computer Engineering, University of Houston, Houston, USA"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, University of Houston, Houston, TX, USA","institution_ids":["https://openalex.org/I44461941"]},{"raw_affiliation_string":"Department of Electrical and Computer Engineering, University of Houston, Houston, USA","institution_ids":["https://openalex.org/I44461941"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100773343","display_name":"Xuemin Shen","orcid":"https://orcid.org/0000-0002-4140-287X"},"institutions":[{"id":"https://openalex.org/I151746483","display_name":"University of Waterloo","ror":"https://ror.org/01aff2v68","country_code":"CA","type":"education","lineage":["https://openalex.org/I151746483"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Xuemin Shen","raw_affiliation_strings":["Department of Electrical and Computer Engineering, University of Waterloo, Waterloo, Ontario, Canada","Department of Electrical and Computer Engineering, University of Waterloo, Waterloo, Canada"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, University of Waterloo, Waterloo, Ontario, Canada","institution_ids":["https://openalex.org/I151746483"]},{"raw_affiliation_string":"Department of Electrical and Computer Engineering, University of Waterloo, Waterloo, Canada","institution_ids":["https://openalex.org/I151746483"]}]}],"institutions":[],"countries_distinct_count":4,"institutions_distinct_count":8,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I4210136793"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.347823,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"19","issue":"7","first_page":"1251","last_page":"1265"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.10360000282526016,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.10360000282526016,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.07580000162124634,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14347","display_name":"Big Data and Digital Economy","score":0.06930000334978104,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/mobile-device","display_name":"Mobile device","score":0.7454000115394592},{"id":"https://openalex.org/keywords/backpropagation","display_name":"Backpropagation","score":0.6715999841690063},{"id":"https://openalex.org/keywords/mobile-computing","display_name":"Mobile computing","score":0.5209000110626221},{"id":"https://openalex.org/keywords/quantization","display_name":"Quantization (signal processing)","score":0.5199999809265137},{"id":"https://openalex.org/keywords/mobile-telephony","display_name":"Mobile telephony","score":0.5029000043869019},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.4674000144004822},{"id":"https://openalex.org/keywords/server","display_name":"Server","score":0.4458000063896179},{"id":"https://openalex.org/keywords/scheme","display_name":"Scheme (mathematics)","score":0.40400001406669617},{"id":"https://openalex.org/keywords/mobile-processor","display_name":"Mobile processor","score":0.4007999897003174}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8287000060081482},{"id":"https://openalex.org/C186967261","wikidata":"https://www.wikidata.org/wiki/Q5082128","display_name":"Mobile device","level":2,"score":0.7454000115394592},{"id":"https://openalex.org/C155032097","wikidata":"https://www.wikidata.org/wiki/Q798503","display_name":"Backpropagation","level":3,"score":0.6715999841690063},{"id":"https://openalex.org/C144543869","wikidata":"https://www.wikidata.org/wiki/Q2738570","display_name":"Mobile computing","level":2,"score":0.5209000110626221},{"id":"https://openalex.org/C28855332","wikidata":"https://www.wikidata.org/wiki/Q198099","display_name":"Quantization (signal processing)","level":2,"score":0.5199999809265137},{"id":"https://openalex.org/C95491727","wikidata":"https://www.wikidata.org/wiki/Q992968","display_name":"Mobile telephony","level":3,"score":0.5029000043869019},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.47699999809265137},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.4674000144004822},{"id":"https://openalex.org/C93996380","wikidata":"https://www.wikidata.org/wiki/Q44127","display_name":"Server","level":2,"score":0.4458000063896179},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.40400001406669617},{"id":"https://openalex.org/C1665295","wikidata":"https://www.wikidata.org/wiki/Q6887219","display_name":"Mobile processor","level":5,"score":0.4007999897003174},{"id":"https://openalex.org/C176649486","wikidata":"https://www.wikidata.org/wiki/Q2308807","display_name":"Memory management","level":3,"score":0.3986000120639801},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.36550000309944153},{"id":"https://openalex.org/C78834623","wikidata":"https://www.wikidata.org/wiki/Q640394","display_name":"Mobile broadband","level":3,"score":0.3287000060081482},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.3222000002861023},{"id":"https://openalex.org/C162307627","wikidata":"https://www.wikidata.org/wiki/Q204833","display_name":"Enhanced Data Rates for GSM Evolution","level":2,"score":0.3156999945640564},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.31220000982284546},{"id":"https://openalex.org/C138236772","wikidata":"https://www.wikidata.org/wiki/Q25098575","display_name":"Edge device","level":3,"score":0.3046000003814697},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.29280000925064087},{"id":"https://openalex.org/C4373008","wikidata":"https://www.wikidata.org/wiki/Q513349","display_name":"File server","level":2,"score":0.2903999984264374},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.29030001163482666},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.28139999508857727},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.28110000491142273},{"id":"https://openalex.org/C47487241","wikidata":"https://www.wikidata.org/wiki/Q5227230","display_name":"Data access","level":2,"score":0.2669999897480011},{"id":"https://openalex.org/C2781307350","wikidata":"https://www.wikidata.org/wiki/Q6887221","display_name":"Mobile radio","level":2,"score":0.26019999384880066},{"id":"https://openalex.org/C160949748","wikidata":"https://www.wikidata.org/wiki/Q1365703","display_name":"Mobile payment","level":3,"score":0.25760000944137573},{"id":"https://openalex.org/C2776061582","wikidata":"https://www.wikidata.org/wiki/Q25325231","display_name":"Mobile edge computing","level":3,"score":0.2547999918460846},{"id":"https://openalex.org/C127353759","wikidata":"https://www.wikidata.org/wiki/Q6887091","display_name":"Mobile database","level":4,"score":0.2515000104904175}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/jstsp.2025.3633550","is_oa":false,"landing_page_url":"https://doi.org/10.1109/jstsp.2025.3633550","pdf_url":null,"source":{"id":"https://openalex.org/S42167783","display_name":"IEEE Journal of Selected Topics in Signal Processing","issn_l":"1932-4553","issn":["1932-4553","1941-0484"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Journal of Selected Topics in Signal Processing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G5100585654","display_name":null,"funder_award_id":"CNS-2318664","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G5309008270","display_name":null,"funder_award_id":"CSR-2403249","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G6778322719","display_name":null,"funder_award_id":"62201311","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6781623049","display_name":null,"funder_award_id":"CNS-2107057","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G7199852738","display_name":null,"funder_award_id":"62201071","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7270636821","display_name":null,"funder_award_id":"CNS-2431596","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":27,"referenced_works":["https://openalex.org/W2109553965","https://openalex.org/W2251939518","https://openalex.org/W2739351760","https://openalex.org/W2896457183","https://openalex.org/W2923014074","https://openalex.org/W2963748441","https://openalex.org/W2963846996","https://openalex.org/W2969388332","https://openalex.org/W2978670439","https://openalex.org/W2979826702","https://openalex.org/W3152952112","https://openalex.org/W3163231210","https://openalex.org/W3176828726","https://openalex.org/W4205946715","https://openalex.org/W4319778953","https://openalex.org/W4322766882","https://openalex.org/W4372260089","https://openalex.org/W4379033976","https://openalex.org/W4380926665","https://openalex.org/W4381785874","https://openalex.org/W4388692014","https://openalex.org/W4399121685","https://openalex.org/W4406856790","https://openalex.org/W4410294847","https://openalex.org/W4411446549","https://openalex.org/W4411799547","https://openalex.org/W4414539465"],"related_works":[],"abstract_inverted_index":{"On-device":[0],"fine-tuning":[1,54],"of":[2,11,14,125],"large":[3],"language":[4],"models":[5,18],"(LLMs)":[6],"has":[7],"attracted":[8],"a":[9,48,56,82,93,193],"lot":[10],"attention":[12],"because":[13],"its":[15],"tailoring":[16],"personalized":[17],"while":[19,73,143,161],"retaining":[20],"user":[21],"data":[22,132,154],"locally":[23],"on":[24,55,172],"the":[25,75,101,106,117,135,153,157],"mobile":[26,58,77,136,159,164,175,195],"device.":[27],"However,":[28],"it":[29],"faces":[30],"significant":[31],"challenges":[32],"due":[33],"to":[34,69,79,116,119,134,197,203,219],"prohibitive":[35],"memory":[36,165,208],"requirements":[37],"and":[38,138,166,182,210],"slow":[39],"training":[40,131],"speeds.":[41],"In":[42],"this":[43],"paper,":[44],"we":[45],"propose":[46],"MobiLLM,":[47],"novel":[49],"scheme":[50],"enabling":[51],"memory-efficient":[52],"LLM":[53],"single":[57],"device":[59,78,107,160,196],"via":[60,96],"server-assisted":[61],"side-tuning.":[62],"Particularly,":[63],"MobiLLM":[64,126,151,171,190],"strategically":[65],"offloads":[66],"backpropagation":[67,94,142],"computations":[68,146],"an":[70],"edge":[71],"server":[72,118,148],"allowing":[74],"resource-constrained":[76,194],"retain":[80],"merely":[81],"pretrained":[83],"backbone":[84],"model":[85],"with":[86,147],"frozen":[87],"parameters":[88],"during":[89],"finetuning.":[90],"It":[91],"constructs":[92],"bypass":[95],"parallel":[97],"adapters":[98],"decoupled":[99],"from":[100],"backbone.":[102],"During":[103],"forward":[104],"propagation,":[105],"employs":[108],"low":[109],"bitwidth":[110],"quantization":[111],"for":[112],"transmitting":[113],"intermediate":[114],"activations":[115],"reduce":[120],"communication":[121],"overhead.":[122],"The":[123],"advantage":[124],"lies":[127],"in:":[128],"1)":[129],"confining":[130],"strictly":[133],"device,":[137],"2)":[139],"eliminating":[140],"on-device":[141],"overlapping":[144],"local":[145,158],"execution.":[149],"Collectively,":[150],"ensures":[152],"never":[155],"leaves":[156],"significantly":[162],"reducing":[163],"computational":[167],"burdens.":[168],"We":[169],"implement":[170],"several":[173],"popular":[174],"devices,":[176],"including":[177],"NVIDIA":[178],"Jetson":[179],"Xavier":[180],"NX":[181],"CPU-only":[183],"laptops.":[184],"Extensive":[185],"experimental":[186],"results":[187],"demonstrate":[188],"that":[189],"can":[191],"enable":[192],"fine-tune":[198],"billion-sized":[199],"LLMs,":[200],"achieving":[201],"up":[202],"<inline-formula":[204,211],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[205,212],"xmlns:xlink=\"http://www.w3.org/1999/xlink\"><tex-math":[206,213],"notation=\"LaTeX\">$4\\times$</tex-math></inline-formula>":[207],"reduction":[209],"notation=\"LaTeX\">$2.3\\times$</tex-math></inline-formula>":[214],"faster":[215],"convergence":[216],"as":[217],"compared":[218],"state-of-the-art":[220],"baselines.":[221]},"counts_by_year":[],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-11-17T00:00:00"}
