{"id":"https://openalex.org/W4408017080","doi":"https://doi.org/10.1109/tmc.2025.3546466","title":"EdgeMoE: Empowering Sparse Large Language Models on Mobile Devices","display_name":"EdgeMoE: Empowering Sparse Large Language Models on Mobile Devices","publication_year":2025,"publication_date":"2025-02-27","ids":{"openalex":"https://openalex.org/W4408017080","doi":"https://doi.org/10.1109/tmc.2025.3546466"},"language":"en","primary_location":{"id":"doi:10.1109/tmc.2025.3546466","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmc.2025.3546466","pdf_url":null,"source":{"id":"https://openalex.org/S69141925","display_name":"IEEE Transactions on Mobile Computing","issn_l":"1536-1233","issn":["1536-1233","1558-0660","2161-9875"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Mobile Computing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5049544852","display_name":"Rongjie Yi","orcid":"https://orcid.org/0009-0003-6040-9596"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Rongjie Yi","raw_affiliation_strings":["State Key Laboratory of Networking and Switching Technology, Beijing University of Posts and Telecommunications, Beijing, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Networking and Switching Technology, Beijing University of Posts and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102749086","display_name":"Liwei Guo","orcid":"https://orcid.org/0000-0001-8516-8045"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Liwei Guo","raw_affiliation_strings":["University of Electronic Science and Technology of China, Chengdu, China","University of Electronic Science and Technology of China, China"],"affiliations":[{"raw_affiliation_string":"University of Electronic Science and Technology of China, Chengdu, China","institution_ids":["https://openalex.org/I150229711"]},{"raw_affiliation_string":"University of Electronic Science and Technology of China, China","institution_ids":["https://openalex.org/I150229711"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076282381","display_name":"Shu-Shang Wei","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shiyun Wei","raw_affiliation_strings":["Zhongguancun Laboratory, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Zhongguancun Laboratory, Beijing, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016717153","display_name":"Ao Zhou","orcid":"https://orcid.org/0000-0001-5743-9418"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ao Zhou","raw_affiliation_strings":["State Key Laboratory of Networking and Switching Technology, Beijing University of Posts and Telecommunications, Beijing, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Networking and Switching Technology, Beijing University of Posts and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054814598","display_name":"Shangguang Wang","orcid":"https://orcid.org/0000-0001-7245-1298"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shangguang Wang","raw_affiliation_strings":["State Key Laboratory of Networking and Switching Technology, Beijing University of Posts and Telecommunications, Beijing, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Networking and Switching Technology, Beijing University of Posts and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5089690212","display_name":"Mengwei Xu","orcid":"https://orcid.org/0000-0001-6271-6993"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mengwei Xu","raw_affiliation_strings":["State Key Laboratory of Networking and Switching Technology, Beijing University of Posts and Telecommunications, Beijing, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Networking and Switching Technology, Beijing University of Posts and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5049544852"],"corresponding_institution_ids":["https://openalex.org/I139759216"],"apc_list":null,"apc_paid":null,"fwci":43.0892,"has_fulltext":false,"cited_by_count":14,"citation_normalized_percentile":{"value":0.99754345,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":"24","issue":"8","first_page":"7059","last_page":"7073"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.9825999736785889,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.9825999736785889,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9667999744415283,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12607","display_name":"Personal Information Management and User Behavior","score":0.9639000296592712,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.842663049697876},{"id":"https://openalex.org/keywords/mobile-computing","display_name":"Mobile computing","score":0.4718599021434784},{"id":"https://openalex.org/keywords/mobile-device","display_name":"Mobile device","score":0.460789293050766},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.32315897941589355},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.29385727643966675},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.21754246950149536}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.842663049697876},{"id":"https://openalex.org/C144543869","wikidata":"https://www.wikidata.org/wiki/Q2738570","display_name":"Mobile computing","level":2,"score":0.4718599021434784},{"id":"https://openalex.org/C186967261","wikidata":"https://www.wikidata.org/wiki/Q5082128","display_name":"Mobile device","level":2,"score":0.460789293050766},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.32315897941589355},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.29385727643966675},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.21754246950149536}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tmc.2025.3546466","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmc.2025.3546466","pdf_url":null,"source":{"id":"https://openalex.org/S69141925","display_name":"IEEE Transactions on Mobile Computing","issn_l":"1536-1233","issn":["1536-1233","1558-0660","2161-9875"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Mobile Computing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4778515295","display_name":null,"funder_award_id":"U21B2016","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7483642958","display_name":null,"funder_award_id":"62032003","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8529090286","display_name":null,"funder_award_id":"62425203","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8882584335","display_name":null,"funder_award_id":"2024ZCJH11","funder_id":"https://openalex.org/F4320335787","funder_display_name":"Fundamental Research Funds for the Central Universities"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":71,"referenced_works":["https://openalex.org/W1977628053","https://openalex.org/W2150884987","https://openalex.org/W2546536770","https://openalex.org/W2612395950","https://openalex.org/W2623333128","https://openalex.org/W2625157458","https://openalex.org/W2626129225","https://openalex.org/W2860338957","https://openalex.org/W2889402930","https://openalex.org/W2909099954","https://openalex.org/W2931633209","https://openalex.org/W2996874060","https://openalex.org/W3045818398","https://openalex.org/W3049640275","https://openalex.org/W3100985894","https://openalex.org/W4236853429","https://openalex.org/W4282974189","https://openalex.org/W4306179717","https://openalex.org/W4318541554","https://openalex.org/W4383604511","https://openalex.org/W4385245566","https://openalex.org/W4385571944","https://openalex.org/W4385571951","https://openalex.org/W4385572016","https://openalex.org/W4385572416","https://openalex.org/W4389162698","https://openalex.org/W4389524473","https://openalex.org/W4402670692","https://openalex.org/W4406650295","https://openalex.org/W4410986266","https://openalex.org/W4411630326","https://openalex.org/W6677580257","https://openalex.org/W6732520560","https://openalex.org/W6778883912","https://openalex.org/W6780805062","https://openalex.org/W6784333009","https://openalex.org/W6788811087","https://openalex.org/W6790499563","https://openalex.org/W6793102544","https://openalex.org/W6796854725","https://openalex.org/W6805239564","https://openalex.org/W6810297391","https://openalex.org/W6810737565","https://openalex.org/W6810738896","https://openalex.org/W6838322825","https://openalex.org/W6843384352","https://openalex.org/W6846164622","https://openalex.org/W6847478871","https://openalex.org/W6848451824","https://openalex.org/W6848757079","https://openalex.org/W6850316863","https://openalex.org/W6850619096","https://openalex.org/W6850625674","https://openalex.org/W6851828392","https://openalex.org/W6852962002","https://openalex.org/W6853187832","https://openalex.org/W6853658832","https://openalex.org/W6853804809","https://openalex.org/W6854094408","https://openalex.org/W6854098556","https://openalex.org/W6854308872","https://openalex.org/W6854866820","https://openalex.org/W6855007554","https://openalex.org/W6855125150","https://openalex.org/W6855216553","https://openalex.org/W6855650390","https://openalex.org/W6856693227","https://openalex.org/W6857551316","https://openalex.org/W6857946224","https://openalex.org/W6858205958","https://openalex.org/W6860710830"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2048100608","https://openalex.org/W2090296580","https://openalex.org/W1576249345","https://openalex.org/W4243905374","https://openalex.org/W2785815065","https://openalex.org/W1796074903"],"abstract_inverted_index":{"Large":[0],"language":[1],"models":[2],"(LLMs)":[3],"such":[4],"as":[5],"GPTs":[6],"and":[7,34,44,88,113,179,190,200],"Mixtral-8x7B":[8],"have":[9],"revolutionized":[10],"machine":[11],"intelligence":[12],"due":[13,136],"to":[14,26,115,137],"their":[15,40],"exceptional":[16],"abilities":[17],"in":[18,102],"generic":[19],"ML":[20],"tasks.":[21],"Transiting":[22],"LLMs":[23,64,189],"from":[24],"datacenters":[25],"edge":[27,191],"devices":[28],"brings":[29],"benefits":[30],"like":[31],"better":[32],"privacy":[33],"availability,":[35],"but":[36,133],"is":[37,122],"challenged":[38],"by":[39,90,124],"massive":[41],"parameter":[42,75],"size":[43,76],"thus":[45],"unbearable":[46],"runtime":[47],"costs.":[48],"To":[49,140],"this":[50],"end,":[51],"we":[52],"present":[53],"<monospace":[54,82,148,193],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[55,83,149,194],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">EdgeMoE</monospace>,":[56],"an":[57],"on-device":[58],"inference":[59],"engine":[60],"for":[61],"mixture-of-expert":[62],"(MoE)":[63],"\u2013":[65],"a":[66,125],"popular":[67,187],"form":[68],"of":[69,177],"sparse":[70,138],"LLM":[71],"that":[72,128,159,171],"scales":[73],"its":[74],"with":[77,164,182],"almost":[78],"constant":[79],"computing":[80],"complexity.":[81],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">EdgeMoE</monospace>":[84,150,195],"achieves":[85],"both":[86],"memory-":[87],"compute-efficiency":[89],"partitioning":[91],"the":[92,95,143,161,173,183],"model":[93],"into":[94],"storage":[96,112],"hierarchy:":[97],"non-expert":[98],"weights":[99,107,130],"are":[100,108,131],"held":[101,109],"device":[103],"memory;":[104],"while":[105],"expert":[106,129,144,162,169],"on":[110],"external":[111],"fetched":[114],"memory":[116,198],"only":[117],"when":[118],"activated.":[119],"This":[120],"design":[121],"motivated":[123],"key":[126],"observation":[127],"bulky":[132],"infrequently":[134],"used":[135],"activation.":[139],"further":[141],"reduce":[142],"I/O":[145],"swapping":[146],"overhead,":[147],"incorporates":[151],"two":[152],"novel":[153],"techniques:":[154],"(1)":[155],"expert-wise":[156],"bitwidth":[157],"adaptation":[158],"reduces":[160],"sizes":[163],"tolerable":[165],"accuracy":[166],"loss;":[167],"(2)":[168],"preloading":[170],"predicts":[172],"activated":[174],"experts":[175],"ahead":[176],"time":[178],"preloads":[180],"it":[181],"compute-I/O":[184],"pipeline.":[185],"On":[186],"MoE":[188],"devices,":[192],"showcase":[196],"significant":[197],"savings":[199],"speedup":[201],"over":[202],"competitive":[203],"baselines.":[204]},"counts_by_year":[{"year":2026,"cited_by_count":6},{"year":2025,"cited_by_count":8}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
