{"id":"https://openalex.org/W4414538416","doi":"https://doi.org/10.1109/icc52391.2025.11161045","title":"Towards Expert Models Deployment Cost Optimization in Edge Computing Networks","display_name":"Towards Expert Models Deployment Cost Optimization in Edge Computing Networks","publication_year":2025,"publication_date":"2025-06-08","ids":{"openalex":"https://openalex.org/W4414538416","doi":"https://doi.org/10.1109/icc52391.2025.11161045"},"language":"en","primary_location":{"id":"doi:10.1109/icc52391.2025.11161045","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icc52391.2025.11161045","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICC 2025 - IEEE International Conference on Communications","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103174120","display_name":"Jiaqi Ren","orcid":"https://orcid.org/0000-0002-1562-7135"},"institutions":[{"id":"https://openalex.org/I4800084","display_name":"Southwest Jiaotong University","ror":"https://ror.org/00hn7w693","country_code":"CN","type":"education","lineage":["https://openalex.org/I4800084"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jiaqi Ren","raw_affiliation_strings":["School of Computing and Artificial Intelligence, Southwest Jiaotong University,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computing and Artificial Intelligence, Southwest Jiaotong University,China","institution_ids":["https://openalex.org/I4800084"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5115596972","display_name":"Chao Wang","orcid":"https://orcid.org/0009-0007-3911-4645"},"institutions":[{"id":"https://openalex.org/I181565077","display_name":"Georgia State University","ror":"https://ror.org/03qt6ba18","country_code":"US","type":"education","lineage":["https://openalex.org/I181565077"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Chao Wang","raw_affiliation_strings":["Georgia State University,Department of Computer Science,USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Georgia State University,Department of Computer Science,USA","institution_ids":["https://openalex.org/I181565077"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006869296","display_name":"Yihan Zhong","orcid":"https://orcid.org/0000-0002-1462-3642"},"institutions":[{"id":"https://openalex.org/I181565077","display_name":"Georgia State University","ror":"https://ror.org/03qt6ba18","country_code":"US","type":"education","lineage":["https://openalex.org/I181565077"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yihan Zhong","raw_affiliation_strings":["Georgia State University,Department of Computer Science,USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Georgia State University,Department of Computer Science,USA","institution_ids":["https://openalex.org/I181565077"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043877842","display_name":"Shaohua Cao","orcid":"https://orcid.org/0000-0001-8287-2942"},"institutions":[{"id":"https://openalex.org/I4210162190","display_name":"China University of Petroleum, East China","ror":"https://ror.org/05gbn2817","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210162190"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shaohua Cao","raw_affiliation_strings":["College of Computer Science and Technology, China University of Petroleum (East China),Qingdao,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology, China University of Petroleum (East China),Qingdao,China","institution_ids":["https://openalex.org/I4210162190"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079356223","display_name":"Danyang Zheng","orcid":"https://orcid.org/0000-0002-3031-7856"},"institutions":[{"id":"https://openalex.org/I4800084","display_name":"Southwest Jiaotong University","ror":"https://ror.org/00hn7w693","country_code":"CN","type":"education","lineage":["https://openalex.org/I4800084"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Danyang Zheng","raw_affiliation_strings":["School of Computing and Artificial Intelligence, Southwest Jiaotong University,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computing and Artificial Intelligence, Southwest Jiaotong University,China","institution_ids":["https://openalex.org/I4800084"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5069042354","display_name":"Xiaojun Cao","orcid":"https://orcid.org/0000-0001-5670-8196"},"institutions":[{"id":"https://openalex.org/I181565077","display_name":"Georgia State University","ror":"https://ror.org/03qt6ba18","country_code":"US","type":"education","lineage":["https://openalex.org/I181565077"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xiaojun Cao","raw_affiliation_strings":["Georgia State University,Department of Computer Science,USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Georgia State University,Department of Computer Science,USA","institution_ids":["https://openalex.org/I181565077"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5103174120"],"corresponding_institution_ids":["https://openalex.org/I4800084"],"apc_list":null,"apc_paid":null,"fwci":1.3335,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.8580647,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"838","last_page":"843"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10273","display_name":"IoT and Edge/Fog Computing","score":0.9266999959945679,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10273","display_name":"IoT and Edge/Fog Computing","score":0.9266999959945679,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11891","display_name":"Big Data and Business Intelligence","score":0.9175999760627747,"subfield":{"id":"https://openalex.org/subfields/1404","display_name":"Management Information Systems"},"field":{"id":"https://openalex.org/fields/14","display_name":"Business, Management and Accounting"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/software-deployment","display_name":"Software deployment","score":0.921500027179718},{"id":"https://openalex.org/keywords/enhanced-data-rates-for-gsm-evolution","display_name":"Enhanced Data Rates for GSM Evolution","score":0.6460000276565552},{"id":"https://openalex.org/keywords/expert-system","display_name":"Expert system","score":0.582099974155426},{"id":"https://openalex.org/keywords/resource","display_name":"Resource (disambiguation)","score":0.4934000074863434},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.46160000562667847},{"id":"https://openalex.org/keywords/edge-device","display_name":"Edge device","score":0.37869998812675476},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.36500000953674316}],"concepts":[{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.921500027179718},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6888999938964844},{"id":"https://openalex.org/C162307627","wikidata":"https://www.wikidata.org/wiki/Q204833","display_name":"Enhanced Data Rates for GSM Evolution","level":2,"score":0.6460000276565552},{"id":"https://openalex.org/C58328972","wikidata":"https://www.wikidata.org/wiki/Q184609","display_name":"Expert system","level":2,"score":0.582099974155426},{"id":"https://openalex.org/C206345919","wikidata":"https://www.wikidata.org/wiki/Q20380951","display_name":"Resource (disambiguation)","level":2,"score":0.4934000074863434},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.46160000562667847},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.3971000015735626},{"id":"https://openalex.org/C138236772","wikidata":"https://www.wikidata.org/wiki/Q25098575","display_name":"Edge device","level":3,"score":0.37869998812675476},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.36500000953674316},{"id":"https://openalex.org/C18762648","wikidata":"https://www.wikidata.org/wiki/Q42213","display_name":"Work (physics)","level":2,"score":0.35589998960494995},{"id":"https://openalex.org/C105002631","wikidata":"https://www.wikidata.org/wiki/Q4833645","display_name":"Subject-matter expert","level":3,"score":0.35569998621940613},{"id":"https://openalex.org/C2778456923","wikidata":"https://www.wikidata.org/wiki/Q5337692","display_name":"Edge computing","level":3,"score":0.335099995136261},{"id":"https://openalex.org/C126831891","wikidata":"https://www.wikidata.org/wiki/Q221673","display_name":"Host (biology)","level":2,"score":0.30640000104904175},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2939999997615814},{"id":"https://openalex.org/C2780009758","wikidata":"https://www.wikidata.org/wiki/Q6804172","display_name":"Measure (data warehouse)","level":2,"score":0.27489998936653137},{"id":"https://openalex.org/C3017813396","wikidata":"https://www.wikidata.org/wiki/Q17078173","display_name":"Resource constraints","level":2,"score":0.2660999894142151},{"id":"https://openalex.org/C42475967","wikidata":"https://www.wikidata.org/wiki/Q194292","display_name":"Operations research","level":1,"score":0.26420000195503235},{"id":"https://openalex.org/C29202148","wikidata":"https://www.wikidata.org/wiki/Q287260","display_name":"Resource allocation","level":2,"score":0.263700008392334},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.2513999938964844}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icc52391.2025.11161045","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icc52391.2025.11161045","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICC 2025 - IEEE International Conference on Communications","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2915584714","display_name":null,"funder_award_id":"62302404","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":9,"referenced_works":["https://openalex.org/W3192709954","https://openalex.org/W4386025630","https://openalex.org/W4386232099","https://openalex.org/W4389519294","https://openalex.org/W4392297945","https://openalex.org/W4396790588","https://openalex.org/W4401024183","https://openalex.org/W4403257136","https://openalex.org/W4403320241"],"related_works":[],"abstract_inverted_index":{"With":[0],"the":[1,84,91,115,167],"widespread":[2],"adoption":[3],"of":[4,106,172,178],"large":[5],"language":[6],"models":[7,59,102,117,149,156],"(LLMs)":[8],"like":[9],"GPT,":[10],"user":[11],"experiences":[12],"in":[13,119,176],"various":[14],"interactive":[15],"applications":[16],"have":[17],"significantly":[18],"improved.":[19],"However,":[20],"reports":[21],"from":[22,103],"OpenAI":[23],"highlight":[24],"that":[25,163],"GPT":[26,58],"clients":[27],"are":[28,55],"now":[29],"facing":[30],"high":[31],"response":[32],"delays":[33],"and":[34,67,150,174],"frequent":[35],"interruptions,":[36],"particularly":[37],"during":[38],"peak":[39],"usage":[40],"hours,":[41],"due":[42],"to":[43,51,75,81,98,146],"limited":[44],"computation":[45],"resources.":[46],"This":[47,88],"challenge":[48],"is":[49,74],"expected":[50],"escalate":[52],"as":[53],"machines":[54],"interacting":[56],"with":[57,63],"at":[60,95],"higher":[61],"frequencies,":[62],"greater":[64],"data":[65],"volumes,":[66],"over":[68],"longer":[69],"lifecycles.":[70],"A":[71],"promising":[72],"solution":[73],"deploy":[76,100],"LLMs":[77],"across":[78],"edge":[79,111,120],"networks":[80,121],"efficiently":[82],"distribute":[83],"huge":[85],"resource":[86],"demands.":[87],"work":[89],"presents":[90],"very":[92],"first":[93],"efforts":[94],"exploring":[96],"how":[97],"cost-effectively":[99],"expert":[101,116,148,155],"a":[104,134,152],"mixture":[105],"experts":[107],"(MoE)":[108],"LLM":[109],"within":[110],"networks.":[112],"We":[113],"introduce":[114],"deployment":[118,127,157,179],"(EMD-EN)":[122],"problem,":[123],"focusing":[124],"on":[125],"optimizing":[126],"costs.":[128],"To":[129],"address":[130],"this,":[131],"we":[132],"propose":[133],"novel":[135],"least":[136],"cost":[137,180],"gain":[138],"(LCG)":[139],"measure":[140],"for":[141],"selecting":[142],"appropriate":[143],"physical":[144],"nodes":[145],"host":[147],"present":[151],"corresponding":[153],"LCG-based":[154],"(LCGEMD)":[158],"algorithm.":[159],"Extensive":[160],"simulations":[161],"show":[162],"our":[164],"approach":[165],"outperforms":[166],"benchmarks":[168],"by":[169],"an":[170],"average":[171],"17.31%":[173],"36.98%":[175],"terms":[177],"reduction.":[181]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-04-29T09:16:38.111599","created_date":"2025-10-10T00:00:00"}
