{"id":"https://openalex.org/W4414170023","doi":"https://doi.org/10.1109/iwqos65803.2025.11143291","title":"MetaPipe: Incremental Deployment of Containerized AI Microservices for Edge Clouds","display_name":"MetaPipe: Incremental Deployment of Containerized AI Microservices for Edge Clouds","publication_year":2025,"publication_date":"2025-07-02","ids":{"openalex":"https://openalex.org/W4414170023","doi":"https://doi.org/10.1109/iwqos65803.2025.11143291"},"language":"en","primary_location":{"id":"doi:10.1109/iwqos65803.2025.11143291","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iwqos65803.2025.11143291","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/ACM 33rd International Symposium on Quality of Service (IWQoS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5079019595","display_name":"Qixin Li","orcid":"https://orcid.org/0000-0002-8325-5409"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Qixin Li","raw_affiliation_strings":["Beijing University of Posts and Telecommunications"],"affiliations":[{"raw_affiliation_string":"Beijing University of Posts and Telecommunications","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037920323","display_name":"Xiaoxu Ren","orcid":"https://orcid.org/0000-0002-3166-1405"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaoxu Ren","raw_affiliation_strings":["Beijing University of Posts and Telecommunications"],"affiliations":[{"raw_affiliation_string":"Beijing University of Posts and Telecommunications","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100741750","display_name":"Zhongyuan Wang","orcid":"https://orcid.org/0000-0002-9796-488X"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhongyuan Wang","raw_affiliation_strings":["Beijing University of Posts and Telecommunications"],"affiliations":[{"raw_affiliation_string":"Beijing University of Posts and Telecommunications","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100666106","display_name":"Haipeng Yao","orcid":"https://orcid.org/0000-0003-1391-7363"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haipeng Yao","raw_affiliation_strings":["Beijing University of Posts and Telecommunications"],"affiliations":[{"raw_affiliation_string":"Beijing University of Posts and Telecommunications","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060129988","display_name":"Yuan He","orcid":"https://orcid.org/0000-0002-6676-4009"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuan He","raw_affiliation_strings":["Tsinghua University"],"affiliations":[{"raw_affiliation_string":"Tsinghua University","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101877971","display_name":"Yunhao Liu","orcid":"https://orcid.org/0000-0002-6262-3313"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yunhao Liu","raw_affiliation_strings":["Tsinghua University"],"affiliations":[{"raw_affiliation_string":"Tsinghua University","institution_ids":["https://openalex.org/I99065089"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5079019595"],"corresponding_institution_ids":["https://openalex.org/I139759216"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.29717299,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10273","display_name":"IoT and Edge/Fog Computing","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10273","display_name":"IoT and Edge/Fog Computing","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12127","display_name":"Software System Performance and Reliability","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/microservices","display_name":"Microservices","score":0.9138000011444092},{"id":"https://openalex.org/keywords/software-deployment","display_name":"Software deployment","score":0.8902000188827515},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.7271000146865845},{"id":"https://openalex.org/keywords/workflow","display_name":"Workflow","score":0.6984000205993652},{"id":"https://openalex.org/keywords/cloud-computing","display_name":"Cloud computing","score":0.673799991607666},{"id":"https://openalex.org/keywords/scheduling","display_name":"Scheduling (production processes)","score":0.5202999711036682},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.5022000074386597},{"id":"https://openalex.org/keywords/initialization","display_name":"Initialization","score":0.49790000915527344}],"concepts":[{"id":"https://openalex.org/C2778505942","wikidata":"https://www.wikidata.org/wiki/Q18344624","display_name":"Microservices","level":3,"score":0.9138000011444092},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.8902000188827515},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7738999724388123},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.7271000146865845},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.6984000205993652},{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.673799991607666},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.5202999711036682},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.5022000074386597},{"id":"https://openalex.org/C114466953","wikidata":"https://www.wikidata.org/wiki/Q6034165","display_name":"Initialization","level":2,"score":0.49790000915527344},{"id":"https://openalex.org/C138236772","wikidata":"https://www.wikidata.org/wiki/Q25098575","display_name":"Edge device","level":3,"score":0.46790000796318054},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.4661000072956085},{"id":"https://openalex.org/C9903902","wikidata":"https://www.wikidata.org/wiki/Q3025536","display_name":"DevOps","level":3,"score":0.4357999861240387},{"id":"https://openalex.org/C2780154230","wikidata":"https://www.wikidata.org/wiki/Q513420","display_name":"Undo","level":2,"score":0.3889999985694885},{"id":"https://openalex.org/C2778456923","wikidata":"https://www.wikidata.org/wiki/Q5337692","display_name":"Edge computing","level":3,"score":0.3822999894618988},{"id":"https://openalex.org/C2779227376","wikidata":"https://www.wikidata.org/wiki/Q6505497","display_name":"Layer (electronics)","level":2,"score":0.38040000200271606},{"id":"https://openalex.org/C162307627","wikidata":"https://www.wikidata.org/wiki/Q204833","display_name":"Enhanced Data Rates for GSM Evolution","level":2,"score":0.35670000314712524},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.3262999951839447},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.30149999260902405},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.2721000015735626},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.26989999413490295},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.26899999380111694},{"id":"https://openalex.org/C2780378061","wikidata":"https://www.wikidata.org/wiki/Q25351891","display_name":"Service (business)","level":2,"score":0.26809999346733093}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iwqos65803.2025.11143291","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iwqos65803.2025.11143291","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/ACM 33rd International Symposium on Quality of Service (IWQoS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":15,"referenced_works":["https://openalex.org/W2090244259","https://openalex.org/W2963505890","https://openalex.org/W3132671079","https://openalex.org/W3207744690","https://openalex.org/W4224308066","https://openalex.org/W4226135183","https://openalex.org/W4283206230","https://openalex.org/W4380906046","https://openalex.org/W4386243285","https://openalex.org/W4387561305","https://openalex.org/W4388561289","https://openalex.org/W4396605295","https://openalex.org/W4396620506","https://openalex.org/W4401508100","https://openalex.org/W4405079446"],"related_works":[],"abstract_inverted_index":{"Large":[0],"language":[1],"models":[2],"(LLMs)":[3],"have":[4],"emerged":[5],"as":[6,22,46],"a":[7,23,81],"transformative":[8],"advancement":[9],"in":[10,70,139,146,155],"artificial":[11],"intelligence":[12],"(AI).":[13],"To":[14],"fully":[15],"leverage":[16],"their":[17],"potential,":[18],"Docker":[19],"containers,":[20],"serving":[21],"lightweight,":[24],"portable,":[25],"and":[26,53,89,104,143],"isolated":[27],"framework,":[28],"facilitate":[29],"the":[30,37,110,157],"seamless":[31],"deployment":[32,38,64,98,162],"of":[33,39,159],"LLM-based":[34],"applications.":[35],"However,":[36],"containerized":[40,67],"AI":[41,68,160],"microservices":[42,69,161],"faces":[43],"challenges":[44],"such":[45],"heavy":[47],"network":[48],"loads,":[49],"delayed":[50],"image":[51],"loading,":[52],"redundancy.":[54],"In":[55],"this":[56],"paper,":[57],"we":[58],"introduce":[59],"MetaPipe,":[60],"an":[61],"innovative":[62],"incremental":[63],"approach":[65],"for":[66],"edge":[71,164],"cloud":[72,165],"environments.":[73,166],"MetaPipe":[74,131],"aims":[75],"to":[76],"optimize":[77],"startup":[78,141,148],"times":[79],"through":[80,100],"dynamic":[82],"workflow":[83],"that":[84,130],"incorporates":[85],"proactive":[86,94],"layer":[87,91,101,118],"pre-fetching":[88,95],"reinforcement":[90,111],"re-scheduling.":[92],"The":[93],"reduces":[96],"service":[97],"time":[99,142],"caching":[102],"prediction":[103],"pre-scheduling":[105],"before":[106],"requests":[107,122],"arrive,":[108],"while":[109],"re-scheduling":[112],"addresses":[113],"inaccuracies":[114],"by":[115],"dynamically":[116],"adjusting":[117],"scheduling":[119],"strategies":[120],"after":[121],"arrive.":[123],"Extensive":[124],"experiments":[125],"on":[126],"realworld":[127],"datasets":[128],"show":[129],"significantly":[132],"outperforms":[133],"traditional":[134],"methods,":[135],"achieving":[136],"83.58%":[137],"reduction":[138,145],"initialization":[140],"85.58%":[144],"cold":[147],"time.":[149],"These":[150],"results":[151],"highlight":[152],"its":[153],"effectiveness":[154],"enhancing":[156],"performance":[158],"within":[163]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-10T00:00:00"}
