{"id":"https://openalex.org/W7124890111","doi":"https://doi.org/10.1109/cloudcom67567.2025.11331487","title":"Energy Efficient and QoS-Aware Model Selection for DNN Inference in Edge Intelligence","display_name":"Energy Efficient and QoS-Aware Model Selection for DNN Inference in Edge Intelligence","publication_year":2025,"publication_date":"2025-11-14","ids":{"openalex":"https://openalex.org/W7124890111","doi":"https://doi.org/10.1109/cloudcom67567.2025.11331487"},"language":null,"primary_location":{"id":"doi:10.1109/cloudcom67567.2025.11331487","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cloudcom67567.2025.11331487","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 lEEE International Conference on Cloud Computing Technology and Science (CloudCom)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5087479170","display_name":"Hajar Siar","orcid":"https://orcid.org/0000-0001-7775-6904"},"institutions":[{"id":"https://openalex.org/I90267481","display_name":"Ume\u00e5 University","ror":"https://ror.org/05kb8h459","country_code":"SE","type":"education","lineage":["https://openalex.org/I90267481"]}],"countries":["SE"],"is_corresponding":true,"raw_author_name":"Hajar Siar","raw_affiliation_strings":["Ume&#x00E5; University,Department of Computing Science,Ume&#x00E5;,Sweden"],"affiliations":[{"raw_affiliation_string":"Ume&#x00E5; University,Department of Computing Science,Ume&#x00E5;,Sweden","institution_ids":["https://openalex.org/I90267481"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5121184752","display_name":"Erik Elmroth","orcid":null},"institutions":[{"id":"https://openalex.org/I90267481","display_name":"Ume\u00e5 University","ror":"https://ror.org/05kb8h459","country_code":"SE","type":"education","lineage":["https://openalex.org/I90267481"]}],"countries":["SE"],"is_corresponding":false,"raw_author_name":"Erik Elmroth","raw_affiliation_strings":["Ume&#x00E5; University,Department of Computing Science,Ume&#x00E5;,Sweden"],"affiliations":[{"raw_affiliation_string":"Ume&#x00E5; University,Department of Computing Science,Ume&#x00E5;,Sweden","institution_ids":["https://openalex.org/I90267481"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5087479170"],"corresponding_institution_ids":["https://openalex.org/I90267481"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.68683234,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10273","display_name":"IoT and Edge/Fog Computing","score":0.8162000179290771,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10273","display_name":"IoT and Edge/Fog Computing","score":0.8162000179290771,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13553","display_name":"Age of Information Optimization","score":0.03240000084042549,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14347","display_name":"Big Data and Digital Economy","score":0.030799999833106995,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.6944000124931335},{"id":"https://openalex.org/keywords/enhanced-data-rates-for-gsm-evolution","display_name":"Enhanced Data Rates for GSM Evolution","score":0.633899986743927},{"id":"https://openalex.org/keywords/efficient-energy-use","display_name":"Efficient energy use","score":0.6050999760627747},{"id":"https://openalex.org/keywords/server","display_name":"Server","score":0.5856999754905701},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.5838000178337097},{"id":"https://openalex.org/keywords/provisioning","display_name":"Provisioning","score":0.5286999940872192},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4959000051021576},{"id":"https://openalex.org/keywords/quality-of-service","display_name":"Quality of service","score":0.4490000009536743},{"id":"https://openalex.org/keywords/edge-device","display_name":"Edge device","score":0.430400013923645}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7473000288009644},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.6944000124931335},{"id":"https://openalex.org/C162307627","wikidata":"https://www.wikidata.org/wiki/Q204833","display_name":"Enhanced Data Rates for GSM Evolution","level":2,"score":0.633899986743927},{"id":"https://openalex.org/C2742236","wikidata":"https://www.wikidata.org/wiki/Q924713","display_name":"Efficient energy use","level":2,"score":0.6050999760627747},{"id":"https://openalex.org/C93996380","wikidata":"https://www.wikidata.org/wiki/Q44127","display_name":"Server","level":2,"score":0.5856999754905701},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.5838000178337097},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5740000009536743},{"id":"https://openalex.org/C172191483","wikidata":"https://www.wikidata.org/wiki/Q1071806","display_name":"Provisioning","level":2,"score":0.5286999940872192},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4959000051021576},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4724999964237213},{"id":"https://openalex.org/C5119721","wikidata":"https://www.wikidata.org/wiki/Q220501","display_name":"Quality of service","level":2,"score":0.4490000009536743},{"id":"https://openalex.org/C138236772","wikidata":"https://www.wikidata.org/wiki/Q25098575","display_name":"Edge device","level":3,"score":0.430400013923645},{"id":"https://openalex.org/C186370098","wikidata":"https://www.wikidata.org/wiki/Q442787","display_name":"Energy (signal processing)","level":2,"score":0.3682999908924103},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.3582000136375427},{"id":"https://openalex.org/C93959086","wikidata":"https://www.wikidata.org/wiki/Q6888345","display_name":"Model selection","level":2,"score":0.34040001034736633},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3336000144481659},{"id":"https://openalex.org/C2778456923","wikidata":"https://www.wikidata.org/wiki/Q5337692","display_name":"Edge computing","level":3,"score":0.3086000084877014},{"id":"https://openalex.org/C114289077","wikidata":"https://www.wikidata.org/wiki/Q3284399","display_name":"Statistical model","level":2,"score":0.2989000082015991},{"id":"https://openalex.org/C2781249084","wikidata":"https://www.wikidata.org/wiki/Q908656","display_name":"Preference","level":2,"score":0.2921999990940094},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.2858999967575073},{"id":"https://openalex.org/C8880873","wikidata":"https://www.wikidata.org/wiki/Q187787","display_name":"Genetic algorithm","level":2,"score":0.2831000089645386},{"id":"https://openalex.org/C18555067","wikidata":"https://www.wikidata.org/wiki/Q8375051","display_name":"Joint (building)","level":2,"score":0.2809000015258789},{"id":"https://openalex.org/C2780378061","wikidata":"https://www.wikidata.org/wiki/Q25351891","display_name":"Service (business)","level":2,"score":0.2782000005245209},{"id":"https://openalex.org/C134261354","wikidata":"https://www.wikidata.org/wiki/Q938438","display_name":"Statistical inference","level":2,"score":0.27790001034736633},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.2775000035762787},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.27059999108314514},{"id":"https://openalex.org/C137836250","wikidata":"https://www.wikidata.org/wiki/Q984063","display_name":"Optimization problem","level":2,"score":0.2676999866962433},{"id":"https://openalex.org/C2777472644","wikidata":"https://www.wikidata.org/wiki/Q16968992","display_name":"Approximate inference","level":3,"score":0.2644999921321869},{"id":"https://openalex.org/C139502532","wikidata":"https://www.wikidata.org/wiki/Q1122090","display_name":"Computational intelligence","level":2,"score":0.26350000500679016},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.2583000063896179}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cloudcom67567.2025.11331487","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cloudcom67567.2025.11331487","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 lEEE International Conference on Cloud Computing Technology and Science (CloudCom)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/7","display_name":"Affordable and clean energy","score":0.9058822393417358}],"awards":[],"funders":[{"id":"https://openalex.org/F4320324135","display_name":"Kempestiftelserna","ror":"https://ror.org/05cszw148"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":18,"referenced_works":["https://openalex.org/W2962814013","https://openalex.org/W2963122961","https://openalex.org/W3004633656","https://openalex.org/W3088405768","https://openalex.org/W3105381414","https://openalex.org/W3210635777","https://openalex.org/W3214897310","https://openalex.org/W4285197124","https://openalex.org/W4312910656","https://openalex.org/W4322153971","https://openalex.org/W4368353274","https://openalex.org/W4387544287","https://openalex.org/W4389098960","https://openalex.org/W4399808146","https://openalex.org/W4402916288","https://openalex.org/W4405129828","https://openalex.org/W4407247167","https://openalex.org/W4413146688"],"related_works":[],"abstract_inverted_index":{"Edge":[0],"intelligence":[1],"is":[2,133],"about":[3],"enabling":[4],"deep":[5],"learning":[6],"applications":[7],"to":[8,120,142],"run":[9],"on":[10,39,69,96],"edge":[11,34,118],"platforms,":[12],"often":[13],"under":[14,135],"strict":[15],"Quality":[16],"of":[17,33,48,62,78,106,110,117,151,166],"Service":[18],"(QoS)":[19],"constraints":[20],"(e.g.,":[21],"deadlines":[22],"and":[23,27,30,93,144,163,171],"accuracy).":[24],"The":[25,130],"heterogeneity":[26],"limited":[28],"computational":[29],"energy":[31,79,123],"capacities":[32],"servers":[35,119],"necessitate":[36],"further":[37],"study":[38],"energy-efficient":[40],"Deep":[41],"Neural":[42],"Network":[43],"(DNN)":[44],"inference.":[45],"While":[46],"availability":[47],"DNN":[49,73],"model":[50,70,90,112],"variants":[51],"enables":[52],"adaptive":[53],"selection":[54,71],"without":[55],"compromising":[56],"accuracy,":[57],"it":[58],"increases":[59],"the":[60,63,104,148,164,175],"complexity":[61],"solution":[64],"space.":[65],"Also,":[66],"existing":[67],"research":[68],"for":[72,88],"inference":[74,128],"lacks":[75],"efficient":[76],"estimation":[77],"consumption.":[80],"This":[81],"paper":[82],"proposes":[83],"a":[84],"polynomial-time":[85],"joint":[86],"strategy":[87,132],"QoS-aware":[89],"instance":[91],"provisioning":[92],"selection,":[94],"based":[95],"many-to-many":[97],"stable":[98],"matching.":[99],"Our":[100],"novel":[101],"formulation":[102],"uses":[103],"number":[105],"floating-point":[107],"operations":[108],"(FLOPs)":[109],"each":[111],"along":[113],"with":[114],"hardware-level":[115],"characteristics":[116],"minimize":[121],"total":[122],"usage":[124],"while":[125],"maximizing":[126],"successful":[127],"completions.":[129],"proposed":[131],"evaluated":[134],"different":[136],"preference":[137],"functions.":[138],"Experimental":[139],"results,":[140],"compared":[141],"optimal":[143],"evolutionary":[145],"algorithms,":[146],"demonstrate":[147],"runtime":[149],"efficiency":[150],"our":[152],"strategy.":[153],"Furthermore,":[154],"extensive":[155],"evaluations":[156],"against":[157],"baselines":[158],"highlights":[159],"its":[160],"superior":[161],"performance":[162],"importance":[165],"jointly":[167],"considering":[168],"both":[169],"system-":[170],"application-level":[172],"parameters":[173],"in":[174],"solution.":[176]},"counts_by_year":[],"updated_date":"2026-04-21T08:09:41.155169","created_date":"2026-01-21T00:00:00"}
