{"id":"https://openalex.org/W4412164080","doi":"https://doi.org/10.1109/tmc.2025.3586793","title":"Joint DNN Model Deployment, Selection, and Configuration for Heterogeneous Inference Services Toward Edge Intelligence","display_name":"Joint DNN Model Deployment, Selection, and Configuration for Heterogeneous Inference Services Toward Edge Intelligence","publication_year":2025,"publication_date":"2025-07-09","ids":{"openalex":"https://openalex.org/W4412164080","doi":"https://doi.org/10.1109/tmc.2025.3586793"},"language":"en","primary_location":{"id":"doi:10.1109/tmc.2025.3586793","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmc.2025.3586793","pdf_url":null,"source":{"id":"https://openalex.org/S69141925","display_name":"IEEE Transactions on Mobile Computing","issn_l":"1536-1233","issn":["1536-1233","1558-0660","2161-9875"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Mobile Computing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102703813","display_name":"Hebin Huang","orcid":null},"institutions":[{"id":"https://openalex.org/I150807315","display_name":"Guangxi University","ror":"https://ror.org/02c9qn167","country_code":"CN","type":"education","lineage":["https://openalex.org/I150807315"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Hebin Huang","raw_affiliation_strings":["School of Electrical Engineering, Guangxi Key Laboratory of Multimedia Communications and Network Technology, School of Computer and Electronic Information, Guangxi University, Nanning, China","School of Electrical Engineering and the Guangxi Key Laboratory of Multimedia Communications and Network Technology in the School of Computer and Electronic Information, Guangxi University, Nanning, China"],"affiliations":[{"raw_affiliation_string":"School of Electrical Engineering, Guangxi Key Laboratory of Multimedia Communications and Network Technology, School of Computer and Electronic Information, Guangxi University, Nanning, China","institution_ids":["https://openalex.org/I150807315"]},{"raw_affiliation_string":"School of Electrical Engineering and the Guangxi Key Laboratory of Multimedia Communications and Network Technology in the School of Computer and Electronic Information, Guangxi University, Nanning, China","institution_ids":["https://openalex.org/I150807315"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008728640","display_name":"Junbin Liang","orcid":"https://orcid.org/0000-0001-9328-4919"},"institutions":[{"id":"https://openalex.org/I150807315","display_name":"Guangxi University","ror":"https://ror.org/02c9qn167","country_code":"CN","type":"education","lineage":["https://openalex.org/I150807315"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Junbin Liang","raw_affiliation_strings":["School of Electrical Engineering, Guangxi Key Laboratory of Multimedia Communications and Network Technology, School of Computer and Electronic Information, Guangxi University, Nanning, China","School of Electrical Engineering and the Guangxi Key Laboratory of Multimedia Communications and Network Technology in the School of Computer and Electronic Information, Guangxi University, Nanning, China"],"affiliations":[{"raw_affiliation_string":"School of Electrical Engineering, Guangxi Key Laboratory of Multimedia Communications and Network Technology, School of Computer and Electronic Information, Guangxi University, Nanning, China","institution_ids":["https://openalex.org/I150807315"]},{"raw_affiliation_string":"School of Electrical Engineering and the Guangxi Key Laboratory of Multimedia Communications and Network Technology in the School of Computer and Electronic Information, Guangxi University, Nanning, China","institution_ids":["https://openalex.org/I150807315"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100770003","display_name":"Geyong Min","orcid":"https://orcid.org/0000-0003-1395-7314"},"institutions":[{"id":"https://openalex.org/I23923803","display_name":"University of Exeter","ror":"https://ror.org/03yghzc09","country_code":"GB","type":"education","lineage":["https://openalex.org/I23923803"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Geyong Min","raw_affiliation_strings":["Department of Computer Science, University of Exeter, Exeter, U.K"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Exeter, Exeter, U.K","institution_ids":["https://openalex.org/I23923803"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5102703813"],"corresponding_institution_ids":["https://openalex.org/I150807315"],"apc_list":null,"apc_paid":null,"fwci":2.3568,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.89978628,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"24","issue":"11","first_page":"12726","last_page":"12741"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13018","display_name":"Seismology and Earthquake Studies","score":0.7660999894142151,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13018","display_name":"Seismology and Earthquake Studies","score":0.7660999894142151,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13382","display_name":"Robotics and Automated Systems","score":0.7656000256538391,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12702","display_name":"Brain Tumor Detection and Classification","score":0.7138000130653381,"subfield":{"id":"https://openalex.org/subfields/2808","display_name":"Neurology"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8373531103134155},{"id":"https://openalex.org/keywords/software-deployment","display_name":"Software deployment","score":0.7343277931213379},{"id":"https://openalex.org/keywords/joint","display_name":"Joint (building)","score":0.7178356647491455},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.6376916170120239},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.6373099088668823},{"id":"https://openalex.org/keywords/enhanced-data-rates-for-gsm-evolution","display_name":"Enhanced Data Rates for GSM Evolution","score":0.5294774770736694},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.41398629546165466},{"id":"https://openalex.org/keywords/model-selection","display_name":"Model selection","score":0.4110180735588074},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.395395427942276},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.38909804821014404},{"id":"https://openalex.org/keywords/software-engineering","display_name":"Software engineering","score":0.13834479451179504},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.08166888356208801}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8373531103134155},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.7343277931213379},{"id":"https://openalex.org/C18555067","wikidata":"https://www.wikidata.org/wiki/Q8375051","display_name":"Joint (building)","level":2,"score":0.7178356647491455},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.6376916170120239},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.6373099088668823},{"id":"https://openalex.org/C162307627","wikidata":"https://www.wikidata.org/wiki/Q204833","display_name":"Enhanced Data Rates for GSM Evolution","level":2,"score":0.5294774770736694},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.41398629546165466},{"id":"https://openalex.org/C93959086","wikidata":"https://www.wikidata.org/wiki/Q6888345","display_name":"Model selection","level":2,"score":0.4110180735588074},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.395395427942276},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.38909804821014404},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.13834479451179504},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.08166888356208801},{"id":"https://openalex.org/C170154142","wikidata":"https://www.wikidata.org/wiki/Q150737","display_name":"Architectural engineering","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tmc.2025.3586793","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmc.2025.3586793","pdf_url":null,"source":{"id":"https://openalex.org/S69141925","display_name":"IEEE Transactions on Mobile Computing","issn_l":"1536-1233","issn":["1536-1233","1558-0660","2161-9875"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Mobile Computing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2335877755","display_name":null,"funder_award_id":"62362005","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5039842795","display_name":null,"funder_award_id":"AD25069071","funder_id":"https://openalex.org/F4320336589","funder_display_name":"Guangxi Key Research and Development Program"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320336589","display_name":"Guangxi Key Research and Development Program","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":36,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W1861492603","https://openalex.org/W2194775991","https://openalex.org/W2252355370","https://openalex.org/W2767101511","https://openalex.org/W2792220137","https://openalex.org/W2887117815","https://openalex.org/W2894413690","https://openalex.org/W2900394813","https://openalex.org/W2900629482","https://openalex.org/W2950865323","https://openalex.org/W2981657066","https://openalex.org/W3046577719","https://openalex.org/W3047392327","https://openalex.org/W3059280052","https://openalex.org/W3082653258","https://openalex.org/W3094502228","https://openalex.org/W3193397333","https://openalex.org/W4285108785","https://openalex.org/W4285197124","https://openalex.org/W4286377419","https://openalex.org/W4286904999","https://openalex.org/W4302931966","https://openalex.org/W4313068538","https://openalex.org/W4313229583","https://openalex.org/W4377710429","https://openalex.org/W4385575022","https://openalex.org/W4385819926","https://openalex.org/W4386634210","https://openalex.org/W4387544287","https://openalex.org/W4389610351","https://openalex.org/W4395028427","https://openalex.org/W4396604745","https://openalex.org/W4396886469","https://openalex.org/W4399801571","https://openalex.org/W4400487840"],"related_works":["https://openalex.org/W2770234245","https://openalex.org/W96612179","https://openalex.org/W4229499248","https://openalex.org/W2566006169","https://openalex.org/W1567818861","https://openalex.org/W2987774938","https://openalex.org/W4256492088","https://openalex.org/W632915154","https://openalex.org/W2055733372","https://openalex.org/W3022067003"],"abstract_inverted_index":{"Edge":[0],"intelligence":[1],"is":[2,97,103,154],"an":[3,146],"emerging":[4],"paradigm":[5],"in":[6],"edge":[7,17],"computing":[8],"that":[9,72,209],"deploys":[10],"Deep":[11],"Neural":[12],"Network":[13],"(DNN)":[14],"models":[15,62,81],"on":[16],"servers":[18],"with":[19,42],"limited":[20],"storage":[21],"and":[22,32,45,63,79,95,131,151,170,202],"computation":[23],"capacities":[24],"to":[25,107,122,191,197],"provide":[26,67],"inference":[27,70,84,91,135],"services":[28,71,85],"for":[29,133],"high":[30],"mobility":[31],"real-time":[33],"applications,":[34],"such":[35],"as":[36,145,162],"autonomous":[37],"driving":[38],"or":[39,54],"smart":[40],"surveillance,":[41],"varying":[43],"accuracy":[44],"delay":[46,96],"requirements.":[47,75],"Adapting":[48],"application":[49],"configurations":[50,78,201],"(e.g.,":[51],"image":[52],"resolution":[53],"video":[55],"frame":[56],"rate)":[57],"while":[58],"selecting":[59],"different":[60,193,198],"DNN":[61,80,128,203],"deployment":[64,132],"locations":[65],"can":[66],"high-accuracy,":[68],"low-delay":[69],"meet":[73],"user":[74],"However,":[76],"the":[77,109,125,160,210],"of":[82,200],"various":[83],"are":[86],"highly":[87],"heterogeneous.":[88],"As":[89],"balancing":[90],"accuracy,":[92],"resource":[93],"cost,":[94],"a":[98,104,118,163,175],"multi-objective":[99],"programming":[100,149],"problem,":[101],"it":[102,153,172],"great":[105],"challenge":[106],"obtain":[108],"optimal":[110],"solution.":[111],"To":[112],"address":[113],"this":[114,141],"challenge,":[115],"we":[116,138,157],"propose":[117],"novel":[119],"online":[120],"framework":[121],"jointly":[123],"optimize":[124],"configuration":[126],"adaption,":[127],"model":[129,159],"selection,":[130],"heterogeneous":[134],"services.":[136],"Specifically,":[137],"first":[139],"formulate":[140],"joint":[142],"optimization":[143],"problem":[144,150,161],"integer":[147],"linear":[148],"prove":[152],"NP-hard.":[155],"Then,":[156],"further":[158],"Partial":[164],"Observable":[165],"Markov":[166],"Decision":[167],"Process":[168],"(POMDP)":[169],"solve":[171],"by":[173],"developing":[174],"Heterogeneous-Agent":[176],"Reinforcement":[177],"Learning":[178],"(HARL)":[179],"based":[180],"algorithm,":[181],"named":[182],"Heterogeneous":[183],"Inference":[184],"Service":[185],"ProvidER":[186],"(HISPER).":[187],"It":[188],"allows":[189],"agents":[190],"have":[192],"action":[194],"spaces":[195],"corresponding":[196],"types":[199],"models.":[204],"Finally,":[205],"extensive":[206],"experiments":[207],"demonstrate":[208],"proposed":[211],"algorithm":[212],"outperforms":[213],"other":[214],"state-of-the-art":[215],"counterparts.":[216]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
