{"id":"https://openalex.org/W3011134162","doi":"https://doi.org/10.1109/jiot.2020.2981338","title":"Joint DNN Partition Deployment and Resource Allocation for Delay-Sensitive Deep Learning Inference in IoT","display_name":"Joint DNN Partition Deployment and Resource Allocation for Delay-Sensitive Deep Learning Inference in IoT","publication_year":2020,"publication_date":"2020-03-17","ids":{"openalex":"https://openalex.org/W3011134162","doi":"https://doi.org/10.1109/jiot.2020.2981338","mag":"3011134162"},"language":"en","primary_location":{"id":"doi:10.1109/jiot.2020.2981338","is_oa":false,"landing_page_url":"https://doi.org/10.1109/jiot.2020.2981338","pdf_url":null,"source":{"id":"https://openalex.org/S2480266640","display_name":"IEEE Internet of Things Journal","issn_l":"2327-4662","issn":["2327-4662","2372-2541"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Internet of Things Journal","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5029341326","display_name":"Wenchen He","orcid":"https://orcid.org/0000-0001-8449-1561"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenchen He","raw_affiliation_strings":["State Key Laboratory of Networking and Switching Technology, Beijing University of Posts and Telecommunications, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-8449-1561","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Networking and Switching Technology, Beijing University of Posts and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047467022","display_name":"Shaoyong Guo","orcid":"https://orcid.org/0000-0003-2033-8431"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]},{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["CN","HK"],"is_corresponding":false,"raw_author_name":"Shaoyong Guo","raw_affiliation_strings":["Department of Computing and Research Institute for Sustainable Urban Development, Hong Kong Polytechnic University, Hong Kong","State Key Laboratory of Networking and Switching Technology, Beijing University of Posts and Telecommunications, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0003-2033-8431","affiliations":[{"raw_affiliation_string":"Department of Computing and Research Institute for Sustainable Urban Development, Hong Kong Polytechnic University, Hong Kong","institution_ids":["https://openalex.org/I14243506"]},{"raw_affiliation_string":"State Key Laboratory of Networking and Switching Technology, Beijing University of Posts and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043464306","display_name":"Song Guo","orcid":"https://orcid.org/0000-0001-9831-2202"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]},{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["CN","HK"],"is_corresponding":false,"raw_author_name":"Song Guo","raw_affiliation_strings":["Department of Computing and Research Institute for Sustainable Urban Development, Hong Kong Polytechnic University, Hong Kong","State Key Laboratory of Networking and Switching Technology, Beijing University of Posts and Telecommunications, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-9831-2202","affiliations":[{"raw_affiliation_string":"Department of Computing and Research Institute for Sustainable Urban Development, Hong Kong Polytechnic University, Hong Kong","institution_ids":["https://openalex.org/I14243506"]},{"raw_affiliation_string":"State Key Laboratory of Networking and Switching Technology, Beijing University of Posts and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042944721","display_name":"Xuesong Qiu","orcid":"https://orcid.org/0000-0002-7899-539X"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xuesong Qiu","raw_affiliation_strings":["State Key Laboratory of Networking and Switching Technology, Beijing University of Posts and Telecommunications, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-7899-539X","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Networking and Switching Technology, Beijing University of Posts and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5000744551","display_name":"Feng Qi","orcid":"https://orcid.org/0000-0003-2481-8774"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]},{"id":"https://openalex.org/I4210136793","display_name":"Peng Cheng Laboratory","ror":"https://ror.org/03qdqbt06","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210136793"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Feng Qi","raw_affiliation_strings":["Cyberspace Security Research Center, Peng Cheng Laboratory, Shenzhen, China","State Key Laboratory of Networking and Switching Technology, Beijing University of Posts and Telecommunications, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0003-2481-8774","affiliations":[{"raw_affiliation_string":"Cyberspace Security Research Center, Peng Cheng Laboratory, Shenzhen, China","institution_ids":["https://openalex.org/I4210136793"]},{"raw_affiliation_string":"State Key Laboratory of Networking and Switching Technology, Beijing University of Posts and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":12.6416,"has_fulltext":false,"cited_by_count":120,"citation_normalized_percentile":{"value":0.98907339,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":"7","issue":"10","first_page":"9241","last_page":"9254"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10273","display_name":"IoT and Edge/Fog Computing","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10273","display_name":"IoT and Edge/Fog Computing","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11458","display_name":"Advanced Wireless Communication Technologies","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12079","display_name":"IoT Networks and Protocols","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8398712873458862},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.4907625615596771},{"id":"https://openalex.org/keywords/markov-decision-process","display_name":"Markov decision process","score":0.48264843225479126},{"id":"https://openalex.org/keywords/partition","display_name":"Partition (number theory)","score":0.4730319678783417},{"id":"https://openalex.org/keywords/server","display_name":"Server","score":0.46506431698799133},{"id":"https://openalex.org/keywords/resource-allocation","display_name":"Resource allocation","score":0.43996188044548035},{"id":"https://openalex.org/keywords/mobile-edge-computing","display_name":"Mobile edge computing","score":0.428627610206604},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.4254530072212219},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.3658466637134552},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3521795868873596},{"id":"https://openalex.org/keywords/markov-process","display_name":"Markov process","score":0.25049394369125366},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.18897852301597595}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8398712873458862},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.4907625615596771},{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.48264843225479126},{"id":"https://openalex.org/C42812","wikidata":"https://www.wikidata.org/wiki/Q1082910","display_name":"Partition (number theory)","level":2,"score":0.4730319678783417},{"id":"https://openalex.org/C93996380","wikidata":"https://www.wikidata.org/wiki/Q44127","display_name":"Server","level":2,"score":0.46506431698799133},{"id":"https://openalex.org/C29202148","wikidata":"https://www.wikidata.org/wiki/Q287260","display_name":"Resource allocation","level":2,"score":0.43996188044548035},{"id":"https://openalex.org/C2776061582","wikidata":"https://www.wikidata.org/wiki/Q25325231","display_name":"Mobile edge computing","level":3,"score":0.428627610206604},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.4254530072212219},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.3658466637134552},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3521795868873596},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.25049394369125366},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.18897852301597595},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/jiot.2020.2981338","is_oa":false,"landing_page_url":"https://doi.org/10.1109/jiot.2020.2981338","pdf_url":null,"source":{"id":"https://openalex.org/S2480266640","display_name":"IEEE Internet of Things Journal","issn_l":"2327-4662","issn":["2327-4662","2372-2541"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Internet of Things Journal","raw_type":"journal-article"},{"id":"pmh:oai:repository.hkust.edu.hk:1783.1-130317","is_oa":false,"landing_page_url":"http://lbdiscover.ust.hk/uresolver?url_ver=Z39.88-2004&rft_val_fmt=info:ofi/fmt:kev:mtx:journal&rfr_id=info:sid/HKUST:SPI&rft.genre=article&rft.issn=2327-4662&rft.volume=7&rft.issue=10&rft.date=2020&rft.spage=9241&rft.aulast=He&rft.aufirst=Wenchen&rft.atitle=Joint+DNN+Partition+Deployment+and+Resource+Allocation+for+Delay-Sensitive+Deep+Learning+Inference+in+IoT&rft.title=IEEE+Internet+of+Things+Journal","pdf_url":null,"source":{"id":"https://openalex.org/S4306401796","display_name":"Rare & Special e-Zone (The Hong Kong University of Science and Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I200769079","host_organization_name":"Hong Kong University of Science and Technology","host_organization_lineage":["https://openalex.org/I200769079"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G7306596334","display_name":"\u9762\u5411\u6cdb\u5728\u672b\u68a2\u65f6\u53d8\u7f51\u7edc\u7684\u591a\u7ec8\u7aef\u534f\u540c\u673a\u5236","funder_award_id":"61702048","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":45,"referenced_works":["https://openalex.org/W2004447163","https://openalex.org/W2043694962","https://openalex.org/W2053491613","https://openalex.org/W2089050596","https://openalex.org/W2142246654","https://openalex.org/W2536587200","https://openalex.org/W2551185505","https://openalex.org/W2605258629","https://openalex.org/W2617931713","https://openalex.org/W2742405391","https://openalex.org/W2757994162","https://openalex.org/W2766731311","https://openalex.org/W2786070938","https://openalex.org/W2786652201","https://openalex.org/W2786839822","https://openalex.org/W2791136298","https://openalex.org/W2792846363","https://openalex.org/W2800182763","https://openalex.org/W2800992211","https://openalex.org/W2804985843","https://openalex.org/W2809251854","https://openalex.org/W2856725472","https://openalex.org/W2891123429","https://openalex.org/W2896180420","https://openalex.org/W2896915209","https://openalex.org/W2903874029","https://openalex.org/W2909267459","https://openalex.org/W2912654452","https://openalex.org/W2913454702","https://openalex.org/W2920031528","https://openalex.org/W2935788212","https://openalex.org/W2950865323","https://openalex.org/W2960833983","https://openalex.org/W2962804345","https://openalex.org/W2962883027","https://openalex.org/W2963821095","https://openalex.org/W2964015972","https://openalex.org/W2964050982","https://openalex.org/W2976382054","https://openalex.org/W2979679572","https://openalex.org/W2980856918","https://openalex.org/W3005801438","https://openalex.org/W3104248904","https://openalex.org/W4235435541","https://openalex.org/W6727151142"],"related_works":["https://openalex.org/W2092530219","https://openalex.org/W2388464034","https://openalex.org/W2533125852","https://openalex.org/W2140460949","https://openalex.org/W3139051647","https://openalex.org/W2902693277","https://openalex.org/W4378977105","https://openalex.org/W2796352555","https://openalex.org/W4318952366","https://openalex.org/W3214829569"],"abstract_inverted_index":{"Nowadays,":[0],"the":[1,36,44,50,73,90,104,124,135,159,164,184,188,196,205],"widely":[2],"used":[3],"Internet-of-Things":[4],"(IoT)":[5],"mobile":[6],"devices":[7],"(MDs)":[8],"generate":[9],"huge":[10],"volumes":[11],"of":[12,76,95,114],"data,":[13],"which":[14],"need":[15],"analyzing":[16],"and":[17,49,82,117,150,177,202],"extracting":[18],"accurate":[19],"information":[20],"in":[21,60,98,120,187],"real":[22],"time":[23],"by":[24,209],"compute-intensive":[25],"deep":[26,37],"learning":[27],"(DL)":[28],"inference":[29,93],"tasks.":[30],"Due":[31],"to":[32,56,88,163,182],"its":[33],"multilayer":[34],"structure,":[35],"neural":[38],"network":[39],"(DNN)":[40],"is":[41,126],"appropriate":[42],"for":[43,64],"mobile-edge":[45],"computing":[46,140],"(MEC)":[47],"environment,":[48],"DL":[51,77,96],"tasks":[52,78,97],"can":[53,203],"be":[54],"offloaded":[55],"DNN":[57,100,152],"partitions":[58],"deployed":[59],"MEC":[61],"servers":[62],"(MECSs)":[63],"speed-up":[65],"inference.":[66],"In":[67],"this":[68],"article,":[69],"we":[70,107,133,168],"first":[71],"assume":[72],"arrival":[74],"process":[75],"as":[79],"Poisson":[80],"distribution":[81],"develop":[83,108],"a":[84,109,127,139,151,170,178],"tandem":[85],"queueing":[86],"model":[87,113],"evaluate":[89],"end-to-end":[91],"(E2E)":[92],"delay":[94,208],"multiple":[99],"partitions.":[101],"To":[102],"minimize":[103],"E2E":[105,207],"delay,":[106],"joint":[110],"optimization":[111],"problem":[112,137,144,156],"partition":[115,147,153],"deployment":[116,148,154],"resource":[118,141],"allocation":[119,142],"MECSs":[121],"(JPDRA).":[122],"Since":[123],"JPDRA":[125],"mixed-integer":[128],"nonlinear":[129],"programming":[130],"(MINLP)":[131],"problem,":[132],"decompose":[134],"original":[136],"into":[138],"(CRA)":[143],"with":[145,211],"fixed":[146],"decision":[149],"(DPD)":[155],"that":[157,195],"optimizes":[158],"optimal-delay":[160],"function":[161],"related":[162],"CRA":[165,171],"problem.":[166],"Next,":[167],"design":[169],"algorithm":[172,181],"based":[173],"on":[174],"Markov":[175],"approximation":[176],"low-complexity":[179],"DPD":[180],"obtain":[183],"near-optimal":[185],"solution":[186],"polynomial":[189],"time.":[190],"The":[191],"simulation":[192],"results":[193],"demonstrate":[194],"proposed":[197],"algorithms":[198],"are":[199],"more":[200],"efficient":[201],"reduce":[204],"average":[206],"25.7%":[210],"better":[212],"convergence":[213],"performance.":[214]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":22},{"year":2024,"cited_by_count":18},{"year":2023,"cited_by_count":32},{"year":2022,"cited_by_count":25},{"year":2021,"cited_by_count":19},{"year":2020,"cited_by_count":2}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
