{"id":"https://openalex.org/W4289821779","doi":"https://doi.org/10.1109/tpds.2022.3195664","title":"HiTDL: High-Throughput Deep Learning Inference at the Hybrid Mobile Edge","display_name":"HiTDL: High-Throughput Deep Learning Inference at the Hybrid Mobile Edge","publication_year":2022,"publication_date":"2022-08-05","ids":{"openalex":"https://openalex.org/W4289821779","doi":"https://doi.org/10.1109/tpds.2022.3195664"},"language":"en","primary_location":{"id":"doi:10.1109/tpds.2022.3195664","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpds.2022.3195664","pdf_url":null,"source":{"id":"https://openalex.org/S97130795","display_name":"IEEE Transactions on Parallel and Distributed Systems","issn_l":"1045-9219","issn":["1045-9219","1558-2183","2161-9883"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Parallel and Distributed Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://research.vu.nl/en/publications/420758f3-e166-4c92-8d6d-1b8506cbd7bb","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5067494599","display_name":"Jing Wu","orcid":"https://orcid.org/0000-0003-2555-0220"},"institutions":[{"id":"https://openalex.org/I47720641","display_name":"Huazhong University of Science and Technology","ror":"https://ror.org/00p991c53","country_code":"CN","type":"education","lineage":["https://openalex.org/I47720641"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jing Wu","raw_affiliation_strings":["National Engineering Research Center for Big Data Technology and System, Services Computing Technology and System Lab, Cluster and Grid Computing Lab, School of Computer Science and Technology, Huazhong University of Science and Technology, Wuhan, China"],"affiliations":[{"raw_affiliation_string":"National Engineering Research Center for Big Data Technology and System, Services Computing Technology and System Lab, Cluster and Grid Computing Lab, School of Computer Science and Technology, Huazhong University of Science and Technology, Wuhan, China","institution_ids":["https://openalex.org/I47720641"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100403099","display_name":"Lin Wang","orcid":"https://orcid.org/0000-0001-7181-6128"},"institutions":[{"id":"https://openalex.org/I31512782","display_name":"Technische Universit\u00e4t Darmstadt","ror":"https://ror.org/05n911h24","country_code":"DE","type":"education","lineage":["https://openalex.org/I31512782"]},{"id":"https://openalex.org/I865915315","display_name":"Vrije Universiteit Amsterdam","ror":"https://ror.org/008xxew50","country_code":"NL","type":"education","lineage":["https://openalex.org/I865915315"]}],"countries":["DE","NL"],"is_corresponding":false,"raw_author_name":"Lin Wang","raw_affiliation_strings":["VU Amsterdam, Amsterdam, The Netherlands","TU Darmstadt, Darmstadt, Germany"],"affiliations":[{"raw_affiliation_string":"VU Amsterdam, Amsterdam, The Netherlands","institution_ids":["https://openalex.org/I865915315"]},{"raw_affiliation_string":"TU Darmstadt, Darmstadt, Germany","institution_ids":["https://openalex.org/I31512782"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006710277","display_name":"Qiangyu Pei","orcid":"https://orcid.org/0000-0001-8870-4309"},"institutions":[{"id":"https://openalex.org/I47720641","display_name":"Huazhong University of Science and Technology","ror":"https://ror.org/00p991c53","country_code":"CN","type":"education","lineage":["https://openalex.org/I47720641"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qiangyu Pei","raw_affiliation_strings":["National Engineering Research Center for Big Data Technology and System, Services Computing Technology and System Lab, Cluster and Grid Computing Lab, School of Computer Science and Technology, Huazhong University of Science and Technology, Wuhan, China"],"affiliations":[{"raw_affiliation_string":"National Engineering Research Center for Big Data Technology and System, Services Computing Technology and System Lab, Cluster and Grid Computing Lab, School of Computer Science and Technology, Huazhong University of Science and Technology, Wuhan, China","institution_ids":["https://openalex.org/I47720641"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049563917","display_name":"Xingqi Cui","orcid":null},"institutions":[{"id":"https://openalex.org/I47720641","display_name":"Huazhong University of Science and Technology","ror":"https://ror.org/00p991c53","country_code":"CN","type":"education","lineage":["https://openalex.org/I47720641"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xingqi Cui","raw_affiliation_strings":["National Engineering Research Center for Big Data Technology and System, Services Computing Technology and System Lab, Cluster and Grid Computing Lab, School of Computer Science and Technology, Huazhong University of Science and Technology, Wuhan, China"],"affiliations":[{"raw_affiliation_string":"National Engineering Research Center for Big Data Technology and System, Services Computing Technology and System Lab, Cluster and Grid Computing Lab, School of Computer Science and Technology, Huazhong University of Science and Technology, Wuhan, China","institution_ids":["https://openalex.org/I47720641"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048398271","display_name":"Fangming Liu","orcid":"https://orcid.org/0000-0002-8570-1345"},"institutions":[{"id":"https://openalex.org/I47720641","display_name":"Huazhong University of Science and Technology","ror":"https://ror.org/00p991c53","country_code":"CN","type":"education","lineage":["https://openalex.org/I47720641"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Fangming Liu","raw_affiliation_strings":["National Engineering Research Center for Big Data Technology and System, Services Computing Technology and System Lab, Cluster and Grid Computing Lab, School of Computer Science and Technology, Huazhong University of Science and Technology, Wuhan, China"],"affiliations":[{"raw_affiliation_string":"National Engineering Research Center for Big Data Technology and System, Services Computing Technology and System Lab, Cluster and Grid Computing Lab, School of Computer Science and Technology, Huazhong University of Science and Technology, Wuhan, China","institution_ids":["https://openalex.org/I47720641"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101931429","display_name":"Tingting Yang","orcid":null},"institutions":[{"id":"https://openalex.org/I4210136793","display_name":"Peng Cheng Laboratory","ror":"https://ror.org/03qdqbt06","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210136793"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tingting Yang","raw_affiliation_strings":["Peng Cheng Laboratory, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Peng Cheng Laboratory, Shenzhen, China","institution_ids":["https://openalex.org/I4210136793"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5067494599"],"corresponding_institution_ids":["https://openalex.org/I47720641"],"apc_list":null,"apc_paid":null,"fwci":5.3082,"has_fulltext":false,"cited_by_count":52,"citation_normalized_percentile":{"value":0.96855817,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":100},"biblio":{"volume":"33","issue":"12","first_page":"4499","last_page":"4514"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10273","display_name":"IoT and Edge/Fog Computing","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9929999709129333,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8424615859985352},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.6320668458938599},{"id":"https://openalex.org/keywords/provisioning","display_name":"Provisioning","score":0.5521256327629089},{"id":"https://openalex.org/keywords/throughput","display_name":"Throughput","score":0.5515918731689453},{"id":"https://openalex.org/keywords/latency","display_name":"Latency (audio)","score":0.5505063533782959},{"id":"https://openalex.org/keywords/partition","display_name":"Partition (number theory)","score":0.5442209243774414},{"id":"https://openalex.org/keywords/knapsack-problem","display_name":"Knapsack problem","score":0.5030414462089539},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.48413023352622986},{"id":"https://openalex.org/keywords/edge-device","display_name":"Edge device","score":0.4718344807624817},{"id":"https://openalex.org/keywords/server","display_name":"Server","score":0.4383507966995239},{"id":"https://openalex.org/keywords/mobile-edge-computing","display_name":"Mobile edge computing","score":0.4344486594200134},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.34574228525161743},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2446669042110443},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.15645194053649902},{"id":"https://openalex.org/keywords/wireless","display_name":"Wireless","score":0.1461581587791443},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.10728183388710022},{"id":"https://openalex.org/keywords/cloud-computing","display_name":"Cloud computing","score":0.0885530412197113}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8424615859985352},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.6320668458938599},{"id":"https://openalex.org/C172191483","wikidata":"https://www.wikidata.org/wiki/Q1071806","display_name":"Provisioning","level":2,"score":0.5521256327629089},{"id":"https://openalex.org/C157764524","wikidata":"https://www.wikidata.org/wiki/Q1383412","display_name":"Throughput","level":3,"score":0.5515918731689453},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.5505063533782959},{"id":"https://openalex.org/C42812","wikidata":"https://www.wikidata.org/wiki/Q1082910","display_name":"Partition (number theory)","level":2,"score":0.5442209243774414},{"id":"https://openalex.org/C113138325","wikidata":"https://www.wikidata.org/wiki/Q864457","display_name":"Knapsack problem","level":2,"score":0.5030414462089539},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.48413023352622986},{"id":"https://openalex.org/C138236772","wikidata":"https://www.wikidata.org/wiki/Q25098575","display_name":"Edge device","level":3,"score":0.4718344807624817},{"id":"https://openalex.org/C93996380","wikidata":"https://www.wikidata.org/wiki/Q44127","display_name":"Server","level":2,"score":0.4383507966995239},{"id":"https://openalex.org/C2776061582","wikidata":"https://www.wikidata.org/wiki/Q25325231","display_name":"Mobile edge computing","level":3,"score":0.4344486594200134},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.34574228525161743},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2446669042110443},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.15645194053649902},{"id":"https://openalex.org/C555944384","wikidata":"https://www.wikidata.org/wiki/Q249","display_name":"Wireless","level":2,"score":0.1461581587791443},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.10728183388710022},{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.0885530412197113},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1109/tpds.2022.3195664","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpds.2022.3195664","pdf_url":null,"source":{"id":"https://openalex.org/S97130795","display_name":"IEEE Transactions on Parallel and Distributed Systems","issn_l":"1045-9219","issn":["1045-9219","1558-2183","2161-9883"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Parallel and Distributed Systems","raw_type":"journal-article"},{"id":"pmh:oai:research.vu.nl:openaire/420758f3-e166-4c92-8d6d-1b8506cbd7bb","is_oa":true,"landing_page_url":"https://research.vu.nl/en/publications/420758f3-e166-4c92-8d6d-1b8506cbd7bb","pdf_url":null,"source":{"id":"https://openalex.org/S4306401107","display_name":"VU Research Portal","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I865915315","host_organization_name":"Vrije Universiteit Amsterdam","host_organization_lineage":["https://openalex.org/I865915315"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Wu, J, Wang, L, Pei, Q, Cui, X, Liu, F & Yang, T 2022, 'HiTDL : High-Throughput Deep Learning Inference at the Hybrid Mobile Edge', IEEE Transactions on Parallel and Distributed Systems, vol. 33, no. 12, pp. 4499-4514. https://doi.org/10.1109/TPDS.2022.3195664","raw_type":"info:eu-repo/semantics/publishedVersion"},{"id":"pmh:oai:research.vu.nl:openaire_cris_publications/420758f3-e166-4c92-8d6d-1b8506cbd7bb","is_oa":true,"landing_page_url":"https://hdl.handle.net/1871.1/420758f3-e166-4c92-8d6d-1b8506cbd7bb","pdf_url":null,"source":{"id":"https://openalex.org/S4306401107","display_name":"VU Research Portal","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I865915315","host_organization_name":"Vrije Universiteit Amsterdam","host_organization_lineage":["https://openalex.org/I865915315"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Wu, J, Wang, L, Pei, Q, Cui, X, Liu, F & Yang, T 2022, 'HiTDL : High-Throughput Deep Learning Inference at the Hybrid Mobile Edge', IEEE Transactions on Parallel and Distributed Systems, vol. 33, no. 12, pp. 4499-4514. https://doi.org/10.1109/TPDS.2022.3195664","raw_type":"info:eu-repo/semantics/publishedVersion"},{"id":"pmh:oai:research.vu.nl:publications/420758f3-e166-4c92-8d6d-1b8506cbd7bb","is_oa":true,"landing_page_url":"http://www.scopus.com/inward/record.url?scp=85135735546&partnerID=8YFLogxK","pdf_url":null,"source":{"id":"https://openalex.org/S4306401107","display_name":"VU Research Portal","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I865915315","host_organization_name":"Vrije Universiteit Amsterdam","host_organization_lineage":["https://openalex.org/I865915315"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Wu, J, Wang, L, Pei, Q, Cui, X, Liu, F & Yang, T 2022, 'HiTDL : High-Throughput Deep Learning Inference at the Hybrid Mobile Edge', IEEE Transactions on Parallel and Distributed Systems, vol. 33, no. 12, pp. 4499-4514. https://doi.org/10.1109/TPDS.2022.3195664","raw_type":"info:eu-repo/semantics/publishedVersion"}],"best_oa_location":{"id":"pmh:oai:research.vu.nl:openaire/420758f3-e166-4c92-8d6d-1b8506cbd7bb","is_oa":true,"landing_page_url":"https://research.vu.nl/en/publications/420758f3-e166-4c92-8d6d-1b8506cbd7bb","pdf_url":null,"source":{"id":"https://openalex.org/S4306401107","display_name":"VU Research Portal","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I865915315","host_organization_name":"Vrije Universiteit Amsterdam","host_organization_lineage":["https://openalex.org/I865915315"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Wu, J, Wang, L, Pei, Q, Cui, X, Liu, F & Yang, T 2022, 'HiTDL : High-Throughput Deep Learning Inference at the Hybrid Mobile Edge', IEEE Transactions on Parallel and Distributed Systems, vol. 33, no. 12, pp. 4499-4514. https://doi.org/10.1109/TPDS.2022.3195664","raw_type":"info:eu-repo/semantics/publishedVersion"},"sustainable_development_goals":[{"score":0.6200000047683716,"display_name":"Decent work and economic growth","id":"https://metadata.un.org/sdg/8"}],"awards":[{"id":"https://openalex.org/G1723849911","display_name":null,"funder_award_id":"1053 MAKI","funder_id":"https://openalex.org/F4320320879","funder_display_name":"Deutsche Forschungsgemeinschaft"},{"id":"https://openalex.org/G7434893301","display_name":null,"funder_award_id":"61520106005","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G75260446","display_name":null,"funder_award_id":"61761136014","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320320879","display_name":"Deutsche Forschungsgemeinschaft","ror":"https://ror.org/018mejw64"},{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":68,"referenced_works":["https://openalex.org/W1486643454","https://openalex.org/W1608877958","https://openalex.org/W2062761494","https://openalex.org/W2163605009","https://openalex.org/W2183341477","https://openalex.org/W2194775991","https://openalex.org/W2302255633","https://openalex.org/W2605258629","https://openalex.org/W2625567284","https://openalex.org/W2736071714","https://openalex.org/W2773258530","https://openalex.org/W2789383786","https://openalex.org/W2872933037","https://openalex.org/W2883830791","https://openalex.org/W2885829265","https://openalex.org/W2892365986","https://openalex.org/W2896985569","https://openalex.org/W2897460799","https://openalex.org/W2906007643","https://openalex.org/W2917087921","https://openalex.org/W2920031528","https://openalex.org/W2921965200","https://openalex.org/W2928897890","https://openalex.org/W2955425717","https://openalex.org/W2955888259","https://openalex.org/W2956461999","https://openalex.org/W2962677625","https://openalex.org/W2962883027","https://openalex.org/W2963149401","https://openalex.org/W2964108773","https://openalex.org/W2964350391","https://openalex.org/W2965289829","https://openalex.org/W2969388332","https://openalex.org/W2981114133","https://openalex.org/W2983440318","https://openalex.org/W2986646794","https://openalex.org/W2989368243","https://openalex.org/W2991040477","https://openalex.org/W2996942942","https://openalex.org/W3008356843","https://openalex.org/W3015584167","https://openalex.org/W3017194848","https://openalex.org/W3030408490","https://openalex.org/W3041735433","https://openalex.org/W3049640275","https://openalex.org/W3095488153","https://openalex.org/W3097411828","https://openalex.org/W3101104221","https://openalex.org/W3102767875","https://openalex.org/W3121702752","https://openalex.org/W3130378779","https://openalex.org/W3172857592","https://openalex.org/W4297775537","https://openalex.org/W4385245566","https://openalex.org/W6684191040","https://openalex.org/W6686164453","https://openalex.org/W6730956707","https://openalex.org/W6737664043","https://openalex.org/W6739901393","https://openalex.org/W6746361056","https://openalex.org/W6748019619","https://openalex.org/W6753991380","https://openalex.org/W6754743415","https://openalex.org/W6756718674","https://openalex.org/W6760696709","https://openalex.org/W6762718338","https://openalex.org/W6765484274","https://openalex.org/W6778330239"],"related_works":["https://openalex.org/W241127407","https://openalex.org/W2381035939","https://openalex.org/W2468477307","https://openalex.org/W2910645127","https://openalex.org/W162895179","https://openalex.org/W1521824362","https://openalex.org/W2168163332","https://openalex.org/W3139051647","https://openalex.org/W2902693277","https://openalex.org/W4378977105"],"abstract_inverted_index":{"Deep":[0],"neural":[1],"networks":[2],"(DNNs)":[3],"have":[4],"become":[5],"a":[6,36,100,173,206,215],"critical":[7],"component":[8],"for":[9,84,103,146,182,201],"inference":[10,31,148],"in":[11,71],"modern":[12],"mobile":[13,62],"applications,":[14],"but":[15],"the":[16,30,41,44,48,56,61,64,68,72,109,113,125,198,222,226,233],"efficient":[17],"provisioning":[18],"of":[19,43,128,175,225],"DNNs":[20,106],"is":[21,81,117],"non-trivial.":[22],"Existing":[23],"mobile-":[24],"and":[25,54,63,150,163],"server-based":[26],"approaches":[27],"compromise":[28],"either":[29],"accuracy":[32],"or":[33],"latency.":[34],"Instead,":[35],"hybrid":[37,73,110],"approach":[38,74,111],"can":[39],"reap":[40],"benefits":[42],"two":[45,57],"by":[46,123,193,228],"splitting":[47],"DNN":[49,69,147,160,203],"at":[50,112],"an":[51],"appropriate":[52],"layer":[53],"running":[55],"parts":[58],"separately":[59],"on":[60,214],"server":[65],"respectively.":[66],"Nevertheless,":[67],"throughput":[70,127,224],"has":[75],"not":[76],"been":[77],"carefully":[78],"examined,":[79],"which":[80],"particularly":[82],"important":[83],"edge":[85,120,227],"servers":[86],"where":[87],"limited":[88],"compute":[89],"resources":[90],"are":[91],"shared":[92],"among":[93],"multiple":[94,105,155],"DNNs.":[95],"This":[96],"article":[97],"presents":[98],"HiTDL,":[99],"runtime":[101],"framework":[102],"managing":[104],"provisioned":[107],"following":[108],"edge.":[114],"HiTDL's":[115],"mission":[116],"to":[118,154,171],"improve":[119],"resource":[121,158,190],"efficiency":[122],"optimizing":[124],"combined":[126],"all":[129],"co-located":[130],"DNNs,":[131],"while":[132],"still":[133],"guaranteeing":[134],"their":[135],"SLAs.":[136],"To":[137],"this":[138],"end,":[139],"HiTDL":[140,166,186,220],"first":[141],"builds":[142],"comprehensive":[143],"performance":[144],"models":[145,170],"latency":[149],"throughout":[151],"with":[152,179,232],"respect":[153],"factors":[156],"including":[157],"availability,":[159],"partition":[161,177,195],"plan,":[162],"cross-DNN":[164],"interference.":[165],"then":[167],"uses":[168],"these":[169],"generate":[172],"set":[174,200],"candidate":[176,199],"plans":[178,196],"SLA":[180],"guarantees":[181],"each":[183,202],"DNN.":[184],"Finally,":[185],"makes":[187],"global":[188],"throughput-optimal":[189],"allocation":[191],"decisions":[192],"selecting":[194],"from":[197],"via":[204],"solving":[205],"fairness-aware":[207],"multiple-choice":[208],"knapsack":[209],"problem.":[210],"Experimental":[211],"results":[212],"based":[213],"prototype":[216],"implementation":[217],"show":[218],"that":[219],"improves":[221],"overall":[223],"<inline-formula><tex-math":[229],"notation=\"LaTeX\">$4.3\\times$</tex-math></inline-formula>":[230],"compared":[231],"state-of-the-art.":[234]},"counts_by_year":[{"year":2025,"cited_by_count":15},{"year":2024,"cited_by_count":26},{"year":2023,"cited_by_count":10},{"year":2022,"cited_by_count":1}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
