{"id":"https://openalex.org/W3186289964","doi":"https://doi.org/10.1145/3460352","title":"SLO-Aware Inference Scheduler for Heterogeneous Processors in Edge Platforms","display_name":"SLO-Aware Inference Scheduler for Heterogeneous Processors in Edge Platforms","publication_year":2021,"publication_date":"2021-07-17","ids":{"openalex":"https://openalex.org/W3186289964","doi":"https://doi.org/10.1145/3460352","mag":"3186289964"},"language":"en","primary_location":{"id":"doi:10.1145/3460352","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3460352","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3460352","source":{"id":"https://openalex.org/S26056741","display_name":"ACM Transactions on Architecture and Code Optimization","issn_l":"1544-3566","issn":["1544-3566","1544-3973"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Architecture and Code Optimization","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3460352","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5034451791","display_name":"Wonik Seo","orcid":null},"institutions":[{"id":"https://openalex.org/I157485424","display_name":"Korea Advanced Institute of Science and Technology","ror":"https://ror.org/05apxxy63","country_code":"KR","type":"education","lineage":["https://openalex.org/I157485424"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Wonik Seo","raw_affiliation_strings":["KAIST, Republic of Korea"],"affiliations":[{"raw_affiliation_string":"KAIST, Republic of Korea","institution_ids":["https://openalex.org/I157485424"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017067532","display_name":"Sang-Hoon Cha","orcid":"https://orcid.org/0000-0002-7231-8291"},"institutions":[{"id":"https://openalex.org/I2250650973","display_name":"Samsung (South Korea)","ror":"https://ror.org/04w3jy968","country_code":"KR","type":"company","lineage":["https://openalex.org/I2250650973"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Sanghoon Cha","raw_affiliation_strings":["Samsung Advanced Institute of Technology, Republic of Korea"],"affiliations":[{"raw_affiliation_string":"Samsung Advanced Institute of Technology, Republic of Korea","institution_ids":["https://openalex.org/I2250650973"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006429670","display_name":"Yeonjae Kim","orcid":"https://orcid.org/0000-0003-4144-9077"},"institutions":[{"id":"https://openalex.org/I157485424","display_name":"Korea Advanced Institute of Science and Technology","ror":"https://ror.org/05apxxy63","country_code":"KR","type":"education","lineage":["https://openalex.org/I157485424"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Yeonjae Kim","raw_affiliation_strings":["KAIST, Republic of Korea"],"affiliations":[{"raw_affiliation_string":"KAIST, Republic of Korea","institution_ids":["https://openalex.org/I157485424"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047149607","display_name":"Jaehyuk Huh","orcid":"https://orcid.org/0000-0002-1742-047X"},"institutions":[{"id":"https://openalex.org/I157485424","display_name":"Korea Advanced Institute of Science and Technology","ror":"https://ror.org/05apxxy63","country_code":"KR","type":"education","lineage":["https://openalex.org/I157485424"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Jaehyuk Huh","raw_affiliation_strings":["KAIST, Republic of Korea"],"affiliations":[{"raw_affiliation_string":"KAIST, Republic of Korea","institution_ids":["https://openalex.org/I157485424"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5037553165","display_name":"Jongse Park","orcid":"https://orcid.org/0000-0002-6629-449X"},"institutions":[{"id":"https://openalex.org/I157485424","display_name":"Korea Advanced Institute of Science and Technology","ror":"https://ror.org/05apxxy63","country_code":"KR","type":"education","lineage":["https://openalex.org/I157485424"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Jongse Park","raw_affiliation_strings":["KAIST, Republic of Korea"],"affiliations":[{"raw_affiliation_string":"KAIST, Republic of Korea","institution_ids":["https://openalex.org/I157485424"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5034451791"],"corresponding_institution_ids":["https://openalex.org/I157485424"],"apc_list":null,"apc_paid":null,"fwci":4.6428,"has_fulltext":true,"cited_by_count":48,"citation_normalized_percentile":{"value":0.94860982,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":"18","issue":"4","first_page":"1","last_page":"26"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10273","display_name":"IoT and Edge/Fog Computing","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10273","display_name":"IoT and Edge/Fog Computing","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13553","display_name":"Age of Information Optimization","score":0.9955000281333923,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.875079870223999},{"id":"https://openalex.org/keywords/scheduling","display_name":"Scheduling (production processes)","score":0.6225108504295349},{"id":"https://openalex.org/keywords/edge-computing","display_name":"Edge computing","score":0.6153185963630676},{"id":"https://openalex.org/keywords/server","display_name":"Server","score":0.5833348035812378},{"id":"https://openalex.org/keywords/edge-device","display_name":"Edge device","score":0.569591760635376},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.5577173233032227},{"id":"https://openalex.org/keywords/preemption","display_name":"Preemption","score":0.5040990114212036},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.49547016620635986},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.49197718501091003},{"id":"https://openalex.org/keywords/computation-offloading","display_name":"Computation offloading","score":0.47047239542007446},{"id":"https://openalex.org/keywords/symmetric-multiprocessor-system","display_name":"Symmetric multiprocessor system","score":0.4402575194835663},{"id":"https://openalex.org/keywords/data-center","display_name":"Data center","score":0.4341070353984833},{"id":"https://openalex.org/keywords/digital-signal-processing","display_name":"Digital signal processing","score":0.4222617447376251},{"id":"https://openalex.org/keywords/enhanced-data-rates-for-gsm-evolution","display_name":"Enhanced Data Rates for GSM Evolution","score":0.29692935943603516},{"id":"https://openalex.org/keywords/cloud-computing","display_name":"Cloud computing","score":0.28221434354782104},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.22809401154518127},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.17062872648239136},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.14749675989151},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.10556396842002869},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.09876120090484619}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.875079870223999},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.6225108504295349},{"id":"https://openalex.org/C2778456923","wikidata":"https://www.wikidata.org/wiki/Q5337692","display_name":"Edge computing","level":3,"score":0.6153185963630676},{"id":"https://openalex.org/C93996380","wikidata":"https://www.wikidata.org/wiki/Q44127","display_name":"Server","level":2,"score":0.5833348035812378},{"id":"https://openalex.org/C138236772","wikidata":"https://www.wikidata.org/wiki/Q25098575","display_name":"Edge device","level":3,"score":0.569591760635376},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.5577173233032227},{"id":"https://openalex.org/C206952183","wikidata":"https://www.wikidata.org/wiki/Q1193100","display_name":"Preemption","level":2,"score":0.5040990114212036},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.49547016620635986},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.49197718501091003},{"id":"https://openalex.org/C2781041963","wikidata":"https://www.wikidata.org/wiki/Q18348618","display_name":"Computation offloading","level":4,"score":0.47047239542007446},{"id":"https://openalex.org/C172430144","wikidata":"https://www.wikidata.org/wiki/Q17111997","display_name":"Symmetric multiprocessor system","level":2,"score":0.4402575194835663},{"id":"https://openalex.org/C153740404","wikidata":"https://www.wikidata.org/wiki/Q671224","display_name":"Data center","level":2,"score":0.4341070353984833},{"id":"https://openalex.org/C84462506","wikidata":"https://www.wikidata.org/wiki/Q173142","display_name":"Digital signal processing","level":2,"score":0.4222617447376251},{"id":"https://openalex.org/C162307627","wikidata":"https://www.wikidata.org/wiki/Q204833","display_name":"Enhanced Data Rates for GSM Evolution","level":2,"score":0.29692935943603516},{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.28221434354782104},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.22809401154518127},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.17062872648239136},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.14749675989151},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.10556396842002869},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.09876120090484619},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3460352","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3460352","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3460352","source":{"id":"https://openalex.org/S26056741","display_name":"ACM Transactions on Architecture and Code Optimization","issn_l":"1544-3566","issn":["1544-3566","1544-3973"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Architecture and Code Optimization","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1145/3460352","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3460352","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3460352","source":{"id":"https://openalex.org/S26056741","display_name":"ACM Transactions on Architecture and Code Optimization","issn_l":"1544-3566","issn":["1544-3566","1544-3973"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Architecture and Code Optimization","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.9200000166893005,"display_name":"Affordable and clean energy","id":"https://metadata.un.org/sdg/7"}],"awards":[{"id":"https://openalex.org/G12967831","display_name":null,"funder_award_id":"IITP2017-0-00466","funder_id":"https://openalex.org/F4320335489","funder_display_name":"Institute for Information and Communications Technology Promotion"},{"id":"https://openalex.org/G1739134435","display_name":null,"funder_award_id":"IITP-","funder_id":"https://openalex.org/F4320324891","funder_display_name":"Iran Telecommunication Research Center"},{"id":"https://openalex.org/G2530816367","display_name":null,"funder_award_id":"2017-0-00466","funder_id":"https://openalex.org/F4320335489","funder_display_name":"Institute for Information and Communications Technology Promotion"},{"id":"https://openalex.org/G7021487728","display_name":null,"funder_award_id":"NRF-2020R1A2C1103088","funder_id":"https://openalex.org/F4320322120","funder_display_name":"National Research Foundation of Korea"},{"id":"https://openalex.org/G8945926587","display_name":null,"funder_award_id":"IITP-2021-2020-0-01795","funder_id":"https://openalex.org/F4320335489","funder_display_name":"Institute for Information and Communications Technology Promotion"},{"id":"https://openalex.org/G982292920","display_name":null,"funder_award_id":"NRF-20","funder_id":"https://openalex.org/F4320322120","funder_display_name":"National Research Foundation of Korea"}],"funders":[{"id":"https://openalex.org/F4320320671","display_name":"National Research Foundation","ror":"https://ror.org/05s0g1g46"},{"id":"https://openalex.org/F4320322120","display_name":"National Research Foundation of Korea","ror":"https://ror.org/013aysd81"},{"id":"https://openalex.org/F4320324891","display_name":"Iran Telecommunication Research Center","ror":"https://ror.org/01a3g2z22"},{"id":"https://openalex.org/F4320328359","display_name":"Ministry of Science and ICT, South Korea","ror":"https://ror.org/01wpjm123"},{"id":"https://openalex.org/F4320332195","display_name":"Samsung","ror":"https://ror.org/04w3jy968"},{"id":"https://openalex.org/F4320335489","display_name":"Institute for Information and Communications Technology Promotion","ror":"https://ror.org/01g0hqq23"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3186289964.pdf","grobid_xml":"https://content.openalex.org/works/W3186289964.grobid-xml"},"referenced_works_count":50,"referenced_works":["https://openalex.org/W95608104","https://openalex.org/W1677182931","https://openalex.org/W1972916106","https://openalex.org/W1989099984","https://openalex.org/W2002478203","https://openalex.org/W2016531398","https://openalex.org/W2034181225","https://openalex.org/W2092877006","https://openalex.org/W2119112357","https://openalex.org/W2136849599","https://openalex.org/W2167866796","https://openalex.org/W2191835017","https://openalex.org/W2194775991","https://openalex.org/W2583993537","https://openalex.org/W2604514113","https://openalex.org/W2610406889","https://openalex.org/W2623902153","https://openalex.org/W2626129225","https://openalex.org/W2734941459","https://openalex.org/W2772526503","https://openalex.org/W2787114603","https://openalex.org/W2794670651","https://openalex.org/W2807807191","https://openalex.org/W2903254051","https://openalex.org/W2906791813","https://openalex.org/W2911595481","https://openalex.org/W2914398499","https://openalex.org/W2922395136","https://openalex.org/W2928897890","https://openalex.org/W2931092525","https://openalex.org/W2931743911","https://openalex.org/W2950340157","https://openalex.org/W2963728985","https://openalex.org/W2971002981","https://openalex.org/W2979359324","https://openalex.org/W2982157693","https://openalex.org/W2984200518","https://openalex.org/W2990894474","https://openalex.org/W3007788310","https://openalex.org/W3016842236","https://openalex.org/W3016939927","https://openalex.org/W3034544214","https://openalex.org/W3047401492","https://openalex.org/W3100944043","https://openalex.org/W3105888187","https://openalex.org/W4231332361","https://openalex.org/W4234552385","https://openalex.org/W4235662038","https://openalex.org/W4236099117","https://openalex.org/W4236853429"],"related_works":["https://openalex.org/W3191866865","https://openalex.org/W840708677","https://openalex.org/W2361541374","https://openalex.org/W1439300391","https://openalex.org/W1970491116","https://openalex.org/W2888133284","https://openalex.org/W1570112753","https://openalex.org/W601696587","https://openalex.org/W4360764806","https://openalex.org/W3010050046"],"abstract_inverted_index":{"With":[0],"the":[1,9,56,67,111,116,136,144,147,158,167,174,184,200,207,221],"proliferation":[2],"of":[3,11,69,98,106,124,138,150,186],"applications":[4],"with":[5,34],"machine":[6,71,89],"learning":[7,72,90],"(ML),":[8],"importance":[10],"edge":[12,29,63,117,132],"platforms":[13,30],"has":[14],"been":[15],"growing":[16],"to":[17,25,55,86,92,157,165,215],"process":[18],"streaming":[19],"sensor,":[20],"data":[21,57],"locally":[22],"without":[23],"resorting":[24],"remote":[26],"servers.":[27,59],"Such":[28],"are":[31,51],"commonly":[32],"equipped":[33],"heterogeneous":[35,88,93],"computing":[36,94],"processors":[37],"such":[38,181],"as":[39,61],"GPU,":[40],"DSP,":[41],"and":[42,48,154,191],"other":[43],"accelerators,":[44],"but":[45],"their":[46],"computational":[47],"energy":[49,175],"budget":[50],"severely":[52],"constrained":[53],"compared":[54],"center":[58],"However,":[60],"an":[62],"platform":[64],"must":[65,101],"perform":[66],"processing":[68,97],"multiple":[70],"models":[73],"concurrently":[74],"for":[75,115,131,177],"multimodal":[76],"sensor":[77],"data,":[78],"its":[79,194,218],"scheduling":[80,112,129],"problem":[81],"poses":[82],"a":[83,103,122,204,211],"new":[84,125],"challenge":[85,185],"map":[87],"computation":[91,139,188],"processors.":[95,161],"Furthermore,":[96],"each":[99,151,178],"input":[100],"provide":[102],"certain":[104],"level":[105],"bounded":[107],"response":[108],"latency,":[109],"making":[110],"decision":[113],"critical":[114],"platform.":[118],"This":[119],"article":[120],"proposes":[121],"set":[123],"heterogeneity-aware":[126],"ML":[127,142,152,187,213],"inference":[128],"policies":[130],"platforms.":[133],"Based":[134],"on":[135,189],"regularity":[137],"in":[140,220],"common":[141],"tasks,":[143],"scheduler":[145,209],"uses":[146],"pre-profiled":[148],"behavior":[149],"model":[153],"routes":[155],"requests":[156],"most":[159],"appropriate":[160],"It":[162],"also":[163],"aims":[164],"satisfy":[166],"service-level":[168],"objective":[169],"(SLO)":[170],"requirement":[171],"while":[172],"reducing":[173],"consumption":[176],"request.":[179],"For":[180],"SLO":[182],"supports,":[183],"GPUs":[190],"DSP":[192],"is":[193],"inflexible":[195],"preemption":[196],"capability.":[197],"To":[198],"avoid":[199],"delay":[201],"caused":[202],"by":[203,217],"long":[205],"task,":[206],"proposed":[208],"decomposes":[210],"large":[212],"task":[214],"sub-tasks":[216],"layer":[219],"DNN":[222],"model.":[223]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":18},{"year":2024,"cited_by_count":14},{"year":2023,"cited_by_count":13},{"year":2022,"cited_by_count":2}],"updated_date":"2026-04-21T08:09:41.155169","created_date":"2025-10-10T00:00:00"}
