{"id":"https://openalex.org/W4414898312","doi":"https://doi.org/10.1109/cluster59342.2025.11186486","title":"Deadline-Aware Resource Allocation and Scheduling of Serverless Workloads on Heterogeneous Clusters","display_name":"Deadline-Aware Resource Allocation and Scheduling of Serverless Workloads on Heterogeneous Clusters","publication_year":2025,"publication_date":"2025-09-02","ids":{"openalex":"https://openalex.org/W4414898312","doi":"https://doi.org/10.1109/cluster59342.2025.11186486"},"language":"en","primary_location":{"id":"doi:10.1109/cluster59342.2025.11186486","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cluster59342.2025.11186486","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Cluster Computing (CLUSTER)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5015033668","display_name":"Matthias Fritz","orcid":"https://orcid.org/0000-0002-8369-9202"},"institutions":[{"id":"https://openalex.org/I129774422","display_name":"University of Vienna","ror":"https://ror.org/03prydq77","country_code":"AT","type":"education","lineage":["https://openalex.org/I129774422"]}],"countries":["AT"],"is_corresponding":false,"raw_author_name":"Matthias Fritz","raw_affiliation_strings":["University of Vienna,Faculty of Computer Science,Vienna,Austria"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Vienna,Faculty of Computer Science,Vienna,Austria","institution_ids":["https://openalex.org/I129774422"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065806871","display_name":"Siegfried Benkner","orcid":"https://orcid.org/0000-0002-6520-2047"},"institutions":[{"id":"https://openalex.org/I129774422","display_name":"University of Vienna","ror":"https://ror.org/03prydq77","country_code":"AT","type":"education","lineage":["https://openalex.org/I129774422"]}],"countries":["AT"],"is_corresponding":false,"raw_author_name":"Siegfried Benkner","raw_affiliation_strings":["University of Vienna,Faculty of Computer Science,Vienna,Austria"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Vienna,Faculty of Computer Science,Vienna,Austria","institution_ids":["https://openalex.org/I129774422"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5056654204","display_name":"Enes Bajrovi\u0107","orcid":null},"institutions":[{"id":"https://openalex.org/I129774422","display_name":"University of Vienna","ror":"https://ror.org/03prydq77","country_code":"AT","type":"education","lineage":["https://openalex.org/I129774422"]}],"countries":["AT"],"is_corresponding":false,"raw_author_name":"Enes Bajrovic","raw_affiliation_strings":["University of Vienna,Faculty of Computer Science,Vienna,Austria"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Vienna,Faculty of Computer Science,Vienna,Austria","institution_ids":["https://openalex.org/I129774422"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I129774422"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.36785909,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"11"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9409999847412109,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9409999847412109,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10715","display_name":"Distributed and Parallel Computing Systems","score":0.9326000213623047,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10273","display_name":"IoT and Edge/Fog Computing","score":0.9320999979972839,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cloud-computing","display_name":"Cloud computing","score":0.7429999709129333},{"id":"https://openalex.org/keywords/scheduling","display_name":"Scheduling (production processes)","score":0.6740000247955322},{"id":"https://openalex.org/keywords/software-deployment","display_name":"Software deployment","score":0.5992000102996826},{"id":"https://openalex.org/keywords/workload","display_name":"Workload","score":0.582099974155426},{"id":"https://openalex.org/keywords/resource-allocation","display_name":"Resource allocation","score":0.48179998993873596},{"id":"https://openalex.org/keywords/resource","display_name":"Resource (disambiguation)","score":0.38589999079704285},{"id":"https://openalex.org/keywords/quality-of-service","display_name":"Quality of service","score":0.37540000677108765},{"id":"https://openalex.org/keywords/live-migration","display_name":"Live migration","score":0.33719998598098755}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8687999844551086},{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.7429999709129333},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.6740000247955322},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.6146000027656555},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.5992000102996826},{"id":"https://openalex.org/C2778476105","wikidata":"https://www.wikidata.org/wiki/Q628539","display_name":"Workload","level":2,"score":0.582099974155426},{"id":"https://openalex.org/C29202148","wikidata":"https://www.wikidata.org/wiki/Q287260","display_name":"Resource allocation","level":2,"score":0.48179998993873596},{"id":"https://openalex.org/C206345919","wikidata":"https://www.wikidata.org/wiki/Q20380951","display_name":"Resource (disambiguation)","level":2,"score":0.38589999079704285},{"id":"https://openalex.org/C5119721","wikidata":"https://www.wikidata.org/wiki/Q220501","display_name":"Quality of service","level":2,"score":0.37540000677108765},{"id":"https://openalex.org/C2778710394","wikidata":"https://www.wikidata.org/wiki/Q4179813","display_name":"Live migration","level":4,"score":0.33719998598098755},{"id":"https://openalex.org/C62611344","wikidata":"https://www.wikidata.org/wiki/Q1062658","display_name":"Node (physics)","level":2,"score":0.33059999346733093},{"id":"https://openalex.org/C2780609101","wikidata":"https://www.wikidata.org/wiki/Q17156588","display_name":"Resource management (computing)","level":2,"score":0.32249999046325684},{"id":"https://openalex.org/C93996380","wikidata":"https://www.wikidata.org/wiki/Q44127","display_name":"Server","level":2,"score":0.31439998745918274},{"id":"https://openalex.org/C2777958785","wikidata":"https://www.wikidata.org/wiki/Q17120940","display_name":"Resource efficiency","level":2,"score":0.28859999775886536},{"id":"https://openalex.org/C107568181","wikidata":"https://www.wikidata.org/wiki/Q5319000","display_name":"Dynamic priority scheduling","level":3,"score":0.28630000352859497},{"id":"https://openalex.org/C51332947","wikidata":"https://www.wikidata.org/wiki/Q1172305","display_name":"Shared resource","level":2,"score":0.27959999442100525},{"id":"https://openalex.org/C527821871","wikidata":"https://www.wikidata.org/wiki/Q228502","display_name":"Access control","level":2,"score":0.2793999910354614},{"id":"https://openalex.org/C123403432","wikidata":"https://www.wikidata.org/wiki/Q654068","display_name":"Visibility","level":2,"score":0.27869999408721924},{"id":"https://openalex.org/C19012869","wikidata":"https://www.wikidata.org/wiki/Q578372","display_name":"Response time","level":2,"score":0.27810001373291016},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.27469998598098755},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.27390000224113464},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.2700999975204468},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.25519999861717224}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cluster59342.2025.11186486","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cluster59342.2025.11186486","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Cluster Computing (CLUSTER)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":18,"referenced_works":["https://openalex.org/W2561596638","https://openalex.org/W2963330479","https://openalex.org/W2963788825","https://openalex.org/W2963974647","https://openalex.org/W3044723004","https://openalex.org/W3047528232","https://openalex.org/W3089365967","https://openalex.org/W3112094022","https://openalex.org/W3116554259","https://openalex.org/W3155705005","https://openalex.org/W3169257120","https://openalex.org/W3188481800","https://openalex.org/W3214103365","https://openalex.org/W4226302867","https://openalex.org/W4283211213","https://openalex.org/W4292973069","https://openalex.org/W4312781266","https://openalex.org/W4402186981"],"related_works":[],"abstract_inverted_index":{"Serverless":[0],"computing":[1],"has":[2],"become":[3],"widely":[4],"adopted":[5],"as":[6,173],"a":[7,44,78,153],"cloud":[8,29],"deployment":[9],"model":[10],"due":[11],"to":[12,28,65,96],"its":[13],"ease":[14],"of":[15],"use":[16],"and":[17,31,47,80,83,105,120,135,168,182],"finegrained":[18],"pay-as-you-go":[19],"pricing.":[20],"By":[21,164],"hiding":[22],"infrastructure":[23],"complexity,":[24],"it":[25,63,114,131],"simplifies":[26],"access":[27],"resources":[30],"lets":[32],"developers":[33],"focus":[34],"on":[35,43,126],"application":[36],"code.":[37],"However,":[38],"most":[39],"serverless":[40,89],"platforms":[41],"operate":[42],"best-effort":[45],"basis":[46],"provide":[48],"minimal":[49],"control":[50],"over":[51],"performance":[52],"tuning.":[53,163],"Combined":[54],"with":[55],"limited":[56],"visibility":[57],"into":[58],"underlying":[59],"hardware,":[60],"this":[61],"makes":[62],"difficult":[64],"reliably":[66],"meet":[67],"Service":[68],"Level":[69],"Objectives":[70],"(SLOs).":[71],"To":[72,111],"address":[73],"this,":[74],"we":[75],"introduce":[76],"DHRT,":[77],"deadline-":[79],"heterogeneity-aware":[81],"scheduling":[82,134],"resource":[84,99,136,150,162,180],"allocation":[85,137],"framework":[86],"for":[87,116,160],"performance-critical":[88],"workloads.":[90],"DHRT":[91,125,147,178],"applies":[92],"heuristic-driven":[93],"online":[94],"optimisation":[95],"iteratively":[97],"refine":[98],"estimates":[100,149],"by":[101,129],"leveraging":[102],"real-time":[103],"metrics":[104],"historical":[106],"data":[107],"from":[108],"live":[109,155],"executions.":[110],"fulfil":[112],"SLOs,":[113],"accounts":[115],"both":[117],"workload":[118],"characteristics":[119],"node":[121,166],"heterogeneity.":[122],"We":[123],"evaluate":[124],"synthetic":[127],"workloads":[128,174],"comparing":[130],"against":[132],"baseline":[133],"policies":[138],"commonly":[139],"used":[140],"in":[141],"FaaS":[142],"platforms.":[143],"Results":[144],"show":[145],"that":[146],"accurately":[148],"demands":[151],"within":[152],"few":[154],"executions,":[156],"eliminating":[157],"the":[158],"need":[159],"manual":[161],"exploiting":[165],"heterogeneity":[167],"dynamically":[169],"scaling":[170],"vCPU":[171],"allocations":[172],"near":[175],"their":[176],"deadlines,":[177],"improves":[179],"efficiency":[181],"significantly":[183],"reduces":[184],"deadline":[185],"violations.":[186]},"counts_by_year":[],"updated_date":"2026-06-26T08:34:08.712188","created_date":"2025-10-10T00:00:00"}
