{"id":"https://openalex.org/W7151315206","doi":"https://doi.org/10.1109/icmla66185.2025.00070","title":"SLA-MORL: SLA-Aware Multi-Objective Reinforcement Learning for HPC Resource Optimization","display_name":"SLA-MORL: SLA-Aware Multi-Objective Reinforcement Learning for HPC Resource Optimization","publication_year":2025,"publication_date":"2025-12-03","ids":{"openalex":"https://openalex.org/W7151315206","doi":"https://doi.org/10.1109/icmla66185.2025.00070"},"language":null,"primary_location":{"id":"doi:10.1109/icmla66185.2025.00070","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icmla66185.2025.00070","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 International Conference on Machine Learning and Applications (ICMLA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5009690297","display_name":"Seraj Al Mahmud Mostafa","orcid":null},"institutions":[{"id":"https://openalex.org/I79272384","display_name":"University of Maryland, Baltimore County","ror":"https://ror.org/02qskvh78","country_code":"US","type":"education","lineage":["https://openalex.org/I79272384"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Seraj Al Mahmud Mostafa","raw_affiliation_strings":["University of Maryland, Baltimore County,Department of Information Systems,Baltimore,MD,USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Maryland, Baltimore County,Department of Information Systems,Baltimore,MD,USA","institution_ids":["https://openalex.org/I79272384"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088291022","display_name":"Aravind Mohan","orcid":"https://orcid.org/0000-0003-3621-4716"},"institutions":[{"id":"https://openalex.org/I78157498","display_name":"McMurry University","ror":"https://ror.org/045x76g34","country_code":"US","type":"education","lineage":["https://openalex.org/I78157498"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Aravind Mohan","raw_affiliation_strings":["McMurry University,Department of Computer Science,Abilene,TX,USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"McMurry University,Department of Computer Science,Abilene,TX,USA","institution_ids":["https://openalex.org/I78157498"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101750217","display_name":"Jianwu Wang","orcid":"https://orcid.org/0000-0002-9933-1170"},"institutions":[{"id":"https://openalex.org/I79272384","display_name":"University of Maryland, Baltimore County","ror":"https://ror.org/02qskvh78","country_code":"US","type":"education","lineage":["https://openalex.org/I79272384"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jianwu Wang","raw_affiliation_strings":["University of Maryland, Baltimore County,Department of Information Systems,Baltimore,MD,USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Maryland, Baltimore County,Department of Information Systems,Baltimore,MD,USA","institution_ids":["https://openalex.org/I79272384"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5009690297"],"corresponding_institution_ids":["https://openalex.org/I79272384"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.76898848,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"468","last_page":"475"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10715","display_name":"Distributed and Parallel Computing Systems","score":0.5134000182151794,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10715","display_name":"Distributed and Parallel Computing Systems","score":0.5134000182151794,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.18549999594688416,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.019200000911951065,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.48410001397132874},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.3779999911785126},{"id":"https://openalex.org/keywords/resource","display_name":"Resource (disambiguation)","score":0.3522999882698059},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.3301999866962433},{"id":"https://openalex.org/keywords/process-control","display_name":"Process control","score":0.28189998865127563}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5992000102996826},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.48410001397132874},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.3779999911785126},{"id":"https://openalex.org/C206345919","wikidata":"https://www.wikidata.org/wiki/Q20380951","display_name":"Resource (disambiguation)","level":2,"score":0.3522999882698059},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.351500004529953},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.3301999866962433},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.2939000129699707},{"id":"https://openalex.org/C155386361","wikidata":"https://www.wikidata.org/wiki/Q1649571","display_name":"Process control","level":3,"score":0.28189998865127563},{"id":"https://openalex.org/C17500928","wikidata":"https://www.wikidata.org/wiki/Q959968","display_name":"Control system","level":2,"score":0.27619999647140503},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.26919999718666077}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icmla66185.2025.00070","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icmla66185.2025.00070","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 International Conference on Machine Learning and Applications (ICMLA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320306101","display_name":"National Aeronautics and Space Administration","ror":"https://ror.org/027ka1x80"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W2509009443","https://openalex.org/W2597068831","https://openalex.org/W2745047326","https://openalex.org/W2977286878","https://openalex.org/W3022437934","https://openalex.org/W3131479975","https://openalex.org/W3164621937","https://openalex.org/W4205601070","https://openalex.org/W4214717370","https://openalex.org/W4304820446","https://openalex.org/W4309652652","https://openalex.org/W4312811994","https://openalex.org/W4382202987","https://openalex.org/W4382202996","https://openalex.org/W4382239144","https://openalex.org/W4382656719","https://openalex.org/W4389077433","https://openalex.org/W4405014024","https://openalex.org/W4405974735","https://openalex.org/W4409363746","https://openalex.org/W4409364052","https://openalex.org/W4416726501","https://openalex.org/W7133199514","https://openalex.org/W7133204973","https://openalex.org/W7133207146","https://openalex.org/W7133228143"],"related_works":[],"abstract_inverted_index":{"Dynamic":[0],"resource":[1,34,45,128,205],"allocation":[2,35,142],"for":[3,168,175,203],"machine":[4],"learning":[5,54,86],"workloads":[6,154],"in":[7,165,173,181,213],"cloud":[8,204],"environments":[9],"remains":[10],"challenging":[11],"due":[12],"to":[13,40,139,186],"competing":[14],"objectives":[15],"of":[16],"minimizing":[17],"training":[18,130,166,216],"time":[19,167],"and":[20,60,101,132,178,194,211,222],"operational":[21],"costs":[22,174],"while":[23,71],"meeting":[24],"Service":[25],"Level":[26],"Agreement":[27],"(SLA)":[28],"constraints.":[29],"Traditional":[30],"approaches":[31],"employ":[32],"static":[33,187],"or":[36,44,69,87],"single-objective":[37],"optimization,":[38],"leading":[39],"either":[41],"SLA":[42,73,114,133,183],"violations":[43],"waste.":[46],"We":[47],"present":[48],"SLA-MORL,":[49],"an":[50,136],"adaptive":[51],"multi-objective":[52],"reinforcement":[53],"framework":[55],"that":[56,91,106,160,207],"intelligently":[57],"allocates":[58],"GPU":[59],"CPU":[61],"resources":[62],"based":[63,111],"on":[64,112,150],"user-defined":[65],"preferences":[66],"(time,":[67],"cost,":[68,210],"balanced)":[70],"ensuring":[72],"compliance.":[74],"Our":[75,218],"approach":[76],"introduces":[77],"two":[78],"key":[79],"innovations:":[80],"(1)":[81],"intelligent":[82],"initialization":[83],"through":[84],"historical":[85],"efficient":[88],"baseline":[89],"runs":[90],"eliminates":[92],"cold-start":[93,192],"problems,":[94],"reducing":[95],"initial":[96],"exploration":[97],"overhead":[98],"by":[99],"60%,":[100],"(2)":[102],"dynamic":[103,195],"weight":[104],"adaptation":[105,196],"automatically":[107],"adjusts":[108],"optimization":[109],"priorities":[110],"real-time":[113],"violation":[115],"severity,":[116],"creating":[117],"a":[118,123,200],"self-correcting":[119],"system.":[120],"SLA-MORL":[121,161,198],"constructs":[122],"21-dimensional":[124],"state":[125],"representation":[126],"capturing":[127],"utilization,":[129],"progress,":[131],"compliance,":[134],"enabling":[135],"actor-critic":[137],"network":[138],"make":[140],"informed":[141],"decisions":[143],"across":[144],"9":[145],"possible":[146],"actions.":[147],"Extensive":[148],"evaluation":[149],"13":[151],"diverse":[152],"ML":[153,215],"using":[155],"production":[156],"HPC":[157],"infrastructure":[158],"demonstrates":[159],"achieves":[162],"67.2%":[163],"reduction":[164,172],"deadline-critical":[169],"jobs,":[170],"68.8%":[171],"budget-constrained":[176],"workloads,":[177],"73.4%":[179],"improvement":[180],"overall":[182],"compliance":[184],"compared":[185],"baselines.":[188],"By":[189],"addressing":[190],"both":[191],"inefficiency":[193],"challenges,":[197],"provides":[199],"practical":[201],"solution":[202],"management":[206],"balances":[208],"performance,":[209],"reliability":[212],"modern":[214],"environments.":[217],"code":[219],"is":[220],"open-source":[221],"available":[223],"at":[224],"https://github.com/big-data-lab-umbc/SLA-MORL.":[225]},"counts_by_year":[],"updated_date":"2026-04-30T09:15:22.047038","created_date":"2026-04-08T00:00:00"}
