{"id":"https://openalex.org/W3100293451","doi":"https://doi.org/10.1145/3529375","title":"RL-QN: A Reinforcement Learning Framework for Optimal Control of Queueing Systems","display_name":"RL-QN: A Reinforcement Learning Framework for Optimal Control of Queueing Systems","publication_year":2022,"publication_date":"2022-03-31","ids":{"openalex":"https://openalex.org/W3100293451","doi":"https://doi.org/10.1145/3529375","mag":"3100293451"},"language":"en","primary_location":{"id":"doi:10.1145/3529375","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3529375","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3529375","source":{"id":"https://openalex.org/S4210231956","display_name":"ACM Transactions on Modeling and Performance Evaluation of Computing Systems","issn_l":"2376-3639","issn":["2376-3639","2376-3647"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Modeling and Performance Evaluation of Computing Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3529375","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5042253177","display_name":"Bai Liu","orcid":"https://orcid.org/0000-0002-3950-4965"},"institutions":[{"id":"https://openalex.org/I63966007","display_name":"Massachusetts Institute of Technology","ror":"https://ror.org/042nb2s44","country_code":"US","type":"education","lineage":["https://openalex.org/I63966007"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Bai Liu","raw_affiliation_strings":["Massachusetts Institute of Technology, Cambridge, MA"],"raw_orcid":"https://orcid.org/0000-0002-3950-4965","affiliations":[{"raw_affiliation_string":"Massachusetts Institute of Technology, Cambridge, MA","institution_ids":["https://openalex.org/I63966007"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008882694","display_name":"Qiaomin Xie","orcid":"https://orcid.org/0000-0003-2834-6866"},"institutions":[{"id":"https://openalex.org/I135310074","display_name":"University of Wisconsin\u2013Madison","ror":"https://ror.org/01y2jtd41","country_code":"US","type":"education","lineage":["https://openalex.org/I135310074"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Qiaomin Xie","raw_affiliation_strings":["University of Wisconsin-Madison, Madison, WI"],"raw_orcid":"https://orcid.org/0000-0003-2834-6866","affiliations":[{"raw_affiliation_string":"University of Wisconsin-Madison, Madison, WI","institution_ids":["https://openalex.org/I135310074"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5036587377","display_name":"Eytan Modiano","orcid":null},"institutions":[{"id":"https://openalex.org/I63966007","display_name":"Massachusetts Institute of Technology","ror":"https://ror.org/042nb2s44","country_code":"US","type":"education","lineage":["https://openalex.org/I63966007"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Eytan Modiano","raw_affiliation_strings":["Massachusetts Institute of Technology, Cambridge, MA"],"raw_orcid":"https://orcid.org/0000-0001-8238-8130","affiliations":[{"raw_affiliation_string":"Massachusetts Institute of Technology, Cambridge, MA","institution_ids":["https://openalex.org/I63966007"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.9964,"has_fulltext":true,"cited_by_count":16,"citation_normalized_percentile":{"value":0.86348835,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":"7","issue":"1","first_page":"1","last_page":"35"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13553","display_name":"Age of Information Optimization","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13553","display_name":"Age of Information Optimization","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11409","display_name":"Advanced Wireless Network Optimization","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10974","display_name":"Advanced Queuing Theory Analysis","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1404","display_name":"Management Information Systems"},"field":{"id":"https://openalex.org/fields/14","display_name":"Business, Management and Accounting"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.9089579582214355},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7713131904602051},{"id":"https://openalex.org/keywords/queueing-theory","display_name":"Queueing theory","score":0.7624430656433105},{"id":"https://openalex.org/keywords/state-space","display_name":"State space","score":0.6901962161064148},{"id":"https://openalex.org/keywords/queue","display_name":"Queue","score":0.6571670174598694},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.5763940811157227},{"id":"https://openalex.org/keywords/routing","display_name":"Routing (electronic design automation)","score":0.5495903491973877},{"id":"https://openalex.org/keywords/layered-queueing-network","display_name":"Layered queueing network","score":0.5414528846740723},{"id":"https://openalex.org/keywords/state","display_name":"State (computer science)","score":0.5238247513771057},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.4419364333152771},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.3992646336555481},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.2528305649757385},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.16005128622055054},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.1543559730052948},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.15176787972450256}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.9089579582214355},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7713131904602051},{"id":"https://openalex.org/C22684755","wikidata":"https://www.wikidata.org/wiki/Q847526","display_name":"Queueing theory","level":2,"score":0.7624430656433105},{"id":"https://openalex.org/C72434380","wikidata":"https://www.wikidata.org/wiki/Q230930","display_name":"State space","level":2,"score":0.6901962161064148},{"id":"https://openalex.org/C160403385","wikidata":"https://www.wikidata.org/wiki/Q220543","display_name":"Queue","level":2,"score":0.6571670174598694},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.5763940811157227},{"id":"https://openalex.org/C74172769","wikidata":"https://www.wikidata.org/wiki/Q1446839","display_name":"Routing (electronic design automation)","level":2,"score":0.5495903491973877},{"id":"https://openalex.org/C33891772","wikidata":"https://www.wikidata.org/wiki/Q6505536","display_name":"Layered queueing network","level":3,"score":0.5414528846740723},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.5238247513771057},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.4419364333152771},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.3992646336555481},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.2528305649757385},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.16005128622055054},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.1543559730052948},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.15176787972450256},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1145/3529375","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3529375","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3529375","source":{"id":"https://openalex.org/S4210231956","display_name":"ACM Transactions on Modeling and Performance Evaluation of Computing Systems","issn_l":"2376-3639","issn":["2376-3639","2376-3647"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Modeling and Performance Evaluation of Computing Systems","raw_type":"journal-article"},{"id":"pmh:oai:dspace.mit.edu:1721.1/145441","is_oa":true,"landing_page_url":"https://hdl.handle.net/1721.1/145441","pdf_url":null,"source":{"id":"https://openalex.org/S4306400425","display_name":"DSpace@MIT (Massachusetts Institute of Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I63966007","host_organization_name":"Massachusetts Institute of Technology","host_organization_lineage":["https://openalex.org/I63966007"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-sa","license_id":"https://openalex.org/licenses/cc-by-nc-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv","raw_type":"http://purl.org/eprint/type/JournalArticle"},{"id":"pmh:oai:dspace.mit.edu:1721.1/145441.2","is_oa":true,"landing_page_url":"https://hdl.handle.net/1721.1/145441.2","pdf_url":null,"source":{"id":"https://openalex.org/S4306400425","display_name":"DSpace@MIT (Massachusetts Institute of Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I63966007","host_organization_name":"Massachusetts Institute of Technology","host_organization_lineage":["https://openalex.org/I63966007"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"ACM","raw_type":"http://purl.org/eprint/type/JournalArticle"}],"best_oa_location":{"id":"doi:10.1145/3529375","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3529375","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3529375","source":{"id":"https://openalex.org/S4210231956","display_name":"ACM Transactions on Modeling and Performance Evaluation of Computing Systems","issn_l":"2376-3639","issn":["2376-3639","2376-3647"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Modeling and Performance Evaluation of Computing Systems","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/8","display_name":"Decent work and economic growth","score":0.550000011920929}],"awards":[{"id":"https://openalex.org/G3431152219","display_name":"CNS Core: Small: Wireless Network Control in Uncooperative and Adversarial Environments","funder_award_id":"1907905","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G4949411081","display_name":null,"funder_award_id":"N00014-20-1-2119","funder_id":"https://openalex.org/F4320337345","funder_display_name":"Office of Naval Research"},{"id":"https://openalex.org/G7873380069","display_name":null,"funder_award_id":"CNS-1907905","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G8409476322","display_name":"NeTS: Small:  A Migration Approach to Optimal Control of Wireless Networks","funder_award_id":"1524317","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G8445870396","display_name":null,"funder_award_id":"CNS-1524317","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G8876996369","display_name":null,"funder_award_id":"N00014","funder_id":"https://openalex.org/F4320337345","funder_display_name":"Office of Naval Research"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320337345","display_name":"Office of Naval Research","ror":"https://ror.org/00rk2pe57"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3100293451.pdf","grobid_xml":"https://content.openalex.org/works/W3100293451.grobid-xml"},"referenced_works_count":64,"referenced_works":["https://openalex.org/W9378068","https://openalex.org/W21934178","https://openalex.org/W32403112","https://openalex.org/W55761002","https://openalex.org/W1530975313","https://openalex.org/W1597460884","https://openalex.org/W1606815489","https://openalex.org/W1628466589","https://openalex.org/W1646707810","https://openalex.org/W1662803991","https://openalex.org/W1845202788","https://openalex.org/W1850488217","https://openalex.org/W1973022038","https://openalex.org/W1995713768","https://openalex.org/W2003346154","https://openalex.org/W2004964364","https://openalex.org/W2020677283","https://openalex.org/W2042216697","https://openalex.org/W2042545172","https://openalex.org/W2074823898","https://openalex.org/W2093892790","https://openalex.org/W2095454008","https://openalex.org/W2098432798","https://openalex.org/W2103048107","https://openalex.org/W2103098926","https://openalex.org/W2104517640","https://openalex.org/W2111764152","https://openalex.org/W2120344179","https://openalex.org/W2125591683","https://openalex.org/W2126878542","https://openalex.org/W2132940773","https://openalex.org/W2133499361","https://openalex.org/W2135663206","https://openalex.org/W2155027007","https://openalex.org/W2156006461","https://openalex.org/W2156738026","https://openalex.org/W2157179371","https://openalex.org/W2165768656","https://openalex.org/W2168049152","https://openalex.org/W2168739325","https://openalex.org/W2170400507","https://openalex.org/W2293168792","https://openalex.org/W2333199285","https://openalex.org/W2466174699","https://openalex.org/W2556422671","https://openalex.org/W2565612488","https://openalex.org/W2585430551","https://openalex.org/W2612336410","https://openalex.org/W2768473197","https://openalex.org/W2790924949","https://openalex.org/W2793477598","https://openalex.org/W2898231005","https://openalex.org/W2963079995","https://openalex.org/W2963561337","https://openalex.org/W2963654220","https://openalex.org/W2999204576","https://openalex.org/W3020125231","https://openalex.org/W3046060145","https://openalex.org/W3099885902","https://openalex.org/W3105861207","https://openalex.org/W3151804457","https://openalex.org/W3196847620","https://openalex.org/W4256307687","https://openalex.org/W4300848284"],"related_works":["https://openalex.org/W1701464461","https://openalex.org/W36834199","https://openalex.org/W2168047232","https://openalex.org/W2121863833","https://openalex.org/W2137668347","https://openalex.org/W2149540948","https://openalex.org/W2170282368","https://openalex.org/W1977970311","https://openalex.org/W1600602066","https://openalex.org/W1556477456"],"abstract_inverted_index":{"With":[0],"the":[1,15,59,68,74,87,92,121,131,134,139,155,175],"rapid":[2],"advance":[3],"of":[4,33,91,120,133],"information":[5],"technology,":[6],"network":[7,29,39,93],"systems":[8],"have":[9],"become":[10],"increasingly":[11],"complex":[12],"and":[13,166],"hence":[14],"underlying":[16],"system":[17],"dynamics":[18],"are":[19],"often":[20],"unknown":[21],"or":[22,44],"difficult":[23],"to":[24,36,57,154],"characterize.":[25],"Finding":[26],"a":[27,102,117,126],"good":[28],"control":[30,61,94],"policy":[31,62,129],"is":[32,78],"significant":[34],"importance":[35],"achieve":[37],"desirable":[38],"performance":[40],"(e.g.,":[41],"high":[42],"throughput":[43],"low":[45],"delay).":[46],"In":[47],"this":[48,98],"work,":[49],"we":[50,100],"consider":[51],"using":[52],"model-based":[53,113],"reinforcement":[54],"learning":[55],"(RL)":[56],"learn":[58],"optimal":[60,156],"for":[63,107,130],"queueing":[64],"networks":[65],"so":[66],"that":[67,138,172],"average":[69,75,140,176],"job":[70],"delay":[71],"(or":[72],"equivalently":[73],"queue":[76,141,177],"backlog)":[77],"minimized.":[79],"Traditional":[80],"approaches":[81],"in":[82,161],"RL,":[83],"however,":[84],"cannot":[85],"handle":[86],"unbounded":[88],"state":[89,122],"spaces":[90],"problem.":[95],"To":[96],"overcome":[97],"difficulty,":[99],"propose":[101],"new":[103],"algorithm,":[104],"called":[105],"RL":[106,114],"Queueing":[108],"Networks":[109],"(RL-QN),":[110],"which":[111],"applies":[112],"methods":[115],"over":[116],"finite":[118],"subset":[119,149],"space":[123],"while":[124],"applying":[125],"known":[127],"stabilizing":[128],"rest":[132],"states.":[135],"We":[136,158],"establish":[137],"backlog":[142,178],"under":[143],"RL-QN":[144,160,173],"with":[145],"an":[146],"appropriately":[147],"constructed":[148],"can":[150],"be":[151],"arbitrarily":[152],"close":[153],"result.":[157],"evaluate":[159],"dynamic":[162],"server":[163],"allocation,":[164],"routing,":[165],"switching":[167],"problems.":[168],"Simulation":[169],"results":[170],"show":[171],"minimizes":[174],"effectively.":[179]},"counts_by_year":[{"year":2025,"cited_by_count":8},{"year":2024,"cited_by_count":6},{"year":2021,"cited_by_count":2}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
