{"id":"https://openalex.org/W7116701494","doi":"https://doi.org/10.23919/cnsm67658.2025.11297572","title":"Decentralized Intelligence for Centralized Control: Multi-Agent Reinforcement Learning for SD-WAN","display_name":"Decentralized Intelligence for Centralized Control: Multi-Agent Reinforcement Learning for SD-WAN","publication_year":2025,"publication_date":"2025-10-27","ids":{"openalex":"https://openalex.org/W7116701494","doi":"https://doi.org/10.23919/cnsm67658.2025.11297572"},"language":"en","primary_location":{"id":"doi:10.23919/cnsm67658.2025.11297572","is_oa":false,"landing_page_url":"https://doi.org/10.23919/cnsm67658.2025.11297572","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 21st International Conference on Network and Service Management (CNSM)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5120960153","display_name":"Elshan Khanlari","orcid":null},"institutions":[{"id":"https://openalex.org/I108290504","display_name":"University of Pisa","ror":"https://ror.org/03ad39j10","country_code":"IT","type":"education","lineage":["https://openalex.org/I108290504"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Elshan Khanlari","raw_affiliation_strings":["University of Pisa,Dept. of Information Engineering, Via G. Caruso 16,Pisa,Italy,56122"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Pisa,Dept. of Information Engineering, Via G. Caruso 16,Pisa,Italy,56122","institution_ids":["https://openalex.org/I108290504"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5092460583","display_name":"Luca Borgianni","orcid":"https://orcid.org/0009-0007-1097-0421"},"institutions":[{"id":"https://openalex.org/I108290504","display_name":"University of Pisa","ror":"https://ror.org/03ad39j10","country_code":"IT","type":"education","lineage":["https://openalex.org/I108290504"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Luca Borgianni","raw_affiliation_strings":["University of Pisa,Dept. of Information Engineering, Via G. Caruso 16,Pisa,Italy,56122"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Pisa,Dept. of Information Engineering, Via G. Caruso 16,Pisa,Italy,56122","institution_ids":["https://openalex.org/I108290504"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007526433","display_name":"Davide Adami","orcid":"https://orcid.org/0000-0003-3007-1400"},"institutions":[{"id":"https://openalex.org/I108290504","display_name":"University of Pisa","ror":"https://ror.org/03ad39j10","country_code":"IT","type":"education","lineage":["https://openalex.org/I108290504"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Davide Adami","raw_affiliation_strings":["University of Pisa,CNIT,Dept. of Information Engineering, Via G. Caruso 16,Pisa,Italy,56122"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Pisa,CNIT,Dept. of Information Engineering, Via G. Caruso 16,Pisa,Italy,56122","institution_ids":["https://openalex.org/I108290504"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5010219752","display_name":"S. Giordano","orcid":null},"institutions":[{"id":"https://openalex.org/I108290504","display_name":"University of Pisa","ror":"https://ror.org/03ad39j10","country_code":"IT","type":"education","lineage":["https://openalex.org/I108290504"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Stefano Giordano","raw_affiliation_strings":["University of Pisa,Dept. of Information Engineering, Via G. Caruso 16,Pisa,Italy,56122"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Pisa,Dept. of Information Engineering, Via G. Caruso 16,Pisa,Italy,56122","institution_ids":["https://openalex.org/I108290504"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.58769349,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10714","display_name":"Software-Defined Networks and 5G","score":0.9079999923706055,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10714","display_name":"Software-Defined Networks and 5G","score":0.9079999923706055,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10138","display_name":"Network Traffic and Congestion Control","score":0.03779999911785126,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11158","display_name":"Wireless Networks and Protocols","score":0.010599999688565731,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8185999989509583},{"id":"https://openalex.org/keywords/underlay","display_name":"Underlay","score":0.6462000012397766},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6220999956130981},{"id":"https://openalex.org/keywords/overlay","display_name":"Overlay","score":0.5403000116348267},{"id":"https://openalex.org/keywords/quality-of-service","display_name":"Quality of service","score":0.5177000164985657},{"id":"https://openalex.org/keywords/resource","display_name":"Resource (disambiguation)","score":0.47269999980926514},{"id":"https://openalex.org/keywords/resource-allocation","display_name":"Resource allocation","score":0.4544000029563904},{"id":"https://openalex.org/keywords/routing","display_name":"Routing (electronic design automation)","score":0.4424999952316284}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8185999989509583},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.76910001039505},{"id":"https://openalex.org/C2777679929","wikidata":"https://www.wikidata.org/wiki/Q7883709","display_name":"Underlay","level":3,"score":0.6462000012397766},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6220999956130981},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.5863000154495239},{"id":"https://openalex.org/C136085584","wikidata":"https://www.wikidata.org/wiki/Q910289","display_name":"Overlay","level":2,"score":0.5403000116348267},{"id":"https://openalex.org/C5119721","wikidata":"https://www.wikidata.org/wiki/Q220501","display_name":"Quality of service","level":2,"score":0.5177000164985657},{"id":"https://openalex.org/C206345919","wikidata":"https://www.wikidata.org/wiki/Q20380951","display_name":"Resource (disambiguation)","level":2,"score":0.47269999980926514},{"id":"https://openalex.org/C29202148","wikidata":"https://www.wikidata.org/wiki/Q287260","display_name":"Resource allocation","level":2,"score":0.4544000029563904},{"id":"https://openalex.org/C74172769","wikidata":"https://www.wikidata.org/wiki/Q1446839","display_name":"Routing (electronic design automation)","level":2,"score":0.4424999952316284},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.43549999594688416},{"id":"https://openalex.org/C169851745","wikidata":"https://www.wikidata.org/wiki/Q1331985","display_name":"Overlay network","level":3,"score":0.42309999465942383},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.40310001373291016},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.35420000553131104},{"id":"https://openalex.org/C2780609101","wikidata":"https://www.wikidata.org/wiki/Q17156588","display_name":"Resource management (computing)","level":2,"score":0.3540000021457672},{"id":"https://openalex.org/C51332947","wikidata":"https://www.wikidata.org/wiki/Q1172305","display_name":"Shared resource","level":2,"score":0.31150001287460327},{"id":"https://openalex.org/C2780378061","wikidata":"https://www.wikidata.org/wiki/Q25351891","display_name":"Service (business)","level":2,"score":0.30970001220703125},{"id":"https://openalex.org/C205875254","wikidata":"https://www.wikidata.org/wiki/Q17156857","display_name":"Decentralised system","level":3,"score":0.289900004863739},{"id":"https://openalex.org/C104954878","wikidata":"https://www.wikidata.org/wiki/Q1648707","display_name":"Routing protocol","level":3,"score":0.28049999475479126},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.27549999952316284},{"id":"https://openalex.org/C89611455","wikidata":"https://www.wikidata.org/wiki/Q6804646","display_name":"Mechanism (biology)","level":2,"score":0.2734000086784363},{"id":"https://openalex.org/C195563490","wikidata":"https://www.wikidata.org/wiki/Q180368","display_name":"Network congestion","level":3,"score":0.2567000091075897}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.23919/cnsm67658.2025.11297572","is_oa":false,"landing_page_url":"https://doi.org/10.23919/cnsm67658.2025.11297572","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 21st International Conference on Network and Service Management (CNSM)","raw_type":"proceedings-article"},{"id":"pmh:oai:arpi.unipi.it:11568/1347688","is_oa":false,"landing_page_url":"https://hdl.handle.net/11568/1347688","pdf_url":null,"source":{"id":"https://openalex.org/S4377196265","display_name":"CINECA IRIS Institutial research information system (University of Pisa)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I108290504","host_organization_name":"University of Pisa","host_organization_lineage":["https://openalex.org/I108290504"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/conferenceObject"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":7,"referenced_works":["https://openalex.org/W2099618002","https://openalex.org/W3108110215","https://openalex.org/W4316659488","https://openalex.org/W4385210519","https://openalex.org/W4392152258","https://openalex.org/W4392507942","https://openalex.org/W4412836831"],"related_works":[],"abstract_inverted_index":{"Modern":[0],"Software-Defined":[1],"Wide":[2],"Area":[3],"Network":[4],"(SDWAN)":[5],"deployments":[6],"are":[7],"required":[8],"to":[9,38,48,114],"manage":[10],"traffic":[11],"over":[12],"heterogeneous":[13],"underlay":[14],"networks":[15],"while":[16,119],"meeting":[17],"stringent":[18],"Quality":[19],"of":[20,98,164],"Service":[21],"(QoS)":[22],"requirements.":[23],"In":[24],"scenarios":[25],"where":[26],"multiple":[27],"branches":[28],"share":[29],"overlay":[30,70,174],"resources,":[31],"independent":[32],"tunnel":[33],"selection":[34,71],"decisions":[35,99],"often":[36],"lead":[37],"congestion":[39],"and":[40,151,170],"degraded":[41],"performance.":[42],"Existing":[43],"approaches":[44],"lack":[45],"coordination":[46],"mechanisms":[47],"handle":[49],"the":[50,89,95,104,162],"dynamic":[51],"interactions":[52],"between":[53],"agents":[54,113],"competing":[55],"for":[56,68,94],"shared":[57,173],"resources.":[58],"This":[59],"paper":[60],"presents":[61],"a":[62,130,155],"Multi-Agent":[63],"Reinforcement":[64],"Learning":[65],"(MARL)":[66],"framework":[67],"distributed":[69],"in":[72,154,166],"SD-WANs.":[73],"Each":[74],"branch":[75],"is":[76],"modeled":[77],"as":[78],"an":[79],"autonomous":[80],"agent":[81],"that":[82,135],"learns":[83],"routing":[84],"policies":[85],"through":[86],"interaction":[87],"with":[88,107,140],"network":[90],"environment.":[91,158],"To":[92,124],"account":[93],"mutual":[96],"impact":[97],"across":[100],"branches,":[101],"we":[102,128],"adopt":[103],"Centralized":[105],"Training":[106],"Decentralized":[108],"Execution":[109],"(CTDE)":[110],"paradigm,":[111],"enabling":[112],"learn":[115],"globally":[116],"consistent":[117],"behaviors":[118],"preserving":[120],"scalability":[121],"at":[122],"inference.":[123],"encourage":[125],"cooperative":[126],"policies,":[127],"introduce":[129],"$\\lambda$-weighted":[131],"reward":[132],"shaping":[133],"mechanism":[134],"balances":[136],"local":[137],"QoS":[138],"goals":[139],"global":[141],"resource":[142,168],"fairness.":[143],"We":[144],"evaluate":[145],"our":[146],"approach":[147],"using":[148],"both":[149],"PPO":[150],"DQN":[152],"algorithms":[153],"simulated":[156],"SD-WAN":[157],"The":[159],"findings":[160],"highlight":[161],"necessity":[163],"MARL":[165],"addressing":[167],"contention":[169],"ensuring":[171],"equitable":[172],"utilization.":[175]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-12-22T00:00:00"}
