{"id":"https://openalex.org/W4394628748","doi":"https://doi.org/10.1109/cloudnet59005.2023.10490082","title":"RoMA: Resilient Multi-Agent Reinforcement Learning with Dynamic Participating Agents","display_name":"RoMA: Resilient Multi-Agent Reinforcement Learning with Dynamic Participating Agents","publication_year":2023,"publication_date":"2023-11-01","ids":{"openalex":"https://openalex.org/W4394628748","doi":"https://doi.org/10.1109/cloudnet59005.2023.10490082"},"language":"en","primary_location":{"id":"doi:10.1109/cloudnet59005.2023.10490082","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/cloudnet59005.2023.10490082","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE 12th International Conference on Cloud Networking (CloudNet)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5057903994","display_name":"Xuting Tang","orcid":null},"institutions":[{"id":"https://openalex.org/I108468826","display_name":"Stevens Institute of Technology","ror":"https://ror.org/02z43xh36","country_code":"US","type":"education","lineage":["https://openalex.org/I108468826"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xuting Tang","raw_affiliation_strings":["Stevens Institute of Technology,Computer Science Department,Hoboken,USA","Computer Science Department, Stevens Institute of Technology, Hoboken, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Stevens Institute of Technology,Computer Science Department,Hoboken,USA","institution_ids":["https://openalex.org/I108468826"]},{"raw_affiliation_string":"Computer Science Department, Stevens Institute of Technology, Hoboken, USA","institution_ids":["https://openalex.org/I108468826"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100296405","display_name":"Xu Jia","orcid":"https://orcid.org/0009-0009-6543-4188"},"institutions":[{"id":"https://openalex.org/I108468826","display_name":"Stevens Institute of Technology","ror":"https://ror.org/02z43xh36","country_code":"US","type":"education","lineage":["https://openalex.org/I108468826"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jia Xu","raw_affiliation_strings":["Stevens Institute of Technology,Computer Science Department,Hoboken,USA","Computer Science Department, Stevens Institute of Technology, Hoboken, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Stevens Institute of Technology,Computer Science Department,Hoboken,USA","institution_ids":["https://openalex.org/I108468826"]},{"raw_affiliation_string":"Computer Science Department, Stevens Institute of Technology, Hoboken, USA","institution_ids":["https://openalex.org/I108468826"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100661401","display_name":"Shusen Wang","orcid":"https://orcid.org/0000-0003-3928-6782"},"institutions":[{"id":"https://openalex.org/I862669128","display_name":"Xiaomi (China)","ror":"https://ror.org/029f7bn57","country_code":"CN","type":"company","lineage":["https://openalex.org/I862669128"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shusen Wang","raw_affiliation_strings":["Xiaohongshu Inc,Shanghai,China","Xiaohongshu Inc, Shanghai, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Xiaohongshu Inc,Shanghai,China","institution_ids":["https://openalex.org/I862669128"]},{"raw_affiliation_string":"Xiaohongshu Inc, Shanghai, China","institution_ids":["https://openalex.org/I862669128"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.1632,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.60542736,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"247","last_page":"255"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.7513999938964844,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.7513999938964844,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8278940916061401},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6560254096984863},{"id":"https://openalex.org/keywords/multi-agent-system","display_name":"Multi-agent system","score":0.42395636439323425},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.41978245973587036},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.38256555795669556},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.10884886980056763},{"id":"https://openalex.org/keywords/social-psychology","display_name":"Social psychology","score":0.07263946533203125}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8278940916061401},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6560254096984863},{"id":"https://openalex.org/C41550386","wikidata":"https://www.wikidata.org/wiki/Q529909","display_name":"Multi-agent system","level":2,"score":0.42395636439323425},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.41978245973587036},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.38256555795669556},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.10884886980056763},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.07263946533203125}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cloudnet59005.2023.10490082","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/cloudnet59005.2023.10490082","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE 12th International Conference on Cloud Networking (CloudNet)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W1522301498","https://openalex.org/W1542941925","https://openalex.org/W1606056663","https://openalex.org/W2091565802","https://openalex.org/W2133564696","https://openalex.org/W2267186426","https://openalex.org/W2602275733","https://openalex.org/W2617547828","https://openalex.org/W2913668833","https://openalex.org/W2978148161","https://openalex.org/W2991046523","https://openalex.org/W2996786181","https://openalex.org/W4225665995","https://openalex.org/W4299802797","https://openalex.org/W4385245566","https://openalex.org/W6631190155","https://openalex.org/W6679434410","https://openalex.org/W6738796088","https://openalex.org/W6748839928","https://openalex.org/W6749304979","https://openalex.org/W6755069753","https://openalex.org/W6768731700","https://openalex.org/W6784778700","https://openalex.org/W6788165329","https://openalex.org/W6792529980","https://openalex.org/W6795139234"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2920061524","https://openalex.org/W4310083477","https://openalex.org/W2328553770","https://openalex.org/W1977959518","https://openalex.org/W2038908348","https://openalex.org/W2107890255","https://openalex.org/W2106552856","https://openalex.org/W2145821588"],"abstract_inverted_index":{"This":[0],"paper":[1],"presents":[2],"RoMA,":[3],"a":[4,42,101,107,135,193],"novel":[5,102],"resilient":[6],"Multi-Agent":[7],"Reinforcement":[8],"Learning":[9],"(MARL)":[10],"framework":[11],"designed":[12],"to":[13,64,72,80,111,117,131,167,171,192],"handle":[14,177],"dynamic":[15],"participating":[16],"agents":[17,62,68,116,124,130,140,152,169,181],"during":[18,119],"centralized":[19,120],"training,":[20],"addressing":[21],"the":[22,113,132,142,150,178,184],"limitations":[23],"of":[24,38,88,115,180,186,196],"standard":[25,57,76],"MARL":[26,58,77,197],"frameworks":[27],"in":[28,52,134],"accommodating":[29],"agent":[30],"variability":[31],"and":[32,36,44,50,83,106,138,174,203],"enabling":[33],"efficient":[34],"adaptation":[35],"training":[37,49,143,149,185],"agents,":[39],"thus":[40],"providing":[41],"scalable":[43],"flexible":[45],"solution":[46],"for":[47],"model":[48],"execution":[51],"cloud":[53],"computing":[54],"environments.":[55,205],"For":[56],"frameworks,":[59],"if":[60],"new":[61,123,168],"need":[63,79],"join":[65],"or":[66],"existing":[67],"leave":[69,141],"unexpectedly":[70],"due":[71],"unreliable":[73],"communication":[74],"channels,":[75],"models":[78],"be":[81],"rebuilt":[82],"trained":[84],"from":[85],"scratch":[86],"because":[87],"their":[89],"structural":[90],"limitations,":[91],"which":[92],"is":[93,159,190],"very":[94],"time-consuming.":[95],"RoMA":[96,126,146,158,189],"addresses":[97],"this":[98],"issue":[99],"with":[100],"neural":[103],"network":[104],"architecture":[105],"few-shot":[108],"learning":[109],"algorithm":[110],"enable":[112],"number":[114],"vary":[118],"training.":[121],"When":[122],"join,":[125],"can":[127,147,176],"adapt":[128],"all":[129],"change":[133],"few":[136],"shots,":[137],"when":[139],"process":[144],"unexpectedly,":[145],"continue":[148],"remaining":[151],"without":[153,182],"disruption.Our":[154],"experiments":[155],"demonstrate":[156],"that":[157],"at":[160,165],"least":[161],"70":[162],"times":[163],"faster":[164],"adapting":[166],"compared":[170],"baseline":[172],"methods,":[173],"it":[175],"leaving":[179],"affecting":[183],"other":[187],"agents.":[188],"applicable":[191],"wide":[194],"range":[195],"settings,":[198],"including":[199],"cooperative,":[200],"competitive,":[201],"independent,":[202],"mixed":[204]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}