{"id":"https://openalex.org/W4415427998","doi":"https://doi.org/10.3233/faia251266","title":"GraphSem: Robust Multi-Agent Reinforcement Learning via Semantic-Graph Communication","display_name":"GraphSem: Robust Multi-Agent Reinforcement Learning via Semantic-Graph Communication","publication_year":2025,"publication_date":"2025-10-21","ids":{"openalex":"https://openalex.org/W4415427998","doi":"https://doi.org/10.3233/faia251266"},"language":null,"primary_location":{"id":"doi:10.3233/faia251266","is_oa":true,"landing_page_url":"https://doi.org/10.3233/faia251266","pdf_url":null,"source":{"id":"https://openalex.org/S4210201731","display_name":"Frontiers in artificial intelligence and applications","issn_l":"0922-6389","issn":["0922-6389","1879-8314"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Artificial Intelligence and Applications","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://doi.org/10.3233/faia251266","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5027931296","display_name":"Zaipeng Xie","orcid":"https://orcid.org/0000-0003-1637-1511"},"institutions":[{"id":"https://openalex.org/I4210155611","display_name":"Ministry of Water Resources of the People's Republic of China","ror":"https://ror.org/04e698d63","country_code":"CN","type":"government","lineage":["https://openalex.org/I4210155611"]},{"id":"https://openalex.org/I163340411","display_name":"Hohai University","ror":"https://ror.org/01wd4xt90","country_code":"CN","type":"education","lineage":["https://openalex.org/I163340411"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zaipeng Xie","raw_affiliation_strings":["College of Computer Science and Software Engineering, Hohai University, Nanjing, China","Key Laboratory of Water Big Data Technology of Ministry of Water Resources, Hohai University, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Software Engineering, Hohai University, Nanjing, China","institution_ids":["https://openalex.org/I163340411"]},{"raw_affiliation_string":"Key Laboratory of Water Big Data Technology of Ministry of Water Resources, Hohai University, Nanjing, China","institution_ids":["https://openalex.org/I163340411","https://openalex.org/I4210155611"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100680832","display_name":"Yaowu Wang","orcid":"https://orcid.org/0000-0001-8853-8988"},"institutions":[{"id":"https://openalex.org/I163340411","display_name":"Hohai University","ror":"https://ror.org/01wd4xt90","country_code":"CN","type":"education","lineage":["https://openalex.org/I163340411"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yaowu Wang","raw_affiliation_strings":["College of Computer Science and Software Engineering, Hohai University, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Software Engineering, Hohai University, Nanjing, China","institution_ids":["https://openalex.org/I163340411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027713037","display_name":"Sitong Shen","orcid":"https://orcid.org/0009-0003-4841-8414"},"institutions":[{"id":"https://openalex.org/I163340411","display_name":"Hohai University","ror":"https://ror.org/01wd4xt90","country_code":"CN","type":"education","lineage":["https://openalex.org/I163340411"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Sitong Shen","raw_affiliation_strings":["College of Computer Science and Software Engineering, Hohai University, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Software Engineering, Hohai University, Nanjing, China","institution_ids":["https://openalex.org/I163340411"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100460591","display_name":"Jianan Zhang","orcid":"https://orcid.org/0000-0003-3318-2165"},"institutions":[{"id":"https://openalex.org/I163340411","display_name":"Hohai University","ror":"https://ror.org/01wd4xt90","country_code":"CN","type":"education","lineage":["https://openalex.org/I163340411"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jianan Zhang","raw_affiliation_strings":["College of Computer Science and Software Engineering, Hohai University, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Software Engineering, Hohai University, Nanjing, China","institution_ids":["https://openalex.org/I163340411"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5027931296"],"corresponding_institution_ids":["https://openalex.org/I163340411","https://openalex.org/I4210155611"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.50371654,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.8952000141143799,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.8952000141143799,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7657999992370605},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.5309000015258789},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.48829999566078186},{"id":"https://openalex.org/keywords/limiting","display_name":"Limiting","score":0.47870001196861267},{"id":"https://openalex.org/keywords/sample","display_name":"Sample (material)","score":0.32679998874664307},{"id":"https://openalex.org/keywords/encoding","display_name":"Encoding (memory)","score":0.31220000982284546}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7657999992370605},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.739799976348877},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.5309000015258789},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.48829999566078186},{"id":"https://openalex.org/C188198153","wikidata":"https://www.wikidata.org/wiki/Q1613840","display_name":"Limiting","level":2,"score":0.47870001196861267},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.44670000672340393},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.38989999890327454},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3393000066280365},{"id":"https://openalex.org/C198531522","wikidata":"https://www.wikidata.org/wiki/Q485146","display_name":"Sample (material)","level":2,"score":0.32679998874664307},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.31220000982284546},{"id":"https://openalex.org/C101765175","wikidata":"https://www.wikidata.org/wiki/Q577764","display_name":"Communications system","level":2,"score":0.2930999994277954},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.29100000858306885},{"id":"https://openalex.org/C8272713","wikidata":"https://www.wikidata.org/wiki/Q176737","display_name":"Stochastic process","level":2,"score":0.27239999175071716},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.27239999175071716}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.3233/faia251266","is_oa":true,"landing_page_url":"https://doi.org/10.3233/faia251266","pdf_url":null,"source":{"id":"https://openalex.org/S4210201731","display_name":"Frontiers in artificial intelligence and applications","issn_l":"0922-6389","issn":["0922-6389","1879-8314"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Artificial Intelligence and Applications","raw_type":"book-chapter"}],"best_oa_location":{"id":"doi:10.3233/faia251266","is_oa":true,"landing_page_url":"https://doi.org/10.3233/faia251266","pdf_url":null,"source":{"id":"https://openalex.org/S4210201731","display_name":"Frontiers in artificial intelligence and applications","issn_l":"0922-6389","issn":["0922-6389","1879-8314"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Artificial Intelligence and Applications","raw_type":"book-chapter"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Multi-agent":[0],"reinforcement":[1],"learning":[2],"has":[3],"achieved":[4],"substantial":[5],"progress":[6],"under":[7,48,154],"the":[8],"centralized":[9],"training":[10],"with":[11,122],"decentralized":[12],"execution":[13],"framework.":[14],"However,":[15],"most":[16],"existing":[17],"methods":[18],"assume":[19],"deterministic":[20],"and":[21,51,73,97,108,141,152],"noise-free":[22],"local":[23],"observations,":[24,64],"limiting":[25],"applicability":[26],"to":[27,44,59,94,126,147],"real-world":[28,87],"environments":[29],"characterized":[30],"by":[31],"stochastic":[32,155],"partial":[33],"observability.":[34],"This":[35],"paper":[36],"introduces":[37],"GraphSem,":[38],"a":[39],"semantic-graph":[40],"communication":[41,71,143],"framework":[42],"designed":[43],"enhance":[45],"agent":[46],"coordination":[47,120],"observation":[49],"uncertainty":[50],"randomized":[52],"initial":[53,98],"conditions.":[54,156],"Graph-Sem":[55],"employs":[56],"Transformer-based":[57],"encoders":[58],"abstract":[60],"higher-level":[61],"features":[62,68],"from":[63],"selectively":[65],"transmits":[66],"these":[67],"via":[69],"dynamic":[70],"weighting,":[72],"fuses":[74],"inter-agent":[75],"information":[76],"through":[77],"an":[78],"attention-guided":[79],"graph":[80],"convolutional":[81],"network.":[82],"To":[83],"approximate":[84],"aspects":[85],"of":[86,106,124],"sensing":[88],"challenges,":[89],"we":[90],"introduce":[91],"controlled":[92],"stochasticity":[93],"both":[95],"observations":[96],"states":[99],"during":[100],"training.":[101],"Experiments":[102],"on":[103],"perturbed":[104],"variants":[105],"SMAC":[107],"Traffic":[109],"Junction":[110],"benchmarks":[111],"show":[112],"that":[113,135],"GraphSem":[114],"outperforms":[115],"state-of-the-art":[116],"baselines":[117],"across":[118],"diverse":[119],"tasks,":[121],"improvements":[123],"up":[125],"30.4%":[127],"in":[128],"average":[129],"win":[130],"rates.":[131],"Ablation":[132],"studies":[133],"suggest":[134],"semantic":[136],"encoding,":[137],"graph-based":[138],"message":[139],"fusion,":[140],"adaptive":[142],"mechanisms":[144],"collectively":[145],"contribute":[146],"enhanced":[148],"robustness,":[149],"sample":[150],"efficiency,":[151],"performance":[153]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-24T00:00:00"}
