{"id":"https://openalex.org/W4205998584","doi":"https://doi.org/10.1145/3491396.3506544","title":"Multi-Agent Reinforcement Learning based on Two-Step Neighborhood Experience for Traffic Light Control","display_name":"Multi-Agent Reinforcement Learning based on Two-Step Neighborhood Experience for Traffic Light Control","publication_year":2021,"publication_date":"2021-12-28","ids":{"openalex":"https://openalex.org/W4205998584","doi":"https://doi.org/10.1145/3491396.3506544"},"language":"en","primary_location":{"id":"doi:10.1145/3491396.3506544","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3491396.3506544","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2021 ACM International Conference on Intelligent Computing and its Emerging Applications","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5057990943","display_name":"Yuchen Luo","orcid":"https://orcid.org/0000-0002-8754-1453"},"institutions":[{"id":"https://openalex.org/I142974352","display_name":"National Sun Yat-sen University","ror":"https://ror.org/00mjawt10","country_code":"TW","type":"education","lineage":["https://openalex.org/I142974352"]}],"countries":["TW"],"is_corresponding":true,"raw_author_name":"Yu-Chen Luo","raw_affiliation_strings":["Department of Computer Science and Engineering, National Sun Yat-sen University, Kaohsiung, Taiwan"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, National Sun Yat-sen University, Kaohsiung, Taiwan","institution_ids":["https://openalex.org/I142974352"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5057441996","display_name":"Chun\u2010Wei Tsai","orcid":"https://orcid.org/0000-0003-0128-4052"},"institutions":[{"id":"https://openalex.org/I142974352","display_name":"National Sun Yat-sen University","ror":"https://ror.org/00mjawt10","country_code":"TW","type":"education","lineage":["https://openalex.org/I142974352"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Chun-Wei Tsai","raw_affiliation_strings":["Department of Computer Science and Engineering, National Sun Yat-sen University, Kaohsiung, Taiwan"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, National Sun Yat-sen University, Kaohsiung, Taiwan","institution_ids":["https://openalex.org/I142974352"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5057990943"],"corresponding_institution_ids":["https://openalex.org/I142974352"],"apc_list":null,"apc_paid":null,"fwci":0.1373,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.48710114,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"28","last_page":"33"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10524","display_name":"Traffic control and management","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10524","display_name":"Traffic control and management","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10698","display_name":"Transportation Planning and Optimization","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/3313","display_name":"Transportation"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11344","display_name":"Traffic Prediction and Management Techniques","score":0.9858999848365784,"subfield":{"id":"https://openalex.org/subfields/2215","display_name":"Building and Construction"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8179547786712646},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7307712435722351},{"id":"https://openalex.org/keywords/intersection","display_name":"Intersection (aeronautics)","score":0.7164418697357178},{"id":"https://openalex.org/keywords/plan","display_name":"Plan (archaeology)","score":0.5336279273033142},{"id":"https://openalex.org/keywords/traffic-signal","display_name":"Traffic signal","score":0.5279518365859985},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.5243169069290161},{"id":"https://openalex.org/keywords/traffic-congestion","display_name":"Traffic congestion","score":0.48297634720802307},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.3648710250854492},{"id":"https://openalex.org/keywords/real-time-computing","display_name":"Real-time computing","score":0.27105116844177246},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.25066226720809937},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.19360923767089844},{"id":"https://openalex.org/keywords/transport-engineering","display_name":"Transport engineering","score":0.14686986804008484}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8179547786712646},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7307712435722351},{"id":"https://openalex.org/C64543145","wikidata":"https://www.wikidata.org/wiki/Q162942","display_name":"Intersection (aeronautics)","level":2,"score":0.7164418697357178},{"id":"https://openalex.org/C2776505523","wikidata":"https://www.wikidata.org/wiki/Q4785468","display_name":"Plan (archaeology)","level":2,"score":0.5336279273033142},{"id":"https://openalex.org/C2987419075","wikidata":"https://www.wikidata.org/wiki/Q8004","display_name":"Traffic signal","level":2,"score":0.5279518365859985},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.5243169069290161},{"id":"https://openalex.org/C2779888511","wikidata":"https://www.wikidata.org/wiki/Q244156","display_name":"Traffic congestion","level":2,"score":0.48297634720802307},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.3648710250854492},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.27105116844177246},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.25066226720809937},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.19360923767089844},{"id":"https://openalex.org/C22212356","wikidata":"https://www.wikidata.org/wiki/Q775325","display_name":"Transport engineering","level":1,"score":0.14686986804008484},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0},{"id":"https://openalex.org/C95457728","wikidata":"https://www.wikidata.org/wiki/Q309","display_name":"History","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3491396.3506544","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3491396.3506544","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2021 ACM International Conference on Intelligent Computing and its Emerging Applications","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Sustainable cities and communities","id":"https://metadata.un.org/sdg/11","score":0.8199999928474426}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":31,"referenced_works":["https://openalex.org/W33871791","https://openalex.org/W1641379095","https://openalex.org/W2017277097","https://openalex.org/W2031530760","https://openalex.org/W2074500080","https://openalex.org/W2076337359","https://openalex.org/W2088595989","https://openalex.org/W2106948551","https://openalex.org/W2125001944","https://openalex.org/W2146087064","https://openalex.org/W2260756217","https://openalex.org/W2395575420","https://openalex.org/W2402402867","https://openalex.org/W2498017881","https://openalex.org/W2530263920","https://openalex.org/W2548134372","https://openalex.org/W2761656023","https://openalex.org/W2801573006","https://openalex.org/W2907606902","https://openalex.org/W2915117209","https://openalex.org/W2964043796","https://openalex.org/W2964338167","https://openalex.org/W2995815314","https://openalex.org/W3125860949","https://openalex.org/W4236158019","https://openalex.org/W4288601262","https://openalex.org/W6601295022","https://openalex.org/W6637967152","https://openalex.org/W6669402789","https://openalex.org/W6986888325","https://openalex.org/W7001212498"],"related_works":["https://openalex.org/W4306904969","https://openalex.org/W2138720691","https://openalex.org/W4362501864","https://openalex.org/W4380318855","https://openalex.org/W2031695474","https://openalex.org/W2024136090","https://openalex.org/W2586732548","https://openalex.org/W4367838498","https://openalex.org/W3115426489","https://openalex.org/W4293167677"],"abstract_inverted_index":{"Several":[0],"recent":[1],"studies":[2],"pointed":[3],"out":[4],"that":[5,195],"an":[6,99,118,123,138],"effective":[7,119,124],"traffic":[8,18,50,79,97,112,140,162,216],"signal/light":[9],"control":[10,51,80,114,142,218],"strategy":[11],"will":[12],"be":[13,93],"able":[14],"to":[15,127,136,154],"mitigate":[16],"the":[17,42,73,78,104,107,111,129,157,167,170,181,196,207],"congestion":[19],"problem,":[20,115],"and":[21],"therefore":[22],"variants":[23],"of":[24,41,64,75,87,98,106,133,159,169,183,185,201],"solutions":[25],"have":[26],"been":[27],"presented":[28,150],"for":[29,53,95,161,215],"solving":[30,110],"this":[31,152,190,213],"optimization":[32],"problem.":[33],"The":[34,192],"multi-agent":[35],"reinforcement":[36],"learning":[37],"(MARL)":[38],"is":[39,149,199],"one":[40],"promising":[43],"methods":[44],"because":[45,58],"it":[46,175],"can":[47],"provide":[48],"good":[49],"strategies":[52],"such":[54,84],"complex":[55],"environments.":[56],"However,":[57],"each":[59],"agent":[60],"on":[61,83,122,180],"its":[62,76],"intersection":[63],"most":[65],"MARL-based":[66],"algorithms":[67,179,210],"has":[68],"only":[69],"partial":[70],"information":[71,86,130],"from":[72],"observations":[74],"intersection,":[77],"plan":[81],"based":[82,121],"incomplete":[85],"all":[88,206],"agents":[89,132],"may":[90],"not":[91],"always":[92],"useful":[94],"improving":[96],"entire":[100],"city.":[101],"To":[102,165],"enhance":[103],"performance":[105,158,168],"MARL":[108,160],"in":[109,151,189,212],"light":[113,141,163,217],"we":[116,173],"present":[117],"algorithm":[120,198],"communication":[125],"protocol":[126],"share":[128],"between":[131],"neighbor":[134],"intersections":[135],"make":[137],"integrated":[139],"plan.":[143],"Moreover,":[144],"a":[145],"two-step":[146],"decision":[147],"mechanism":[148],"study":[153,214],"further":[155],"improve":[156],"control.":[164],"evaluate":[166],"proposed":[171,197],"algorithm,":[172],"compared":[174,211],"with":[176],"several":[177],"message-passing-based":[178,209],"simulator":[182],"Simulation":[184],"Urban":[186],"MObility":[187],"(SUMO)":[188],"study.":[191],"results":[193,204],"show":[194],"capable":[200],"finding":[202],"better":[203],"than":[205],"other":[208],"problems.":[219]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2023,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
