{"id":"https://openalex.org/W3030840723","doi":"https://doi.org/10.1109/tvt.2020.2997896","title":"Multi-Agent Deep Reinforcement Learning for Urban Traffic Light Control in Vehicular Networks","display_name":"Multi-Agent Deep Reinforcement Learning for Urban Traffic Light Control in Vehicular Networks","publication_year":2020,"publication_date":"2020-05-28","ids":{"openalex":"https://openalex.org/W3030840723","doi":"https://doi.org/10.1109/tvt.2020.2997896","mag":"3030840723"},"language":"en","primary_location":{"id":"doi:10.1109/tvt.2020.2997896","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tvt.2020.2997896","pdf_url":null,"source":{"id":"https://openalex.org/S10936095","display_name":"IEEE Transactions on Vehicular Technology","issn_l":"0018-9545","issn":["0018-9545","1939-9359"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Vehicular Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://resolver.sub.uni-goettingen.de/purl?gro-2/135746","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5000348675","display_name":"Tong Wu","orcid":"https://orcid.org/0000-0002-7474-6943"},"institutions":[{"id":"https://openalex.org/I47720641","display_name":"Huazhong University of Science and Technology","ror":"https://ror.org/00p991c53","country_code":"CN","type":"education","lineage":["https://openalex.org/I47720641"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Tong Wu","raw_affiliation_strings":["School of Electrical Information and Communication Engineering, Huazhong University of Science & Technology, Wuhan, China"],"affiliations":[{"raw_affiliation_string":"School of Electrical Information and Communication Engineering, Huazhong University of Science & Technology, Wuhan, China","institution_ids":["https://openalex.org/I47720641"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100693197","display_name":"Pan Zhou","orcid":"https://orcid.org/0000-0002-8629-4622"},"institutions":[{"id":"https://openalex.org/I47720641","display_name":"Huazhong University of Science and Technology","ror":"https://ror.org/00p991c53","country_code":"CN","type":"education","lineage":["https://openalex.org/I47720641"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Pan Zhou","raw_affiliation_strings":["Hubei Engineering Research Center on Big Data Security, School of Cyber Science and Engineering, Huazhong University of Science & Technology, Wuhan, China"],"affiliations":[{"raw_affiliation_string":"Hubei Engineering Research Center on Big Data Security, School of Cyber Science and Engineering, Huazhong University of Science & Technology, Wuhan, China","institution_ids":["https://openalex.org/I47720641"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100399797","display_name":"Kai Liu","orcid":"https://orcid.org/0000-0001-5865-7724"},"institutions":[{"id":"https://openalex.org/I158842170","display_name":"Chongqing University","ror":"https://ror.org/023rhb549","country_code":"CN","type":"education","lineage":["https://openalex.org/I158842170"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kai Liu","raw_affiliation_strings":["College of Computer Science, Chongqing University, Chongqing, China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science, Chongqing University, Chongqing, China","institution_ids":["https://openalex.org/I158842170"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034831625","display_name":"Yali Yuan","orcid":"https://orcid.org/0000-0002-9258-9929"},"institutions":[{"id":"https://openalex.org/I74656192","display_name":"University of G\u00f6ttingen","ror":"https://ror.org/01y9bpm73","country_code":"DE","type":"education","lineage":["https://openalex.org/I74656192"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Yali Yuan","raw_affiliation_strings":["Institute of Computer Science, G\u00f6ttingen University, G\u00f6ttingen, Germany"],"affiliations":[{"raw_affiliation_string":"Institute of Computer Science, G\u00f6ttingen University, G\u00f6ttingen, Germany","institution_ids":["https://openalex.org/I74656192"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100732173","display_name":"Xiumin Wang","orcid":"https://orcid.org/0000-0002-3772-290X"},"institutions":[{"id":"https://openalex.org/I90610280","display_name":"South China University of Technology","ror":"https://ror.org/0530pts50","country_code":"CN","type":"education","lineage":["https://openalex.org/I90610280"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiumin Wang","raw_affiliation_strings":["School of Computer Science and Engineering, South China University of Technology, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, South China University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I90610280"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047931252","display_name":"Huawei Huang","orcid":"https://orcid.org/0000-0002-7035-6446"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Huawei Huang","raw_affiliation_strings":["School of Data and Computer Science, Sun Yat-Sen University, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"School of Data and Computer Science, Sun Yat-Sen University, Guangzhou, China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5001469325","display_name":"Dapeng Wu","orcid":"https://orcid.org/0000-0003-1755-0183"},"institutions":[{"id":"https://openalex.org/I33213144","display_name":"University of Florida","ror":"https://ror.org/02y3ad647","country_code":"US","type":"education","lineage":["https://openalex.org/I33213144"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Dapeng Oliver Wu","raw_affiliation_strings":["Department of Electrical and Computer Engineering, University of Florida, Gainesville, USA"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, University of Florida, Gainesville, USA","institution_ids":["https://openalex.org/I33213144"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5000348675"],"corresponding_institution_ids":["https://openalex.org/I47720641"],"apc_list":null,"apc_paid":null,"fwci":19.3386,"has_fulltext":false,"cited_by_count":284,"citation_normalized_percentile":{"value":0.99727986,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":100},"biblio":{"volume":"69","issue":"8","first_page":"8243","last_page":"8256"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10524","display_name":"Traffic control and management","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10524","display_name":"Traffic control and management","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11344","display_name":"Traffic Prediction and Management Techniques","score":0.9973000288009644,"subfield":{"id":"https://openalex.org/subfields/2215","display_name":"Building and Construction"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.9957000017166138,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.9159356355667114},{"id":"https://openalex.org/keywords/intersection","display_name":"Intersection (aeronautics)","score":0.7578567266464233},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6848620176315308},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.5013823509216309},{"id":"https://openalex.org/keywords/traffic-congestion","display_name":"Traffic congestion","score":0.46796566247940063},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.4032769799232483},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.36884987354278564},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.2511258125305176},{"id":"https://openalex.org/keywords/transport-engineering","display_name":"Transport engineering","score":0.16697600483894348}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.9159356355667114},{"id":"https://openalex.org/C64543145","wikidata":"https://www.wikidata.org/wiki/Q162942","display_name":"Intersection (aeronautics)","level":2,"score":0.7578567266464233},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6848620176315308},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.5013823509216309},{"id":"https://openalex.org/C2779888511","wikidata":"https://www.wikidata.org/wiki/Q244156","display_name":"Traffic congestion","level":2,"score":0.46796566247940063},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.4032769799232483},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.36884987354278564},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.2511258125305176},{"id":"https://openalex.org/C22212356","wikidata":"https://www.wikidata.org/wiki/Q775325","display_name":"Transport engineering","level":1,"score":0.16697600483894348},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tvt.2020.2997896","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tvt.2020.2997896","pdf_url":null,"source":{"id":"https://openalex.org/S10936095","display_name":"IEEE Transactions on Vehicular Technology","issn_l":"0018-9545","issn":["0018-9545","1939-9359"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Vehicular Technology","raw_type":"journal-article"},{"id":"pmh:oai:publications.goettingen-research-online.de:2/135746","is_oa":true,"landing_page_url":"https://resolver.sub.uni-goettingen.de/purl?gro-2/135746","pdf_url":null,"source":{"id":"https://openalex.org/S4306401634","display_name":"GoeScholar  The Publication Server of the Georg-August-Universit\u00e4t G\u00f6ttingen (Georg-August-Universit\u00e4t G\u00f6ttingen)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210122495","host_organization_name":"Asklepios Klinik St. Georg","host_organization_lineage":["https://openalex.org/I4210122495"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/article"}],"best_oa_location":{"id":"pmh:oai:publications.goettingen-research-online.de:2/135746","is_oa":true,"landing_page_url":"https://resolver.sub.uni-goettingen.de/purl?gro-2/135746","pdf_url":null,"source":{"id":"https://openalex.org/S4306401634","display_name":"GoeScholar  The Publication Server of the Georg-August-Universit\u00e4t G\u00f6ttingen (Georg-August-Universit\u00e4t G\u00f6ttingen)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210122495","host_organization_name":"Asklepios Klinik St. Georg","host_organization_lineage":["https://openalex.org/I4210122495"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/article"},"sustainable_development_goals":[{"score":0.5199999809265137,"display_name":"Sustainable cities and communities","id":"https://metadata.un.org/sdg/11"}],"awards":[{"id":"https://openalex.org/G1051005861","display_name":null,"funder_award_id":"61902445","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G1587288833","display_name":null,"funder_award_id":"19lgpy222","funder_id":"https://openalex.org/F4320335787","funder_display_name":"Fundamental Research Funds for the Central Universities"},{"id":"https://openalex.org/G5526602072","display_name":null,"funder_award_id":"61872150","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5817064308","display_name":null,"funder_award_id":"61972448","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8071503822","display_name":null,"funder_award_id":"2019A1515011798","funder_id":"https://openalex.org/F4320321921","funder_display_name":"Natural Science Foundation of Guangdong Province"},{"id":"https://openalex.org/G8722765671","display_name":null,"funder_award_id":"61872049","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320321921","display_name":"Natural Science Foundation of Guangdong Province","ror":null},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":65,"referenced_works":["https://openalex.org/W32403112","https://openalex.org/W33871791","https://openalex.org/W138497752","https://openalex.org/W1516835682","https://openalex.org/W1522301498","https://openalex.org/W1542941925","https://openalex.org/W1583936024","https://openalex.org/W1986659999","https://openalex.org/W2037067712","https://openalex.org/W2064675550","https://openalex.org/W2088595989","https://openalex.org/W2101460915","https://openalex.org/W2107846430","https://openalex.org/W2119567691","https://openalex.org/W2121092017","https://openalex.org/W2121863487","https://openalex.org/W2125001944","https://openalex.org/W2134295053","https://openalex.org/W2136029154","https://openalex.org/W2141554657","https://openalex.org/W2145339207","https://openalex.org/W2149012699","https://openalex.org/W2164732484","https://openalex.org/W2173248099","https://openalex.org/W2210077926","https://openalex.org/W2291973609","https://openalex.org/W2548134372","https://openalex.org/W2604427121","https://openalex.org/W2606342131","https://openalex.org/W2613084637","https://openalex.org/W2741077351","https://openalex.org/W2785315072","https://openalex.org/W2794842204","https://openalex.org/W2809148419","https://openalex.org/W2898015307","https://openalex.org/W2902021809","https://openalex.org/W2903512535","https://openalex.org/W2962938178","https://openalex.org/W2962992123","https://openalex.org/W2963039558","https://openalex.org/W2963407617","https://openalex.org/W2963658727","https://openalex.org/W2963864421","https://openalex.org/W2964121744","https://openalex.org/W2964247745","https://openalex.org/W3100789280","https://openalex.org/W3106357768","https://openalex.org/W4299802797","https://openalex.org/W6605711098","https://openalex.org/W6630901103","https://openalex.org/W6631190155","https://openalex.org/W6635087183","https://openalex.org/W6677939520","https://openalex.org/W6681027470","https://openalex.org/W6684921986","https://openalex.org/W6688475801","https://openalex.org/W6696783566","https://openalex.org/W6729224713","https://openalex.org/W6736372492","https://openalex.org/W6736714129","https://openalex.org/W6738796088","https://openalex.org/W6747941106","https://openalex.org/W6756414846","https://openalex.org/W6757046686","https://openalex.org/W7011621630"],"related_works":["https://openalex.org/W4306904969","https://openalex.org/W2138720691","https://openalex.org/W4362501864","https://openalex.org/W4380318855","https://openalex.org/W3084456289","https://openalex.org/W2024136090","https://openalex.org/W4391331176","https://openalex.org/W2031695474","https://openalex.org/W2586732548","https://openalex.org/W2348909947"],"abstract_inverted_index":{"As":[0],"urban":[1],"traffic":[2,13,28,64,90],"condition":[3],"is":[4,34,169],"diverse":[5],"and":[6,20,62,119,160,187,226,246,255],"complicated,":[7],"applying":[8],"reinforcement":[9,40],"learning":[10,41,58,100,132],"to":[11,25,56,108,144,154,171,190,213],"reduce":[12,161],"congestion":[14,254],"becomes":[15],"one":[16],"of":[17,31,112,130,167,175],"the":[18,27,60,98,110,116,128,157,162,173,176,205,210,216],"hot":[19],"promising":[21],"topics.":[22],"Especially,":[23],"how":[24],"coordinate":[26,123,247],"light":[29,91],"controllers":[30],"multiple":[32,248],"intersections":[33],"a":[35,71,233],"key":[36],"challenge":[37],"for":[38,89,194,224],"multi-agent":[39,73],"(MARL).":[42],"Most":[43],"existing":[44],"MARL":[45],"studies":[46],"are":[47],"based":[48,81],"on":[49,82],"traditional":[50],"Q-learning,":[51],"but":[52,207],"unstable":[53],"environment":[54,177],"leads":[55],"poor":[57,131],"in":[59,94,101,115,151,232,243],"complicated":[61],"dynamic":[63],"scenarios.":[65],"In":[66],"this":[67],"paper,":[68],"we":[69,200,219],"propose":[70],"novel":[72],"recurrent":[74],"deep":[75,83],"deterministic":[76,84],"policy":[77,85],"gradient":[78,86],"(MARDDPG)":[79],"algorithm":[80,88],"(DDPG)":[87],"control":[92],"(TLC)":[93],"vehiclar":[95],"networks.":[96],"Specifically,":[97],"centralized":[99],"each":[102,106,120,125,142,195],"critic":[103],"network":[104,235],"enables":[105,141],"agent":[107,121,143],"estimate":[109],"policies":[111],"other":[113],"agents":[114],"decision-making":[117],"process":[118,159],"can":[122,240],"with":[124],"other,":[126],"alleviating":[127],"problem":[129],"performance":[133],"caused":[134,178],"by":[135,179],"environmental":[136],"instability.":[137],"The":[138,165,229],"decentralized":[139],"execution":[140],"make":[145],"decisions":[146],"independently.":[147],"We":[148,183],"share":[149],"parameters":[150],"actor":[152],"networks":[153,189],"speed":[155],"up":[156],"training":[158],"memory":[163],"footprint.":[164],"addition":[166],"LSTM":[168],"beneficial":[170],"alleviate":[172],"instability":[174],"partial":[180],"observable":[181],"state.":[182],"utilize":[184],"surveillance":[185],"cameras":[186],"vehicular":[188,234],"collect":[191],"status":[192],"information":[193],"intersection.":[196,217],"Unlike":[197],"previous":[198],"work,":[199],"have":[201],"not":[202],"only":[203],"considered":[204,209],"vehicle":[206,253],"also":[208,220],"pedestrians":[211],"waiting":[212],"pass":[214],"through":[215],"Moreover,":[218],"set":[221],"different":[222],"priorities":[223],"buses":[225],"ordinary":[227],"vehicles.":[228],"experimental":[230],"results":[231],"show":[236],"that":[237],"our":[238],"method":[239],"run":[241],"stably":[242],"various":[244],"scenarios":[245],"intersections,":[249],"which":[250],"significantly":[251],"reduces":[252],"pedestrian":[256],"congestion.":[257]},"counts_by_year":[{"year":2026,"cited_by_count":12},{"year":2025,"cited_by_count":70},{"year":2024,"cited_by_count":72},{"year":2023,"cited_by_count":54},{"year":2022,"cited_by_count":37},{"year":2021,"cited_by_count":35},{"year":2020,"cited_by_count":4}],"updated_date":"2026-04-11T08:14:18.477133","created_date":"2025-10-10T00:00:00"}
