{"id":"https://openalex.org/W2933570795","doi":"https://doi.org/10.1109/tcyb.2019.2904742","title":"Cooperative Deep Reinforcement Learning for Large-Scale Traffic Grid Signal Control","display_name":"Cooperative Deep Reinforcement Learning for Large-Scale Traffic Grid Signal Control","publication_year":2019,"publication_date":"2019-03-29","ids":{"openalex":"https://openalex.org/W2933570795","doi":"https://doi.org/10.1109/tcyb.2019.2904742","mag":"2933570795","pmid":"https://pubmed.ncbi.nlm.nih.gov/30946688"},"language":"en","primary_location":{"id":"doi:10.1109/tcyb.2019.2904742","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcyb.2019.2904742","pdf_url":null,"source":{"id":"https://openalex.org/S4210191041","display_name":"IEEE Transactions on Cybernetics","issn_l":"2168-2267","issn":["2168-2267","2168-2275"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Cybernetics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101667380","display_name":"Tian Tan","orcid":"https://orcid.org/0000-0001-9173-2984"},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Tian Tan","raw_affiliation_strings":["Department of Civil and Environmental Engineering, Stanford University, Stanford, USA"],"raw_orcid":"https://orcid.org/0000-0001-9173-2984","affiliations":[{"raw_affiliation_string":"Department of Civil and Environmental Engineering, Stanford University, Stanford, USA","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022735755","display_name":"Feng Bao","orcid":"https://orcid.org/0000-0002-5721-9551"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Feng Bao","raw_affiliation_strings":["Department of Automation, Tsinghua National Laboratory for Information Science and Technology, Tsinghua University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-5721-9551","affiliations":[{"raw_affiliation_string":"Department of Automation, Tsinghua National Laboratory for Information Science and Technology, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082404485","display_name":"Yue Deng","orcid":"https://orcid.org/0000-0003-2871-8922"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yue Deng","raw_affiliation_strings":["School of Astronautics, Beihang University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0003-2871-8922","affiliations":[{"raw_affiliation_string":"School of Astronautics, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085670252","display_name":"Alex Jin","orcid":null},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Alex Jin","raw_affiliation_strings":["Computer Science Department, Stanford University, Stanford, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Computer Science Department, Stanford University, Stanford, USA","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080722708","display_name":"Qionghai Dai","orcid":"https://orcid.org/0000-0001-7043-3061"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qionghai Dai","raw_affiliation_strings":["Department of Automation, Tsinghua National Laboratory for Information Science and Technology, Tsinghua University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-7043-3061","affiliations":[{"raw_affiliation_string":"Department of Automation, Tsinghua National Laboratory for Information Science and Technology, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101422661","display_name":"Jie Wang","orcid":"https://orcid.org/0000-0003-1857-5569"},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jie Wang","raw_affiliation_strings":["Department of Civil and Environmental Engineering, Stanford University, Stanford, USA"],"raw_orcid":"https://orcid.org/0000-0003-1857-5569","affiliations":[{"raw_affiliation_string":"Department of Civil and Environmental Engineering, Stanford University, Stanford, USA","institution_ids":["https://openalex.org/I97018004"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5101667380"],"corresponding_institution_ids":["https://openalex.org/I97018004"],"apc_list":null,"apc_paid":null,"fwci":19.892,"has_fulltext":false,"cited_by_count":228,"citation_normalized_percentile":{"value":0.99632682,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":100},"biblio":{"volume":"50","issue":"6","first_page":"2687","last_page":"2700"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10524","display_name":"Traffic control and management","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10524","display_name":"Traffic control and management","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10698","display_name":"Transportation Planning and Optimization","score":0.992900013923645,"subfield":{"id":"https://openalex.org/subfields/3313","display_name":"Transportation"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11344","display_name":"Traffic Prediction and Management Techniques","score":0.9854999780654907,"subfield":{"id":"https://openalex.org/subfields/2215","display_name":"Building and Construction"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.9035905003547668},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7602137327194214},{"id":"https://openalex.org/keywords/grid","display_name":"Grid","score":0.6635197401046753},{"id":"https://openalex.org/keywords/intuition","display_name":"Intuition","score":0.5029222369194031},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.4694347381591797},{"id":"https://openalex.org/keywords/traffic-simulation","display_name":"Traffic simulation","score":0.4285098910331726},{"id":"https://openalex.org/keywords/intelligent-transportation-system","display_name":"Intelligent transportation system","score":0.4268588423728943},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.34642165899276733},{"id":"https://openalex.org/keywords/intersection","display_name":"Intersection (aeronautics)","score":0.14902186393737793},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.09464713931083679},{"id":"https://openalex.org/keywords/transport-engineering","display_name":"Transport engineering","score":0.08876687288284302},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.0725502073764801}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.9035905003547668},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7602137327194214},{"id":"https://openalex.org/C187691185","wikidata":"https://www.wikidata.org/wiki/Q2020720","display_name":"Grid","level":2,"score":0.6635197401046753},{"id":"https://openalex.org/C132010649","wikidata":"https://www.wikidata.org/wiki/Q189222","display_name":"Intuition","level":2,"score":0.5029222369194031},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.4694347381591797},{"id":"https://openalex.org/C2778391309","wikidata":"https://www.wikidata.org/wiki/Q7832527","display_name":"Traffic simulation","level":3,"score":0.4285098910331726},{"id":"https://openalex.org/C47796450","wikidata":"https://www.wikidata.org/wiki/Q508378","display_name":"Intelligent transportation system","level":2,"score":0.4268588423728943},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.34642165899276733},{"id":"https://openalex.org/C64543145","wikidata":"https://www.wikidata.org/wiki/Q162942","display_name":"Intersection (aeronautics)","level":2,"score":0.14902186393737793},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.09464713931083679},{"id":"https://openalex.org/C22212356","wikidata":"https://www.wikidata.org/wiki/Q775325","display_name":"Transport engineering","level":1,"score":0.08876687288284302},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0725502073764801},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tcyb.2019.2904742","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcyb.2019.2904742","pdf_url":null,"source":{"id":"https://openalex.org/S4210191041","display_name":"IEEE Transactions on Cybernetics","issn_l":"2168-2267","issn":["2168-2267","2168-2275"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Cybernetics","raw_type":"journal-article"},{"id":"pmid:30946688","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/30946688","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on cybernetics","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1834506735","display_name":null,"funder_award_id":"Z181100003118014","funder_id":"https://openalex.org/F4320325902","funder_display_name":"Beijing Municipal Science and Technology Commission"},{"id":"https://openalex.org/G8883308132","display_name":null,"funder_award_id":"61327902","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320322392","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549"},{"id":"https://openalex.org/F4320325902","display_name":"Beijing Municipal Science and Technology Commission","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":67,"referenced_works":["https://openalex.org/W6043852","https://openalex.org/W32403112","https://openalex.org/W138497752","https://openalex.org/W1522301498","https://openalex.org/W1543115993","https://openalex.org/W1600744878","https://openalex.org/W1678713393","https://openalex.org/W1869778509","https://openalex.org/W1928215159","https://openalex.org/W1986659999","https://openalex.org/W1999371911","https://openalex.org/W2024564885","https://openalex.org/W2031530760","https://openalex.org/W2048041430","https://openalex.org/W2060338093","https://openalex.org/W2074500080","https://openalex.org/W2076063813","https://openalex.org/W2088171019","https://openalex.org/W2088595989","https://openalex.org/W2096538655","https://openalex.org/W2101786389","https://openalex.org/W2117359296","https://openalex.org/W2121863487","https://openalex.org/W2145143778","https://openalex.org/W2145339207","https://openalex.org/W2146087064","https://openalex.org/W2153002112","https://openalex.org/W2154997814","https://openalex.org/W2156271471","https://openalex.org/W2156387975","https://openalex.org/W2159721029","https://openalex.org/W2160085675","https://openalex.org/W2173248099","https://openalex.org/W2201581102","https://openalex.org/W2209913494","https://openalex.org/W2215378786","https://openalex.org/W2334782222","https://openalex.org/W2344786740","https://openalex.org/W2485902895","https://openalex.org/W2498017881","https://openalex.org/W2529203006","https://openalex.org/W2548134372","https://openalex.org/W2551113280","https://openalex.org/W2564150501","https://openalex.org/W2604427121","https://openalex.org/W2618682531","https://openalex.org/W2747046834","https://openalex.org/W2792596411","https://openalex.org/W2919115771","https://openalex.org/W2963011350","https://openalex.org/W2963864421","https://openalex.org/W2964121744","https://openalex.org/W3103910758","https://openalex.org/W4214717370","https://openalex.org/W4394672593","https://openalex.org/W6600255050","https://openalex.org/W6605711098","https://openalex.org/W6631190155","https://openalex.org/W6632417921","https://openalex.org/W6637319420","https://openalex.org/W6639086533","https://openalex.org/W6682889407","https://openalex.org/W6684921986","https://openalex.org/W6687681856","https://openalex.org/W6729224713","https://openalex.org/W6743051084","https://openalex.org/W7001212498"],"related_works":["https://openalex.org/W2364252372","https://openalex.org/W4234066492","https://openalex.org/W4306904969","https://openalex.org/W1998063895","https://openalex.org/W1967044713","https://openalex.org/W2138720691","https://openalex.org/W4362501864","https://openalex.org/W4380318855","https://openalex.org/W3084456289","https://openalex.org/W2133470120"],"abstract_inverted_index":{"Exploiting":[0],"reinforcement":[1,92],"learning":[2,93],"(RL)":[3],"for":[4],"traffic":[5,39,46,61,77,172,199],"congestion":[6],"reduction":[7],"is":[8,50,100],"a":[9,45,59,85,89,109,127,143],"frontier":[10],"topic":[11],"in":[12,18,41,188,201],"intelligent":[13],"transportation":[14],"research.":[15],"The":[16,96,174],"difficulty":[17],"this":[19,80],"problem":[20,86],"stems":[21],"from":[22,158],"the":[23,26,64,71,76,103,150,164,169,179,191],"inability":[24],"of":[25,44,73,111,190,193],"RL":[27,65,106,116,137,156],"agent":[28,133,153],"simultaneously":[29],"monitoring":[30],"multiple":[31,123],"signal":[32],"lights":[33],"when":[34,54],"taking":[35],"into":[36],"account":[37],"complicated":[38],"dynamics":[40],"different":[42,159],"regions":[43],"system.":[47],"Such":[48],"challenge":[49],"even":[51],"more":[52],"outstanding":[53],"forming":[55],"control":[56],"decisions":[57],"on":[58,184],"large-scale":[60,171],"grid,":[62],"where":[63],"action":[66],"space":[67],"grows":[68],"exponentially":[69],"with":[70,113,122,146],"number":[72,110,192],"intersections":[74],"within":[75],"grid.":[78,173],"In":[79],"paper,":[81],"we":[82,119],"tackle":[83],"such":[84],"by":[87],"proposing":[88],"cooperative":[90],"deep":[91],"(Coder)":[94],"framework.":[95],"intuition":[97],"behind":[98],"Coder":[99,121,181],"to":[101],"decompose":[102],"original":[104],"difficult":[105],"task":[107],"as":[108],"subproblems":[112],"relatively":[114],"easy":[115],"goals.":[117],"Accordingly,":[118],"implement":[120],"regional":[124,132,160],"agents":[125,161],"and":[126,139,162],"centralized":[128,151],"global":[129,152],"agent.":[130],"Each":[131],"learns":[134],"its":[135],"own":[136],"policy":[138],"value":[140],"functions":[141],"over":[142,168],"small":[144],"region":[145],"limited":[147],"actions.":[148],"Then,":[149],"hierarchically":[154],"aggregates":[155],"achievements":[157],"forms":[163],"final":[165],"Q":[166],"-function":[167],"entire":[170],"experimental":[175],"investigations":[176],"demonstrate":[177],"that":[178],"proposed":[180],"could":[182],"reduce":[183],"average":[185],"30%":[186],"congestions":[187],"terms":[189],"waiting":[194],"vehicles":[195],"during":[196],"high":[197],"density":[198],"flows":[200],"simulations.":[202]},"counts_by_year":[{"year":2026,"cited_by_count":7},{"year":2025,"cited_by_count":25},{"year":2024,"cited_by_count":38},{"year":2023,"cited_by_count":40},{"year":2022,"cited_by_count":43},{"year":2021,"cited_by_count":44},{"year":2020,"cited_by_count":26},{"year":2019,"cited_by_count":5}],"updated_date":"2026-05-16T08:24:45.110214","created_date":"2025-10-10T00:00:00"}
