{"id":"https://openalex.org/W2989915408","doi":"https://doi.org/10.1109/itsc.2019.8917268","title":"A Reinforcement Learning Approach for Intelligent Traffic Signal Control at Urban Intersections","display_name":"A Reinforcement Learning Approach for Intelligent Traffic Signal Control at Urban Intersections","publication_year":2019,"publication_date":"2019-10-01","ids":{"openalex":"https://openalex.org/W2989915408","doi":"https://doi.org/10.1109/itsc.2019.8917268","mag":"2989915408"},"language":"en","primary_location":{"id":"doi:10.1109/itsc.2019.8917268","is_oa":false,"landing_page_url":"https://doi.org/10.1109/itsc.2019.8917268","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE Intelligent Transportation Systems Conference (ITSC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5030001296","display_name":"Mengyu Guo","orcid":"https://orcid.org/0000-0002-9953-0073"},"institutions":[{"id":"https://openalex.org/I1304598786","display_name":"Program for Appropriate Technology in Health","ror":"https://ror.org/02ycvrx49","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I1304598786"]},{"id":"https://openalex.org/I95457486","display_name":"University of California, Berkeley","ror":"https://ror.org/01an7q238","country_code":"US","type":"education","lineage":["https://openalex.org/I95457486"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Mengyu Guo","raw_affiliation_strings":["California PATH, University of California, Berkeley, Richmond, CA, USA"],"affiliations":[{"raw_affiliation_string":"California PATH, University of California, Berkeley, Richmond, CA, USA","institution_ids":["https://openalex.org/I1304598786","https://openalex.org/I95457486"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100735652","display_name":"Pin Wang","orcid":"https://orcid.org/0000-0002-1400-4497"},"institutions":[{"id":"https://openalex.org/I95457486","display_name":"University of California, Berkeley","ror":"https://ror.org/01an7q238","country_code":"US","type":"education","lineage":["https://openalex.org/I95457486"]},{"id":"https://openalex.org/I1304598786","display_name":"Program for Appropriate Technology in Health","ror":"https://ror.org/02ycvrx49","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I1304598786"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Pin Wang","raw_affiliation_strings":["California PATH, University of California, Berkeley, Richmond, CA, USA"],"affiliations":[{"raw_affiliation_string":"California PATH, University of California, Berkeley, Richmond, CA, USA","institution_ids":["https://openalex.org/I1304598786","https://openalex.org/I95457486"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014661259","display_name":"Ching\u2010Yao Chan","orcid":"https://orcid.org/0000-0003-3992-2312"},"institutions":[{"id":"https://openalex.org/I95457486","display_name":"University of California, Berkeley","ror":"https://ror.org/01an7q238","country_code":"US","type":"education","lineage":["https://openalex.org/I95457486"]},{"id":"https://openalex.org/I1304598786","display_name":"Program for Appropriate Technology in Health","ror":"https://ror.org/02ycvrx49","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I1304598786"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ching-Yao Chan","raw_affiliation_strings":["California PATH, University of California, Berkeley, Richmond, CA, USA"],"affiliations":[{"raw_affiliation_string":"California PATH, University of California, Berkeley, Richmond, CA, USA","institution_ids":["https://openalex.org/I1304598786","https://openalex.org/I95457486"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5078079598","display_name":"Sid Askary","orcid":null},"institutions":[{"id":"https://openalex.org/I4210146936","display_name":"Huawei Technologies (United States)","ror":"https://ror.org/03jyqk712","country_code":"US","type":"company","lineage":["https://openalex.org/I2250955327","https://openalex.org/I4210146936"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sid Askary","raw_affiliation_strings":["Futurewei Technologies, Inc., Santa Clara, CA, USA"],"affiliations":[{"raw_affiliation_string":"Futurewei Technologies, Inc., Santa Clara, CA, USA","institution_ids":["https://openalex.org/I4210146936"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5030001296"],"corresponding_institution_ids":["https://openalex.org/I1304598786","https://openalex.org/I95457486"],"apc_list":null,"apc_paid":null,"fwci":4.8864,"has_fulltext":false,"cited_by_count":81,"citation_normalized_percentile":{"value":0.95677838,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"4242","last_page":"4247"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10524","display_name":"Traffic control and management","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10524","display_name":"Traffic control and management","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11344","display_name":"Traffic Prediction and Management Techniques","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/2215","display_name":"Building and Construction"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10698","display_name":"Transportation Planning and Optimization","score":0.9904000163078308,"subfield":{"id":"https://openalex.org/subfields/3313","display_name":"Transportation"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7252400517463684},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6800637245178223},{"id":"https://openalex.org/keywords/traffic-generation-model","display_name":"Traffic generation model","score":0.5939030051231384},{"id":"https://openalex.org/keywords/traffic-congestion-reconstruction-with-kerners-three-phase-theory","display_name":"Traffic congestion reconstruction with Kerner's three-phase theory","score":0.522713303565979},{"id":"https://openalex.org/keywords/floating-car-data","display_name":"Floating car data","score":0.48610472679138184},{"id":"https://openalex.org/keywords/signal","display_name":"SIGNAL (programming language)","score":0.48542651534080505},{"id":"https://openalex.org/keywords/traffic-congestion","display_name":"Traffic congestion","score":0.45590537786483765},{"id":"https://openalex.org/keywords/real-time-computing","display_name":"Real-time computing","score":0.4424440562725067},{"id":"https://openalex.org/keywords/queue","display_name":"Queue","score":0.43854567408561707},{"id":"https://openalex.org/keywords/traffic-simulation","display_name":"Traffic simulation","score":0.41822999715805054},{"id":"https://openalex.org/keywords/traffic-flow","display_name":"Traffic flow (computer networking)","score":0.41300472617149353},{"id":"https://openalex.org/keywords/simulation","display_name":"Simulation","score":0.32711705565452576},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2841661274433136},{"id":"https://openalex.org/keywords/intersection","display_name":"Intersection (aeronautics)","score":0.2636316120624542},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.22294124960899353},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.2143576443195343},{"id":"https://openalex.org/keywords/transport-engineering","display_name":"Transport engineering","score":0.1882058084011078}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7252400517463684},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6800637245178223},{"id":"https://openalex.org/C176715033","wikidata":"https://www.wikidata.org/wiki/Q2080768","display_name":"Traffic generation model","level":2,"score":0.5939030051231384},{"id":"https://openalex.org/C25492975","wikidata":"https://www.wikidata.org/wiki/Q960570","display_name":"Traffic congestion reconstruction with Kerner's three-phase theory","level":3,"score":0.522713303565979},{"id":"https://openalex.org/C64093975","wikidata":"https://www.wikidata.org/wiki/Q356677","display_name":"Floating car data","level":3,"score":0.48610472679138184},{"id":"https://openalex.org/C2779843651","wikidata":"https://www.wikidata.org/wiki/Q7390335","display_name":"SIGNAL (programming language)","level":2,"score":0.48542651534080505},{"id":"https://openalex.org/C2779888511","wikidata":"https://www.wikidata.org/wiki/Q244156","display_name":"Traffic congestion","level":2,"score":0.45590537786483765},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.4424440562725067},{"id":"https://openalex.org/C160403385","wikidata":"https://www.wikidata.org/wiki/Q220543","display_name":"Queue","level":2,"score":0.43854567408561707},{"id":"https://openalex.org/C2778391309","wikidata":"https://www.wikidata.org/wiki/Q7832527","display_name":"Traffic simulation","level":3,"score":0.41822999715805054},{"id":"https://openalex.org/C207512268","wikidata":"https://www.wikidata.org/wiki/Q3074551","display_name":"Traffic flow (computer networking)","level":2,"score":0.41300472617149353},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.32711705565452576},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2841661274433136},{"id":"https://openalex.org/C64543145","wikidata":"https://www.wikidata.org/wiki/Q162942","display_name":"Intersection (aeronautics)","level":2,"score":0.2636316120624542},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.22294124960899353},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.2143576443195343},{"id":"https://openalex.org/C22212356","wikidata":"https://www.wikidata.org/wiki/Q775325","display_name":"Transport engineering","level":1,"score":0.1882058084011078},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/itsc.2019.8917268","is_oa":false,"landing_page_url":"https://doi.org/10.1109/itsc.2019.8917268","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE Intelligent Transportation Systems Conference (ITSC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Sustainable cities and communities","id":"https://metadata.un.org/sdg/11","score":0.8299999833106995}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":32,"referenced_works":["https://openalex.org/W32403112","https://openalex.org/W41554520","https://openalex.org/W573924038","https://openalex.org/W1536680647","https://openalex.org/W1869778509","https://openalex.org/W1969758122","https://openalex.org/W2013961309","https://openalex.org/W2037067712","https://openalex.org/W2037248853","https://openalex.org/W2095733895","https://openalex.org/W2115211925","https://openalex.org/W2121863487","https://openalex.org/W2142842987","https://openalex.org/W2145339207","https://openalex.org/W2173564293","https://openalex.org/W2201581102","https://openalex.org/W2498017881","https://openalex.org/W2610461071","https://openalex.org/W2802508687","https://openalex.org/W2809148419","https://openalex.org/W2811198925","https://openalex.org/W2898015307","https://openalex.org/W2904906709","https://openalex.org/W2951799221","https://openalex.org/W2963477884","https://openalex.org/W2964247745","https://openalex.org/W3106357768","https://openalex.org/W6639086533","https://openalex.org/W6685444567","https://openalex.org/W6687681856","https://openalex.org/W6746966444","https://openalex.org/W6948057359"],"related_works":["https://openalex.org/W2972320057","https://openalex.org/W2587362999","https://openalex.org/W4386289889","https://openalex.org/W3117279048","https://openalex.org/W2945875309","https://openalex.org/W2410941711","https://openalex.org/W2009112536","https://openalex.org/W2898775471","https://openalex.org/W4391811515","https://openalex.org/W2161957991"],"abstract_inverted_index":{"Ineffective":[0],"and":[1,17,21,108,129,146,187,213,231],"inflexible":[2],"traffic":[3,15,27,39,51,76,97,123,136,164,175,195,205,239],"signal":[4,31,52,77,98,137,196,240],"control":[5,32,53,78,99,148,197],"at":[6,79],"urban":[7,38,80,156,169],"intersections":[8],"can":[9,105,112,200],"often":[10],"lead":[11],"to":[12,25,63,92,166,191,203],"bottlenecks":[13],"in":[14,37,44,142,226,238],"flows":[16],"cause":[18],"congestion,":[19],"delay,":[20],"environmental":[22],"problems.":[23],"How":[24],"manage":[26],"smartly":[28],"by":[29],"intelligent":[30],"is":[33,118],"a":[34,60,72,144,193],"big":[35],"challenge":[36],"management.":[40],"With":[41],"recent":[42],"advances":[43],"machine":[45,56],"learning,":[46],"especially":[47],"reinforcement":[48],"learning":[49,57],"(RL),":[50],"using":[54],"advanced":[55],"techniques":[58],"represents":[59],"promising":[61],"solution":[62],"tackle":[64],"this":[65,68],"problem.":[66],"In":[67],"paper,":[69],"we":[70,83,172],"propose":[71],"RL":[73,218],"approach":[74,219],"for":[75],"intersections.":[81,170],"Specifically,":[82],"use":[84,159,173],"neural":[85],"networks":[86],"as":[87,178,220,222],"Q-function":[88],"approximator":[89],"(a.k.a.":[90],"Q-network)":[91],"deal":[93],"with":[94],"the":[95,102,109,151,211],"complex":[96],"problem":[100],"where":[101],"state":[103,116],"space":[104,111,117,133],"be":[106,113,201],"huge":[107],"action":[110,132],"discrete.":[114],"The":[115,131,207],"defined":[119],"based":[120],"on":[121],"real-time":[122],"information,":[124],"i.e.":[125],"vehicle":[126],"position,":[127],"direction":[128],"speed.":[130],"includes":[134],"various":[135,204],"phases":[138],"which":[139],"are":[140],"critical":[141],"generating":[143],"reasonable":[145],"realistic":[147,168],"mechanism,":[149],"given":[150],"prominent":[152],"spatial-temporal":[153],"characteristics":[154],"of":[155,216,228],"traffic.":[157],"We":[158],"SUMO,":[160],"an":[161],"open":[162],"source":[163],"simulator,":[165],"construct":[167],"Moreover,":[171],"different":[174],"patterns,":[176],"such":[177],"major/minor":[179],"road":[180],"traffic,":[181,184,186,190],"through/left-turn":[182],"lane":[183],"tidal":[185],"varying":[188],"demand":[189],"train":[192],"generalized":[194],"model":[198],"that":[199],"adapted":[202],"conditions.":[206],"simulation":[208],"results":[209],"demonstrate":[210],"convergence":[212],"generalization":[214],"performance":[215],"our":[217],"well":[221],"its":[223],"significant":[224],"benefits":[225],"terms":[227],"queue":[229],"length":[230],"wait":[232],"time":[233],"over":[234],"several":[235],"benchmarking":[236],"methods":[237],"control.":[241]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":14},{"year":2024,"cited_by_count":17},{"year":2023,"cited_by_count":19},{"year":2022,"cited_by_count":17},{"year":2021,"cited_by_count":6},{"year":2020,"cited_by_count":6}],"updated_date":"2026-04-02T15:55:50.835912","created_date":"2025-10-10T00:00:00"}
