{"id":"https://openalex.org/W4377022102","doi":"https://doi.org/10.1080/23307706.2023.2195408","title":"Multi-agent deep reinforcement learning with traffic flow for traffic signal control","display_name":"Multi-agent deep reinforcement learning with traffic flow for traffic signal control","publication_year":2023,"publication_date":"2023-05-18","ids":{"openalex":"https://openalex.org/W4377022102","doi":"https://doi.org/10.1080/23307706.2023.2195408"},"language":"en","primary_location":{"id":"doi:10.1080/23307706.2023.2195408","is_oa":false,"landing_page_url":"https://doi.org/10.1080/23307706.2023.2195408","pdf_url":null,"source":{"id":"https://openalex.org/S2475925340","display_name":"Journal of Control and Decision","issn_l":"2330-7706","issn":["2330-7706","2330-7714"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320547","host_organization_name":"Taylor & Francis","host_organization_lineage":["https://openalex.org/P4310320547"],"host_organization_lineage_names":["Taylor & Francis"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Control and Decision","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5088339001","display_name":"Liang Hou","orcid":"https://orcid.org/0000-0002-0151-6987"},"institutions":[{"id":"https://openalex.org/I22716506","display_name":"Lanzhou University of Technology","ror":"https://ror.org/03panb555","country_code":"CN","type":"education","lineage":["https://openalex.org/I22716506"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Liang Hou","raw_affiliation_strings":["College of Computer and Communication, Lanzhou University of Technology, Lanzhou, People\u2019s Republic of China","College of Computer and Communication, Lanzhou University of Technology, Lanzhou, People's Republic of China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"College of Computer and Communication, Lanzhou University of Technology, Lanzhou, People\u2019s Republic of China","institution_ids":["https://openalex.org/I22716506"]},{"raw_affiliation_string":"College of Computer and Communication, Lanzhou University of Technology, Lanzhou, People's Republic of China","institution_ids":["https://openalex.org/I22716506"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065445833","display_name":"Dailin Huang","orcid":"https://orcid.org/0000-0003-0750-137X"},"institutions":[{"id":"https://openalex.org/I22716506","display_name":"Lanzhou University of Technology","ror":"https://ror.org/03panb555","country_code":"CN","type":"education","lineage":["https://openalex.org/I22716506"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Dailin Huang","raw_affiliation_strings":["College of Computer and Communication, Lanzhou University of Technology, Lanzhou, People\u2019s Republic of China","College of Computer and Communication, Lanzhou University of Technology, Lanzhou, People's Republic of China"],"raw_orcid":"https://orcid.org/0000-0003-0750-137X","affiliations":[{"raw_affiliation_string":"College of Computer and Communication, Lanzhou University of Technology, Lanzhou, People\u2019s Republic of China","institution_ids":["https://openalex.org/I22716506"]},{"raw_affiliation_string":"College of Computer and Communication, Lanzhou University of Technology, Lanzhou, People's Republic of China","institution_ids":["https://openalex.org/I22716506"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101752375","display_name":"Jie Cao","orcid":"https://orcid.org/0000-0003-0481-5170"},"institutions":[{"id":"https://openalex.org/I22716506","display_name":"Lanzhou University of Technology","ror":"https://ror.org/03panb555","country_code":"CN","type":"education","lineage":["https://openalex.org/I22716506"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jie Cao","raw_affiliation_strings":["College of Computer and Communication, Lanzhou University of Technology, Lanzhou, People\u2019s Republic of China","Engineering Research Center of Manufacturing Information of Gansu Province, Lanzhou, People\u2019s Republic of China","College of Computer and Communication, Lanzhou University of Technology, Lanzhou, People's Republic of China","Engineering Research Center of Manufacturing Information of Gansu Province, Lanzhou, People's Republic of China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"College of Computer and Communication, Lanzhou University of Technology, Lanzhou, People\u2019s Republic of China","institution_ids":["https://openalex.org/I22716506"]},{"raw_affiliation_string":"Engineering Research Center of Manufacturing Information of Gansu Province, Lanzhou, People\u2019s Republic of China","institution_ids":[]},{"raw_affiliation_string":"College of Computer and Communication, Lanzhou University of Technology, Lanzhou, People's Republic of China","institution_ids":["https://openalex.org/I22716506"]},{"raw_affiliation_string":"Engineering Research Center of Manufacturing Information of Gansu Province, Lanzhou, People's Republic of China","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5046172069","display_name":"Jialin Ma","orcid":"https://orcid.org/0000-0003-3255-4158"},"institutions":[{"id":"https://openalex.org/I22716506","display_name":"Lanzhou University of Technology","ror":"https://ror.org/03panb555","country_code":"CN","type":"education","lineage":["https://openalex.org/I22716506"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jialin Ma","raw_affiliation_strings":["College of Computer and Communication, Lanzhou University of Technology, Lanzhou, People\u2019s Republic of China","College of Computer and Communication, Lanzhou University of Technology, Lanzhou, People's Republic of China"],"raw_orcid":"https://orcid.org/0000-0003-3255-4158","affiliations":[{"raw_affiliation_string":"College of Computer and Communication, Lanzhou University of Technology, Lanzhou, People\u2019s Republic of China","institution_ids":["https://openalex.org/I22716506"]},{"raw_affiliation_string":"College of Computer and Communication, Lanzhou University of Technology, Lanzhou, People's Republic of China","institution_ids":["https://openalex.org/I22716506"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5065445833"],"corresponding_institution_ids":["https://openalex.org/I22716506"],"apc_list":null,"apc_paid":null,"fwci":0.8967,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.73443535,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":"12","issue":"1","first_page":"81","last_page":"92"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10524","display_name":"Traffic control and management","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10524","display_name":"Traffic control and management","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11344","display_name":"Traffic Prediction and Management Techniques","score":0.995199978351593,"subfield":{"id":"https://openalex.org/subfields/2215","display_name":"Building and Construction"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10698","display_name":"Transportation Planning and Optimization","score":0.9905999898910522,"subfield":{"id":"https://openalex.org/subfields/3313","display_name":"Transportation"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8155868649482727},{"id":"https://openalex.org/keywords/traffic-flow","display_name":"Traffic flow (computer networking)","score":0.7032716870307922},{"id":"https://openalex.org/keywords/intersection","display_name":"Intersection (aeronautics)","score":0.6970596313476562},{"id":"https://openalex.org/keywords/queue","display_name":"Queue","score":0.6327048540115356},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6177130937576294},{"id":"https://openalex.org/keywords/real-time-computing","display_name":"Real-time computing","score":0.5129156112670898},{"id":"https://openalex.org/keywords/signal","display_name":"SIGNAL (programming language)","score":0.4915812909603119},{"id":"https://openalex.org/keywords/traffic-congestion-reconstruction-with-kerners-three-phase-theory","display_name":"Traffic congestion reconstruction with Kerner's three-phase theory","score":0.4493850767612457},{"id":"https://openalex.org/keywords/flow-control","display_name":"Flow control (data)","score":0.440178781747818},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.41859573125839233},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.33586758375167847},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.23880666494369507},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.2283969223499298},{"id":"https://openalex.org/keywords/transport-engineering","display_name":"Transport engineering","score":0.1817266345024109},{"id":"https://openalex.org/keywords/traffic-congestion","display_name":"Traffic congestion","score":0.15621721744537354}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8155868649482727},{"id":"https://openalex.org/C207512268","wikidata":"https://www.wikidata.org/wiki/Q3074551","display_name":"Traffic flow (computer networking)","level":2,"score":0.7032716870307922},{"id":"https://openalex.org/C64543145","wikidata":"https://www.wikidata.org/wiki/Q162942","display_name":"Intersection (aeronautics)","level":2,"score":0.6970596313476562},{"id":"https://openalex.org/C160403385","wikidata":"https://www.wikidata.org/wiki/Q220543","display_name":"Queue","level":2,"score":0.6327048540115356},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6177130937576294},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.5129156112670898},{"id":"https://openalex.org/C2779843651","wikidata":"https://www.wikidata.org/wiki/Q7390335","display_name":"SIGNAL (programming language)","level":2,"score":0.4915812909603119},{"id":"https://openalex.org/C25492975","wikidata":"https://www.wikidata.org/wiki/Q960570","display_name":"Traffic congestion reconstruction with Kerner's three-phase theory","level":3,"score":0.4493850767612457},{"id":"https://openalex.org/C186766456","wikidata":"https://www.wikidata.org/wiki/Q612457","display_name":"Flow control (data)","level":2,"score":0.440178781747818},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.41859573125839233},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.33586758375167847},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.23880666494369507},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.2283969223499298},{"id":"https://openalex.org/C22212356","wikidata":"https://www.wikidata.org/wiki/Q775325","display_name":"Transport engineering","level":1,"score":0.1817266345024109},{"id":"https://openalex.org/C2779888511","wikidata":"https://www.wikidata.org/wiki/Q244156","display_name":"Traffic congestion","level":2,"score":0.15621721744537354},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C66938386","wikidata":"https://www.wikidata.org/wiki/Q633538","display_name":"Structural engineering","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1080/23307706.2023.2195408","is_oa":false,"landing_page_url":"https://doi.org/10.1080/23307706.2023.2195408","pdf_url":null,"source":{"id":"https://openalex.org/S2475925340","display_name":"Journal of Control and Decision","issn_l":"2330-7706","issn":["2330-7706","2330-7714"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320547","host_organization_name":"Taylor & Francis","host_organization_lineage":["https://openalex.org/P4310320547"],"host_organization_lineage_names":["Taylor & Francis"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Control and Decision","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.6399999856948853,"display_name":"Sustainable cities and communities","id":"https://metadata.un.org/sdg/11"}],"awards":[{"id":"https://openalex.org/G3325744198","display_name":null,"funder_award_id":"617630 28","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W32403112","https://openalex.org/W1482192533","https://openalex.org/W2058928902","https://openalex.org/W2104729914","https://openalex.org/W2112922813","https://openalex.org/W2120387195","https://openalex.org/W2129244926","https://openalex.org/W2145339207","https://openalex.org/W2155027007","https://openalex.org/W2165150801","https://openalex.org/W2492794003","https://openalex.org/W2622764302","https://openalex.org/W2734335288","https://openalex.org/W2746553466","https://openalex.org/W2766381093","https://openalex.org/W2794842204","https://openalex.org/W2809148419","https://openalex.org/W2915117209","https://openalex.org/W2917370556","https://openalex.org/W2933570795","https://openalex.org/W2965341638","https://openalex.org/W2983178256","https://openalex.org/W3023917962","https://openalex.org/W3106357768","https://openalex.org/W4231286818","https://openalex.org/W6688475801"],"related_works":["https://openalex.org/W4391115038","https://openalex.org/W1982014942","https://openalex.org/W1993589848","https://openalex.org/W2375665878","https://openalex.org/W2053400739","https://openalex.org/W2074943018","https://openalex.org/W2587362999","https://openalex.org/W4246936610","https://openalex.org/W4390987329","https://openalex.org/W2370594732"],"abstract_inverted_index":{"Multi-agent":[0],"Reinforcement":[1,71],"Learning":[2,72],"(MARL)":[3],"has":[4],"become":[5],"one":[6],"of":[7],"the":[8,51,67,81,86,94,102],"best":[9],"methods":[10],"in":[11,70],"Adaptive":[12],"Traffic":[13,17],"Signal":[14],"Control":[15],"(ATSC).":[16],"flow":[18,41,54,64],"is":[19,26,45,77],"a":[20,59],"very":[21],"regular":[22,82],"traffic":[23,40,53,63],"volume,":[24],"which":[25],"highly":[27],"critical":[28],"to":[29,47,66],"signal":[30],"control":[31,35],"policy.":[32],"However,":[33],"dynamic":[34],"policies":[36],"will":[37],"directly":[38],"affect":[39],"formation,":[42],"and":[43,85,97],"it":[44,76],"impossible":[46],"provide":[48],"observation":[49],"through":[50],"original":[52,103],"prediction.":[55],"This":[56],"paper":[57],"proposes":[58],"method":[60,91],"for":[61],"estimating":[62],"according":[65],"time":[68],"window":[69],"(RL)":[73],"training.":[74],"Therefore,":[75],"verified":[78],"on":[79],"both":[80],"road":[83,88],"network":[84],"real":[87],"network.":[89],"Our":[90],"further":[92],"reduces":[93],"intersection":[95],"delay":[96],"queue":[98],"length":[99],"compared":[100],"with":[101],"method.":[104]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":1}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
