{"id":"https://openalex.org/W3176187537","doi":"https://doi.org/10.1109/tits.2021.3091014","title":"Using Reinforcement Learning to Control Traffic Signals in a Real-World Scenario: An Approach Based on Linear Function Approximation","display_name":"Using Reinforcement Learning to Control Traffic Signals in a Real-World Scenario: An Approach Based on Linear Function Approximation","publication_year":2021,"publication_date":"2021-06-29","ids":{"openalex":"https://openalex.org/W3176187537","doi":"https://doi.org/10.1109/tits.2021.3091014","mag":"3176187537"},"language":"en","primary_location":{"id":"doi:10.1109/tits.2021.3091014","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tits.2021.3091014","pdf_url":null,"source":{"id":"https://openalex.org/S144771191","display_name":"IEEE Transactions on Intelligent Transportation Systems","issn_l":"1524-9050","issn":["1524-9050","1558-0016"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Intelligent Transportation Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5025381800","display_name":"Lucas N. Alegre","orcid":"https://orcid.org/0000-0001-5465-4390"},"institutions":[{"id":"https://openalex.org/I130442723","display_name":"Universidade Federal do Rio Grande do Sul","ror":"https://ror.org/041yk2d64","country_code":"BR","type":"education","lineage":["https://openalex.org/I130442723"]}],"countries":["BR"],"is_corresponding":true,"raw_author_name":"Lucas N. Alegre","raw_affiliation_strings":["Institute of Informatics, Federal University of Rio Grande do Sul, Porto Alegre, Brazil"],"raw_orcid":"https://orcid.org/0000-0001-5465-4390","affiliations":[{"raw_affiliation_string":"Institute of Informatics, Federal University of Rio Grande do Sul, Porto Alegre, Brazil","institution_ids":["https://openalex.org/I130442723"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018222536","display_name":"Theresa Ziemke","orcid":"https://orcid.org/0000-0001-8812-9041"},"institutions":[{"id":"https://openalex.org/I4577782","display_name":"Technische Universit\u00e4t Berlin","ror":"https://ror.org/03v4gjf40","country_code":"DE","type":"education","lineage":["https://openalex.org/I4577782"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Theresa Ziemke","raw_affiliation_strings":["Transport Systems Planning and Transport Telematics Department, Technische Universit&#x00E4;t Berlin, Berlin, Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Transport Systems Planning and Transport Telematics Department, Technische Universit&#x00E4;t Berlin, Berlin, Germany","institution_ids":["https://openalex.org/I4577782"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5028225369","display_name":"Ana L. C. Bazzan","orcid":"https://orcid.org/0000-0002-2803-9607"},"institutions":[{"id":"https://openalex.org/I130442723","display_name":"Universidade Federal do Rio Grande do Sul","ror":"https://ror.org/041yk2d64","country_code":"BR","type":"education","lineage":["https://openalex.org/I130442723"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"Ana L. C. Bazzan","raw_affiliation_strings":["Institute of Informatics, Federal University of Rio Grande do Sul, Porto Alegre, Brazil"],"raw_orcid":"https://orcid.org/0000-0002-2803-9607","affiliations":[{"raw_affiliation_string":"Institute of Informatics, Federal University of Rio Grande do Sul, Porto Alegre, Brazil","institution_ids":["https://openalex.org/I130442723"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5025381800"],"corresponding_institution_ids":["https://openalex.org/I130442723"],"apc_list":null,"apc_paid":null,"fwci":4.1628,"has_fulltext":false,"cited_by_count":39,"citation_normalized_percentile":{"value":0.94445791,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":"23","issue":"7","first_page":"9126","last_page":"9135"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10524","display_name":"Traffic control and management","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10524","display_name":"Traffic control and management","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.9758999943733215,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9196000099182129,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/function-approximation","display_name":"Function approximation","score":0.6062678694725037},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.5029165148735046},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.4687519073486328},{"id":"https://openalex.org/keywords/notation","display_name":"Notation","score":0.42276039719581604},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.41902679204940796},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.41475000977516174},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.4117036759853363},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.37741607427597046},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.36232423782348633},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.22460290789604187},{"id":"https://openalex.org/keywords/arithmetic","display_name":"Arithmetic","score":0.1340952217578888},{"id":"https://openalex.org/keywords/mathematical-analysis","display_name":"Mathematical analysis","score":0.10032626986503601}],"concepts":[{"id":"https://openalex.org/C91873725","wikidata":"https://www.wikidata.org/wiki/Q3445816","display_name":"Function approximation","level":3,"score":0.6062678694725037},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.5029165148735046},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.4687519073486328},{"id":"https://openalex.org/C45357846","wikidata":"https://www.wikidata.org/wiki/Q2001982","display_name":"Notation","level":2,"score":0.42276039719581604},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.41902679204940796},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.41475000977516174},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.4117036759853363},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.37741607427597046},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.36232423782348633},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.22460290789604187},{"id":"https://openalex.org/C94375191","wikidata":"https://www.wikidata.org/wiki/Q11205","display_name":"Arithmetic","level":1,"score":0.1340952217578888},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.10032626986503601},{"id":"https://openalex.org/C78458016","wikidata":"https://www.wikidata.org/wiki/Q840400","display_name":"Evolutionary biology","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tits.2021.3091014","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tits.2021.3091014","pdf_url":null,"source":{"id":"https://openalex.org/S144771191","display_name":"IEEE Transactions on Intelligent Transportation Systems","issn_l":"1524-9050","issn":["1524-9050","1558-0016"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Intelligent Transportation Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Sustainable cities and communities","score":0.7200000286102295,"id":"https://metadata.un.org/sdg/11"}],"awards":[{"id":"https://openalex.org/G179726332","display_name":null,"funder_award_id":"307215/2017-2","funder_id":"https://openalex.org/F4320322025","funder_display_name":"Conselho Nacional de Desenvolvimento Cient\u00edfico e Tecnol\u00f3gico"},{"id":"https://openalex.org/G826270355","display_name":null,"funder_award_id":"140500/2021-9","funder_id":"https://openalex.org/F4320322025","funder_display_name":"Conselho Nacional de Desenvolvimento Cient\u00edfico e Tecnol\u00f3gico"}],"funders":[{"id":"https://openalex.org/F4320320879","display_name":"Deutsche Forschungsgemeinschaft","ror":"https://ror.org/018mejw64"},{"id":"https://openalex.org/F4320321091","display_name":"Coordena\u00e7\u00e3o de Aperfei\u00e7oamento de Pessoal de N\u00edvel Superior","ror":"https://ror.org/00x0ma614"},{"id":"https://openalex.org/F4320322025","display_name":"Conselho Nacional de Desenvolvimento Cient\u00edfico e Tecnol\u00f3gico","ror":"https://ror.org/03swz6y49"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":46,"referenced_works":["https://openalex.org/W32403112","https://openalex.org/W1496467067","https://openalex.org/W1517023921","https://openalex.org/W1530389486","https://openalex.org/W1559240825","https://openalex.org/W1646707810","https://openalex.org/W1678713393","https://openalex.org/W2020070197","https://openalex.org/W2024847969","https://openalex.org/W2033254849","https://openalex.org/W2054314161","https://openalex.org/W2061348089","https://openalex.org/W2082310090","https://openalex.org/W2088595989","https://openalex.org/W2106261932","https://openalex.org/W2121863487","https://openalex.org/W2134698488","https://openalex.org/W2139418546","https://openalex.org/W2144488633","https://openalex.org/W2160085675","https://openalex.org/W2269274350","https://openalex.org/W2292594870","https://openalex.org/W2480177474","https://openalex.org/W2725582697","https://openalex.org/W2766381093","https://openalex.org/W2800490665","https://openalex.org/W2801573006","https://openalex.org/W2809148419","https://openalex.org/W2914585077","https://openalex.org/W2946214056","https://openalex.org/W2946437866","https://openalex.org/W3103910758","https://openalex.org/W3121114425","https://openalex.org/W3123082711","https://openalex.org/W4214928630","https://openalex.org/W4255786593","https://openalex.org/W4295231058","https://openalex.org/W6601816729","https://openalex.org/W6629565041","https://openalex.org/W6631886163","https://openalex.org/W6633645324","https://openalex.org/W6637319420","https://openalex.org/W6637967152","https://openalex.org/W6696542365","https://openalex.org/W6704252352","https://openalex.org/W6785252774"],"related_works":["https://openalex.org/W2504004674","https://openalex.org/W1987679298","https://openalex.org/W2963177394","https://openalex.org/W4313359513","https://openalex.org/W2498744856","https://openalex.org/W4390482104","https://openalex.org/W322408318","https://openalex.org/W149041114","https://openalex.org/W3021988786","https://openalex.org/W3099311996"],"abstract_inverted_index":{"Reinforcement":[0],"learning":[1,8],"is":[2,24,54,70,107,198],"an":[3,146],"efficient,":[4],"widely":[5],"used":[6,71],"machine":[7],"technique":[9],"that":[10,184,197,236],"performs":[11],"well":[12],"in":[13,76,143,164],"problems":[14],"with":[15,49,94,159],"a":[16,66,77,83,121,151,178,195],"reasonable":[17],"number":[18],"of":[19,52,79,114,123,145,153,156,219],"states":[20],"and":[21,118,150,228],"actions.":[22],"This":[23,109],"rarely":[25],"the":[26,38,50,112,154,202,212,220,231,234,238],"case":[27],"regarding":[28],"control-related":[29],"problems,":[30],"as":[31,60,209,211],"for":[32,233],"instance":[33],"controlling":[34],"traffic":[35,73],"signals,":[36],"where":[37],"state":[39],"space":[40],"can":[41],"be":[42],"very":[43],"large.":[44],"One":[45],"way":[46],"to":[47,55,129,172,177,201,225],"deal":[48],"curse":[51],"dimensionality":[53],"use":[56],"generalization":[57],"techniques":[58],"such":[59],"function":[61,68,125],"approximation.":[62,126],"In":[63,127],"this":[64],"paper,":[65],"linear":[67],"approximation":[69],"by":[72],"signal":[74],"agents":[75],"network":[78],"signalized":[80,161],"intersections.":[81],"Specifically,":[82],"true":[84],"online":[85],"SARSA":[86],"<inline-formula":[87,99,132,186],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[88,100,133,187],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">":[89,101,134,188],"<tex-math":[90,102,135,189],"notation=\"LaTeX\">$(\\lambda)$":[91],"</tex-math></inline-formula>":[92,105,138,192],"algorithm":[93],"Fourier":[95],"basis":[96],"functions":[97],"(TOS(":[98],"notation=\"LaTeX\">$\\lambda":[103,136,190],"$":[104,137,191],")-FB)":[106],"employed.":[108],"method":[110],"has":[111],"advantage":[113],"having":[115],"convergence":[116],"guarantees":[117],"error":[119],"bounds,":[120],"drawback":[122],"non-linear":[124],"order":[128],"evaluate":[130],"TOS(":[131,185],")-FB,":[139],"we":[140],"perform":[141],"experiments":[142],"variations":[144],"isolated":[147],"intersection":[148],"scenario":[149,152],"city":[155],"Cottbus,":[157],"Germany,":[158],"22":[160],"intersections,":[162,221],"implemented":[163],"MATSim.":[165],"We":[166],"compare":[167],"our":[168,222],"results":[169],"not":[170],"only":[171],"fixed-time":[173],"controllers,":[174],"but":[175],"also":[176,205],"state-of-the-art":[179],"rule-based":[180,213,239],"adaptive":[181],"method,":[182],"showing":[183],")-FB":[193],"shows":[194],"performance":[196],"highly":[199],"superior":[200],"fixed-time,":[203],"while":[204],"being":[206],"at":[207],"least":[208],"efficient":[210],"approach.":[214,240],"For":[215],"more":[216],"than":[217],"half":[218],"approach":[223],"leads":[224],"less":[226],"congestion":[227],"delay,":[229],"without":[230],"need":[232],"knowledge":[235],"underlies":[237]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":7},{"year":2024,"cited_by_count":13},{"year":2023,"cited_by_count":10},{"year":2022,"cited_by_count":6},{"year":2021,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
