{"id":"https://openalex.org/W2583813242","doi":"https://doi.org/10.1109/tits.2017.2725912","title":"Expert Level Control of Ramp Metering Based on Multi-Task Deep Reinforcement Learning","display_name":"Expert Level Control of Ramp Metering Based on Multi-Task Deep Reinforcement Learning","publication_year":2017,"publication_date":"2017-08-17","ids":{"openalex":"https://openalex.org/W2583813242","doi":"https://doi.org/10.1109/tits.2017.2725912","mag":"2583813242"},"language":"en","primary_location":{"id":"doi:10.1109/tits.2017.2725912","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tits.2017.2725912","pdf_url":null,"source":{"id":"https://openalex.org/S144771191","display_name":"IEEE Transactions on Intelligent Transportation Systems","issn_l":"1524-9050","issn":["1524-9050","1558-0016"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Intelligent Transportation Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5035711588","display_name":"Francois Belletti","orcid":"https://orcid.org/0000-0003-1172-7283"},"institutions":[{"id":"https://openalex.org/I95457486","display_name":"University of California, Berkeley","ror":"https://ror.org/01an7q238","country_code":"US","type":"education","lineage":["https://openalex.org/I95457486"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Francois Belletti","raw_affiliation_strings":["Computer Science Deptartment, University of California at Berkeley, Berkeley, CA, USA"],"affiliations":[{"raw_affiliation_string":"Computer Science Deptartment, University of California at Berkeley, Berkeley, CA, USA","institution_ids":["https://openalex.org/I95457486"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063864170","display_name":"Daniel Haziza","orcid":null},"institutions":[{"id":"https://openalex.org/I142476485","display_name":"\u00c9cole Polytechnique","ror":"https://ror.org/05hy3tk52","country_code":"FR","type":"education","lineage":["https://openalex.org/I142476485","https://openalex.org/I4210145102"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Daniel Haziza","raw_affiliation_strings":["Ecole Polytechnique, Palaiseau, France"],"affiliations":[{"raw_affiliation_string":"Ecole Polytechnique, Palaiseau, France","institution_ids":["https://openalex.org/I142476485"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102923214","display_name":"Gabriel Gomes","orcid":"https://orcid.org/0000-0002-3258-0623"},"institutions":[{"id":"https://openalex.org/I95457486","display_name":"University of California, Berkeley","ror":"https://ror.org/01an7q238","country_code":"US","type":"education","lineage":["https://openalex.org/I95457486"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Gabriel Gomes","raw_affiliation_strings":["Institute of Transportation Studies, University of California at Berkeley, Berkeley, CA, USA"],"affiliations":[{"raw_affiliation_string":"Institute of Transportation Studies, University of California at Berkeley, Berkeley, CA, USA","institution_ids":["https://openalex.org/I95457486"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5021116704","display_name":"Alexandre M. Bayen","orcid":"https://orcid.org/0000-0002-6697-222X"},"institutions":[{"id":"https://openalex.org/I95457486","display_name":"University of California, Berkeley","ror":"https://ror.org/01an7q238","country_code":"US","type":"education","lineage":["https://openalex.org/I95457486"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Alexandre M. Bayen","raw_affiliation_strings":["Department of Civil and Environmental Engineering","Institute of Transportation Studies, University of California at Berkeley, Berkeley, CA, USA"],"affiliations":[{"raw_affiliation_string":"Department of Civil and Environmental Engineering","institution_ids":[]},{"raw_affiliation_string":"Institute of Transportation Studies, University of California at Berkeley, Berkeley, CA, USA","institution_ids":["https://openalex.org/I95457486"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5035711588"],"corresponding_institution_ids":["https://openalex.org/I95457486"],"apc_list":null,"apc_paid":null,"fwci":12.2008,"has_fulltext":false,"cited_by_count":153,"citation_normalized_percentile":{"value":0.98941771,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":100},"biblio":{"volume":"19","issue":"4","first_page":"1198","last_page":"1207"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10524","display_name":"Traffic control and management","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10524","display_name":"Traffic control and management","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10917","display_name":"Smart Grid Security and Resilience","score":0.9929999709129333,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.9883000254631042,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7321345806121826},{"id":"https://openalex.org/keywords/discretization","display_name":"Discretization","score":0.6347579956054688},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5944643616676331},{"id":"https://openalex.org/keywords/curse-of-dimensionality","display_name":"Curse of dimensionality","score":0.5798916220664978},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.45413029193878174},{"id":"https://openalex.org/keywords/control-engineering","display_name":"Control engineering","score":0.418876588344574},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4140395224094391},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.33551836013793945},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.20940938591957092},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1497189700603485}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7321345806121826},{"id":"https://openalex.org/C73000952","wikidata":"https://www.wikidata.org/wiki/Q17007827","display_name":"Discretization","level":2,"score":0.6347579956054688},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5944643616676331},{"id":"https://openalex.org/C111030470","wikidata":"https://www.wikidata.org/wiki/Q1430460","display_name":"Curse of dimensionality","level":2,"score":0.5798916220664978},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.45413029193878174},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.418876588344574},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4140395224094391},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.33551836013793945},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.20940938591957092},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1497189700603485},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tits.2017.2725912","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tits.2017.2725912","pdf_url":null,"source":{"id":"https://openalex.org/S144771191","display_name":"IEEE Transactions on Intelligent Transportation Systems","issn_l":"1524-9050","issn":["1524-9050","1558-0016"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Intelligent Transportation Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/7","score":0.5400000214576721,"display_name":"Affordable and clean energy"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":35,"referenced_works":["https://openalex.org/W314779054","https://openalex.org/W1191599655","https://openalex.org/W1626957775","https://openalex.org/W1632785960","https://openalex.org/W1757796397","https://openalex.org/W1766637835","https://openalex.org/W1771410628","https://openalex.org/W2000359198","https://openalex.org/W2014847204","https://openalex.org/W2053330094","https://openalex.org/W2065672848","https://openalex.org/W2102348546","https://openalex.org/W2104733512","https://openalex.org/W2119717200","https://openalex.org/W2121103318","https://openalex.org/W2123859855","https://openalex.org/W2127107099","https://openalex.org/W2130801532","https://openalex.org/W2155007355","https://openalex.org/W2170290380","https://openalex.org/W2257979135","https://openalex.org/W2342662072","https://openalex.org/W2624967856","https://openalex.org/W2963634205","https://openalex.org/W2964006217","https://openalex.org/W2964161785","https://openalex.org/W4239943352","https://openalex.org/W4298857966","https://openalex.org/W6637930290","https://openalex.org/W6639949747","https://openalex.org/W6675999342","https://openalex.org/W6678367057","https://openalex.org/W6679257226","https://openalex.org/W6684859510","https://openalex.org/W6739580373"],"related_works":["https://openalex.org/W2364741597","https://openalex.org/W1492103595","https://openalex.org/W1864774435","https://openalex.org/W946352265","https://openalex.org/W3020787026","https://openalex.org/W2334479858","https://openalex.org/W2799209613","https://openalex.org/W1971388572","https://openalex.org/W1507702947","https://openalex.org/W2370926798"],"abstract_inverted_index":{"This":[0],"paper":[1],"shows":[2],"how":[3,126,321],"the":[4,38,46,52,85,115,131,154,171,184,188,191,202,219,241,270,288,291,298,325],"recent":[5],"breakthroughs":[6],"in":[7,107,293],"reinforcement":[8,247],"learning":[9,224,326],"(RL)":[10],"that":[11,34,114],"have":[12,98],"enabled":[13],"robots":[14],"to":[15,17,30,69,103,173,180,183,225,278,305],"learn":[16],"play":[18],"arcade":[19],"video":[20],"games,":[21],"walk,":[22],"or":[23],"assemble":[24],"colored":[25],"bricks,":[26],"can":[27,206],"be":[28,208],"used":[29],"perform":[31],"other":[32],"tasks":[33],"are":[35,91,138,276],"currently":[36],"at":[37],"core":[39],"of":[40,49,54,117,133,147,156,158,187,190,269,290],"engineering":[41,105],"cyberphysical":[42,228],"systems.":[43,77],"We":[44,124,143,233],"present":[45],"first":[47],"use":[48,70],"RL":[50,129,256],"for":[51,74,223,248],"control":[53,72,116,132,160,226,250,308,317],"systems":[55,79],"modeled":[56,93],"by":[57,94,162,244],"discretized":[58,134,198],"non-linear":[59],"partial":[60],"differential":[61],"equations":[62],"(PDEs)":[63],"and":[64,88,141,216,239,319],"devise":[65],"a":[66,100,211,254,260,266,307,314],"novel":[67],"algorithm":[68,146],"non-parametric":[71],"techniques":[73],"large":[75,227],"multi-agent":[76,159],"Cyberphysical":[78],"(e.g.,":[80],"hydraulic":[81],"channels,":[82],"transportation":[83],"systems,":[84],"energy":[86],"grid,":[87],"electromagnetic":[89],"systems)":[90],"commonly":[92],"PDEs,":[95],"which":[96,152,217],"historically":[97],"been":[99],"reliable":[101],"way":[102],"enable":[104],"applications":[106],"these":[108,118],"domains.":[109],"However,":[110],"it":[111,182,193],"is":[112,121,194],"known":[113],"PDE":[119,205,257],"models":[120],"notoriously":[122],"difficult.":[123],"show":[125,240,320],"neural":[127,255],"network-based":[128],"enables":[130],"PDEs":[135],"whose":[136],"parameters":[137,186],"unknown,":[139],"random,":[140],"time-varying.":[142],"introduce":[144],"an":[145],"mutual":[148],"weight":[149],"regularization":[150],"(MWR),":[151],"alleviates":[153],"curse":[155],"dimensionality":[157],"schemes":[161],"sharing":[163],"experience":[164],"between":[165],"agents":[166],"while":[167],"giving":[168],"each":[169],"agent":[170],"opportunity":[172],"specialize":[174],"its":[175],"action":[176],"policy":[177],"so":[178],"as":[179,201,210],"tailor":[181],"local":[185],"part":[189],"system":[192,229],"located":[195],"in.":[196],"A":[197],"PDE,":[199],"such":[200],"scalar":[203],"Lighthill-Whitham-Richards":[204],"indeed":[207],"considered":[209],"macroscopic":[212],"freeway":[213],"traffic":[214,261,294],"simulator":[215],"presents":[218],"most":[220],"salient":[221],"challenges":[222],"with":[230,297,312],"multiple":[231],"agents.":[232],"consider":[234],"two":[235],"different":[236],"discretization":[237,268],"procedures":[238],"opportunities":[242],"offered":[243],"applying":[245],"deep":[246],"continuous":[249],"on":[251,259,265,310],"both.":[252],"Using":[253],"controller":[258],"flow":[262],"simulation":[263],"based":[264],"Godunov":[267],"San":[271],"Francisco":[272],"Bay":[273],"Bridge,":[274],"we":[275,303],"able":[277],"achieve":[279,306],"precise":[280],"adaptive":[281],"metering":[282],"without":[283],"model":[284],"calibration":[285],"thereby":[286],"beating":[287],"state":[289],"art":[292],"metering.":[295],"Furthermore,":[296],"more":[299],"accurate":[300],"BeATS":[301],"simulator,":[302],"manage":[304],"performance":[309],"par":[311],"ALINEA,":[313],"state-of-the-art":[315],"parametric":[316],"scheme,":[318],"using":[322],"MWR":[323],"improves":[324],"procedure.":[327]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":13},{"year":2024,"cited_by_count":12},{"year":2023,"cited_by_count":14},{"year":2022,"cited_by_count":25},{"year":2021,"cited_by_count":26},{"year":2020,"cited_by_count":25},{"year":2019,"cited_by_count":18},{"year":2018,"cited_by_count":13},{"year":2017,"cited_by_count":4}],"updated_date":"2026-03-18T14:38:29.013473","created_date":"2025-10-10T00:00:00"}
