{"id":"https://openalex.org/W3012104945","doi":"https://doi.org/10.1109/cdc40024.2019.9029961","title":"Reinforcement Learning Augmented Optimization for Smart Mobility","display_name":"Reinforcement Learning Augmented Optimization for Smart Mobility","publication_year":2019,"publication_date":"2019-12-01","ids":{"openalex":"https://openalex.org/W3012104945","doi":"https://doi.org/10.1109/cdc40024.2019.9029961","mag":"3012104945"},"language":"en","primary_location":{"id":"doi:10.1109/cdc40024.2019.9029961","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cdc40024.2019.9029961","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE 58th Conference on Decision and Control (CDC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5008042301","display_name":"Roman Overko","orcid":"https://orcid.org/0000-0001-5164-5675"},"institutions":[{"id":"https://openalex.org/I100930933","display_name":"University College Dublin","ror":"https://ror.org/05m7pjf47","country_code":"IE","type":"education","lineage":["https://openalex.org/I100930933"]}],"countries":["IE"],"is_corresponding":true,"raw_author_name":"Roman Overko","raw_affiliation_strings":["University College Dublin, Dublin, Ireland"],"affiliations":[{"raw_affiliation_string":"University College Dublin, Dublin, Ireland","institution_ids":["https://openalex.org/I100930933"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058500031","display_name":"Rodrigo Ord\u00f3\u00f1ez-Hurtado","orcid":"https://orcid.org/0000-0002-9053-8482"},"institutions":[{"id":"https://openalex.org/I4210145784","display_name":"IBM Research - Ireland","ror":"https://ror.org/04jnxr720","country_code":"IE","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210114115","https://openalex.org/I4210145784"]}],"countries":["IE"],"is_corresponding":false,"raw_author_name":"Rodrigo Ordonez-Hurtado","raw_affiliation_strings":["IBM Research, Dublin, Ireland"],"affiliations":[{"raw_affiliation_string":"IBM Research, Dublin, Ireland","institution_ids":["https://openalex.org/I4210145784"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042402060","display_name":"Sergiy Zhuk","orcid":"https://orcid.org/0000-0002-0956-8909"},"institutions":[{"id":"https://openalex.org/I4210145784","display_name":"IBM Research - Ireland","ror":"https://ror.org/04jnxr720","country_code":"IE","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210114115","https://openalex.org/I4210145784"]}],"countries":["IE"],"is_corresponding":false,"raw_author_name":"Sergiy Zhuk","raw_affiliation_strings":["IBM Research, Dublin, Ireland"],"affiliations":[{"raw_affiliation_string":"IBM Research, Dublin, Ireland","institution_ids":["https://openalex.org/I4210145784"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5036373073","display_name":"Robert Shorten","orcid":"https://orcid.org/0000-0002-9239-2499"},"institutions":[{"id":"https://openalex.org/I100930933","display_name":"University College Dublin","ror":"https://ror.org/05m7pjf47","country_code":"IE","type":"education","lineage":["https://openalex.org/I100930933"]}],"countries":["IE"],"is_corresponding":false,"raw_author_name":"Robert Shorten","raw_affiliation_strings":["University College Dublin, Dublin, Ireland"],"affiliations":[{"raw_affiliation_string":"University College Dublin, Dublin, Ireland","institution_ids":["https://openalex.org/I100930933"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5008042301"],"corresponding_institution_ids":["https://openalex.org/I100930933"],"apc_list":null,"apc_paid":null,"fwci":0.1626,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.59102589,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":"57","issue":null,"first_page":"1286","last_page":"1292"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12546","display_name":"Smart Parking Systems Research","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/2215","display_name":"Building and Construction"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12546","display_name":"Smart Parking Systems Research","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/2215","display_name":"Building and Construction"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11942","display_name":"Transportation and Mobility Innovations","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10603","display_name":"Smart Grid Energy Management","score":0.996399998664856,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/markov-decision-process","display_name":"Markov decision process","score":0.7638132572174072},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7629997134208679},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6984678506851196},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.5644658803939819},{"id":"https://openalex.org/keywords/markov-process","display_name":"Markov process","score":0.5052960515022278},{"id":"https://openalex.org/keywords/optimization-problem","display_name":"Optimization problem","score":0.47895199060440063},{"id":"https://openalex.org/keywords/identification","display_name":"Identification (biology)","score":0.4432508945465088},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.4349391460418701},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.35306912660598755},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1627815067768097},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.1398961842060089}],"concepts":[{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.7638132572174072},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7629997134208679},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6984678506851196},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.5644658803939819},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.5052960515022278},{"id":"https://openalex.org/C137836250","wikidata":"https://www.wikidata.org/wiki/Q984063","display_name":"Optimization problem","level":2,"score":0.47895199060440063},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.4432508945465088},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.4349391460418701},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.35306912660598755},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1627815067768097},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.1398961842060089},{"id":"https://openalex.org/C59822182","wikidata":"https://www.wikidata.org/wiki/Q441","display_name":"Botany","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/cdc40024.2019.9029961","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cdc40024.2019.9029961","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE 58th Conference on Decision and Control (CDC)","raw_type":"proceedings-article"},{"id":"mag:3087228131","is_oa":false,"landing_page_url":"https://jglobal.jst.go.jp/en/detail?JGLOBAL_ID=202002261335453903","pdf_url":null,"source":{"id":"https://openalex.org/S4306512817","display_name":"IEEE Conference Proceedings","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":"IEEE Conference Proceedings","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.550000011920929,"display_name":"Sustainable cities and communities","id":"https://metadata.un.org/sdg/11"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":35,"referenced_works":["https://openalex.org/W1509991338","https://openalex.org/W1572161815","https://openalex.org/W1966431672","https://openalex.org/W1968459311","https://openalex.org/W1976843608","https://openalex.org/W1981612131","https://openalex.org/W1983057780","https://openalex.org/W2051894182","https://openalex.org/W2068181924","https://openalex.org/W2088595989","https://openalex.org/W2122124659","https://openalex.org/W2132276257","https://openalex.org/W2145457662","https://openalex.org/W2155856926","https://openalex.org/W2171033594","https://openalex.org/W2462689321","https://openalex.org/W2480177474","https://openalex.org/W2569271578","https://openalex.org/W2583813242","https://openalex.org/W2750990725","https://openalex.org/W2795942711","https://openalex.org/W2807760453","https://openalex.org/W2901712207","https://openalex.org/W2903709398","https://openalex.org/W2907953482","https://openalex.org/W2963338863","https://openalex.org/W4231389053","https://openalex.org/W4299805495","https://openalex.org/W6678276431","https://openalex.org/W6729807388","https://openalex.org/W6743617358","https://openalex.org/W6752126435","https://openalex.org/W6756699898","https://openalex.org/W6758223966","https://openalex.org/W7033776453"],"related_works":["https://openalex.org/W4400868993","https://openalex.org/W3096874164","https://openalex.org/W1985560493","https://openalex.org/W2937181779","https://openalex.org/W2386410636","https://openalex.org/W2357975469","https://openalex.org/W2145363145","https://openalex.org/W1626977535","https://openalex.org/W2341346307","https://openalex.org/W3168977894"],"abstract_inverted_index":{"Many":[0],"mobility":[1,97],"applications":[2],"in":[3],"smart":[4,96],"cities":[5],"are":[6,15,74,91,102],"addressed":[7],"as":[8,67,77],"optimization":[9],"problems.":[10],"However,":[11],"often,":[12],"these":[13],"problems":[14],"fragile":[16],"due":[17,26],"to":[18,27,46,53,86],"their":[19],"large-scale":[20],"and":[21,24,99],"non-convex":[22],"nature,":[23],"also":[25],"uncertainties":[28],"arising":[29],"because":[30],"of":[31,80,95],"human":[32],"activity.":[33],"In":[34],"this":[35,55],"paper,":[36],"we":[37,58],"apply":[38],"a":[39,51,78],"model-based":[40],"Markov-decision-process":[41],"(MDP)":[42],"closed-loop":[43],"identification":[44],"algorithm":[45],"augment":[47],"classical":[48,65],"optimizers,":[49],"with":[50,83,88],"view":[52],"alleviating":[54],"fragility.":[56],"Specifically,":[57],"use":[59],"deterministic":[60],"optimal":[61],"solutions":[62],"provided":[63],"by":[64],"optimizers":[66],"initial":[68],"guesses":[69],"for":[70],"MDP's":[71],"policies,":[72],"which":[73],"then":[75],"\"amended\"":[76],"result":[79],"online":[81],"interaction":[82],"the":[84],"environment":[85],"cope":[87],"uncertainty.":[89],"Applications":[90],"described":[92],"from":[93],"niche":[94],"problems,":[98],"numerical":[100],"results":[101],"provided.":[103]},"counts_by_year":[{"year":2020,"cited_by_count":1}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
