{"id":"https://openalex.org/W3165002413","doi":"https://doi.org/10.1109/tiv.2022.3150668","title":"Safe Model-Based Off-Policy Reinforcement Learning for Eco-Driving in Connected and Automated Hybrid Electric Vehicles","display_name":"Safe Model-Based Off-Policy Reinforcement Learning for Eco-Driving in Connected and Automated Hybrid Electric Vehicles","publication_year":2022,"publication_date":"2022-02-15","ids":{"openalex":"https://openalex.org/W3165002413","doi":"https://doi.org/10.1109/tiv.2022.3150668","mag":"3165002413"},"language":"en","primary_location":{"id":"doi:10.1109/tiv.2022.3150668","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tiv.2022.3150668","pdf_url":null,"source":{"id":"https://openalex.org/S4210199657","display_name":"IEEE Transactions on Intelligent Vehicles","issn_l":"2379-8858","issn":["2379-8858","2379-8904"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Intelligent Vehicles","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102007079","display_name":"Zhaoxuan Zhu","orcid":"https://orcid.org/0000-0003-3654-7318"},"institutions":[{"id":"https://openalex.org/I52357470","display_name":"The Ohio State University","ror":"https://ror.org/00rs6vg23","country_code":"US","type":"education","lineage":["https://openalex.org/I52357470"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Zhaoxuan Zhu","raw_affiliation_strings":["Center for Automotive Research, The Ohio State University, Columbus, OH, USA"],"raw_orcid":"https://orcid.org/0000-0003-3654-7318","affiliations":[{"raw_affiliation_string":"Center for Automotive Research, The Ohio State University, Columbus, OH, USA","institution_ids":["https://openalex.org/I52357470"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067616003","display_name":"Nicola Pivaro","orcid":null},"institutions":[{"id":"https://openalex.org/I52357470","display_name":"The Ohio State University","ror":"https://ror.org/00rs6vg23","country_code":"US","type":"education","lineage":["https://openalex.org/I52357470"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Nicola Pivaro","raw_affiliation_strings":["Center for Automotive Research, The Ohio State University, Columbus, OH, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Center for Automotive Research, The Ohio State University, Columbus, OH, USA","institution_ids":["https://openalex.org/I52357470"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079662689","display_name":"Shobhit Gupta","orcid":"https://orcid.org/0000-0001-5169-3263"},"institutions":[{"id":"https://openalex.org/I52357470","display_name":"The Ohio State University","ror":"https://ror.org/00rs6vg23","country_code":"US","type":"education","lineage":["https://openalex.org/I52357470"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Shobhit Gupta","raw_affiliation_strings":["Center for Automotive Research, The Ohio State University, Columbus, OH, USA"],"raw_orcid":"https://orcid.org/0000-0001-5169-3263","affiliations":[{"raw_affiliation_string":"Center for Automotive Research, The Ohio State University, Columbus, OH, USA","institution_ids":["https://openalex.org/I52357470"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017906439","display_name":"Abhishek Gupta","orcid":"https://orcid.org/0000-0003-1117-325X"},"institutions":[{"id":"https://openalex.org/I52357470","display_name":"The Ohio State University","ror":"https://ror.org/00rs6vg23","country_code":"US","type":"education","lineage":["https://openalex.org/I52357470"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Abhishek Gupta","raw_affiliation_strings":["Department of Electrical and Computer Engineering, The Ohio State University, Columbus, OH, USA"],"raw_orcid":"https://orcid.org/0000-0003-1117-325X","affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, The Ohio State University, Columbus, OH, USA","institution_ids":["https://openalex.org/I52357470"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5075875954","display_name":"Marcello Canova","orcid":"https://orcid.org/0000-0003-1846-8894"},"institutions":[{"id":"https://openalex.org/I52357470","display_name":"The Ohio State University","ror":"https://ror.org/00rs6vg23","country_code":"US","type":"education","lineage":["https://openalex.org/I52357470"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Marcello Canova","raw_affiliation_strings":["Center for Automotive Research, The Ohio State University, Columbus, OH, USA"],"raw_orcid":"https://orcid.org/0000-0003-1846-8894","affiliations":[{"raw_affiliation_string":"Center for Automotive Research, The Ohio State University, Columbus, OH, USA","institution_ids":["https://openalex.org/I52357470"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5102007079"],"corresponding_institution_ids":["https://openalex.org/I52357470"],"apc_list":null,"apc_paid":null,"fwci":4.2328,"has_fulltext":false,"cited_by_count":60,"citation_normalized_percentile":{"value":0.9473899,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":"7","issue":"2","first_page":"387","last_page":"398"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12095","display_name":"Vehicle emissions and performance","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12095","display_name":"Vehicle emissions and performance","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10768","display_name":"Electric Vehicles and Infrastructure","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10808","display_name":"Electric and Hybrid Vehicle Technologies","score":0.9973000288009644,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8687506914138794},{"id":"https://openalex.org/keywords/fuel-efficiency","display_name":"Fuel efficiency","score":0.666332483291626},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6610368490219116},{"id":"https://openalex.org/keywords/controller","display_name":"Controller (irrigation)","score":0.6215552687644958},{"id":"https://openalex.org/keywords/trajectory","display_name":"Trajectory","score":0.6095170974731445},{"id":"https://openalex.org/keywords/baseline","display_name":"Baseline (sea)","score":0.5053487420082092},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.45002442598342896},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.41983795166015625},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.41938018798828125},{"id":"https://openalex.org/keywords/simulation","display_name":"Simulation","score":0.3229812681674957},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.22527247667312622},{"id":"https://openalex.org/keywords/automotive-engineering","display_name":"Automotive engineering","score":0.21353232860565186}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8687506914138794},{"id":"https://openalex.org/C45882903","wikidata":"https://www.wikidata.org/wiki/Q5042317","display_name":"Fuel efficiency","level":2,"score":0.666332483291626},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6610368490219116},{"id":"https://openalex.org/C203479927","wikidata":"https://www.wikidata.org/wiki/Q5165939","display_name":"Controller (irrigation)","level":2,"score":0.6215552687644958},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.6095170974731445},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.5053487420082092},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.45002442598342896},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.41983795166015625},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.41938018798828125},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.3229812681674957},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.22527247667312622},{"id":"https://openalex.org/C171146098","wikidata":"https://www.wikidata.org/wiki/Q124192","display_name":"Automotive engineering","level":1,"score":0.21353232860565186},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C127313418","wikidata":"https://www.wikidata.org/wiki/Q1069","display_name":"Geology","level":0,"score":0.0},{"id":"https://openalex.org/C6557445","wikidata":"https://www.wikidata.org/wiki/Q173113","display_name":"Agronomy","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C78458016","wikidata":"https://www.wikidata.org/wiki/Q840400","display_name":"Evolutionary biology","level":1,"score":0.0},{"id":"https://openalex.org/C111368507","wikidata":"https://www.wikidata.org/wiki/Q43518","display_name":"Oceanography","level":1,"score":0.0},{"id":"https://openalex.org/C1276947","wikidata":"https://www.wikidata.org/wiki/Q333","display_name":"Astronomy","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tiv.2022.3150668","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tiv.2022.3150668","pdf_url":null,"source":{"id":"https://openalex.org/S4210199657","display_name":"IEEE Transactions on Intelligent Vehicles","issn_l":"2379-8858","issn":["2379-8858","2379-8904"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Intelligent Vehicles","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/7","score":0.8700000047683716,"display_name":"Affordable and clean energy"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320306084","display_name":"U.S. Department of Energy","ror":"https://ror.org/01bj3aw27"},{"id":"https://openalex.org/F4320317189","display_name":"Ohio Supercomputer Center","ror":"https://ror.org/01apna436"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":68,"referenced_works":["https://openalex.org/W1506660872","https://openalex.org/W1951216520","https://openalex.org/W1959608418","https://openalex.org/W1994755758","https://openalex.org/W2090715271","https://openalex.org/W2098432798","https://openalex.org/W2119717200","https://openalex.org/W2141559645","https://openalex.org/W2152938561","https://openalex.org/W2157525649","https://openalex.org/W2165150801","https://openalex.org/W2173248099","https://openalex.org/W2173564293","https://openalex.org/W2329039258","https://openalex.org/W2519091744","https://openalex.org/W2561463613","https://openalex.org/W2612281180","https://openalex.org/W2726187156","https://openalex.org/W2749680651","https://openalex.org/W2766971499","https://openalex.org/W2767650907","https://openalex.org/W2792321165","https://openalex.org/W2792764867","https://openalex.org/W2805762288","https://openalex.org/W2891048072","https://openalex.org/W2895520692","https://openalex.org/W2898917980","https://openalex.org/W2903709398","https://openalex.org/W2922501931","https://openalex.org/W2934606751","https://openalex.org/W2949382160","https://openalex.org/W2951004968","https://openalex.org/W2953708620","https://openalex.org/W2962872206","https://openalex.org/W2963704132","https://openalex.org/W2963923407","https://openalex.org/W2974094277","https://openalex.org/W2981426338","https://openalex.org/W2999905431","https://openalex.org/W3001132159","https://openalex.org/W3009331570","https://openalex.org/W3010456448","https://openalex.org/W3011120880","https://openalex.org/W3011432977","https://openalex.org/W3022566517","https://openalex.org/W3092793148","https://openalex.org/W3118263362","https://openalex.org/W3119708141","https://openalex.org/W3130729047","https://openalex.org/W3144678276","https://openalex.org/W3146188752","https://openalex.org/W3167874530","https://openalex.org/W3191611578","https://openalex.org/W4386952173","https://openalex.org/W6640820311","https://openalex.org/W6640963894","https://openalex.org/W6684205842","https://openalex.org/W6684921986","https://openalex.org/W6685444567","https://openalex.org/W6740222838","https://openalex.org/W6748839928","https://openalex.org/W6749825310","https://openalex.org/W6751494529","https://openalex.org/W6755864697","https://openalex.org/W6757469721","https://openalex.org/W6775261052","https://openalex.org/W6775686901","https://openalex.org/W6776438516"],"related_works":["https://openalex.org/W2383111961","https://openalex.org/W2365952365","https://openalex.org/W2352448290","https://openalex.org/W2380820513","https://openalex.org/W2913146933","https://openalex.org/W2372385138","https://openalex.org/W4296359239","https://openalex.org/W2101155126","https://openalex.org/W2043093291","https://openalex.org/W2018658498"],"abstract_inverted_index":{"Deep":[0],"Reinforcement":[1,34],"Learning":[2,35],"(DRL)":[3],"has":[4],"recently":[5],"been":[6],"applied":[7],"to":[8,10,166,180],"eco-driving":[9],"intelligently":[11],"reduce":[12],"fuel":[13,152,174],"consumption":[14,153],"and":[15,23,57,76,142,170,184],"travel":[16],"time.":[17],"While":[18],"previous":[19],"studies":[20],"synthesize":[21],"simulators":[22],"model-free":[24],"DRL":[25],"(MFDRL),":[26],"this":[27],"work":[28],"proposes":[29],"a":[30,46,52,58,80,109,127,133,137,172],"Safe":[31],"Off-policy":[32],"Model-Based":[33],"(SMORL)":[36],"algorithm":[37],"for":[38,97],"eco-driving.":[39],"SMORL":[40,120,149],"integrates":[41],"three":[42],"key":[43],"components,":[44],"namely":[45],"computationally":[47],"efficient":[48],"model-based":[49],"trajectory":[50,104],"optimizer,":[51],"value":[53],"function":[54],"learned":[55,59],"off-policy":[56,74],"safe":[60,110],"set.":[61],"The":[62,117],"advantages":[63],"over":[64,123],"the":[65,71,77,84,88,101,143,151,160,167,181,185],"existing":[66],"literature":[67],"are":[68],"three-fold.":[69],"First,":[70],"combination":[72],"of":[73,79,103,119],"learning":[75],"use":[78],"physics-based":[81],"model":[82],"improves":[83],"sample":[85],"efficiency.":[86],"Second,":[87],"training":[89],"does":[90],"not":[91],"require":[92],"any":[93],"extrinsic":[94],"rewarding":[95],"mechanism":[96],"constraint":[98],"satisfaction.":[99],"Third,":[100],"feasibility":[102],"is":[105,121],"guaranteed":[106],"by":[107,113,154],"using":[108],"set":[111],"approximated":[112],"deep":[114],"generative":[115],"models.":[116],"performance":[118],"benchmarked":[122],"100":[124],"trips":[125],"against":[126],"baseline":[128,168],"controller":[129,169],"representing":[130],"human":[131],"drivers,":[132],"non-learning-based":[134,186],"optimal":[135,145,187],"controller,":[136],"previously":[138],"designed":[139],"MFDRL":[140,182],"strategy,":[141],"wait-and-see":[144],"solution.":[146],"In":[147],"simulation,":[148],"reduces":[150],"more":[155],"than":[156],"21%":[157],"while":[158,164,176],"keeping":[159],"average":[161],"speed":[162],"comparable":[163],"compared":[165,179],"demonstrates":[171],"better":[173],"economy":[175],"driving":[177],"faster":[178],"agent":[183],"controller.":[188]},"counts_by_year":[{"year":2026,"cited_by_count":4},{"year":2025,"cited_by_count":9},{"year":2024,"cited_by_count":14},{"year":2023,"cited_by_count":21},{"year":2022,"cited_by_count":10},{"year":2021,"cited_by_count":2}],"updated_date":"2026-05-08T15:41:06.802602","created_date":"2025-10-10T00:00:00"}
