{"id":"https://openalex.org/W4391768741","doi":"https://doi.org/10.1109/itsc57777.2023.10422605","title":"Safety Reinforced Model Predictive Control (SRMPC): Improving MPC with Reinforcement Learning for Motion Planning in Autonomous Driving","display_name":"Safety Reinforced Model Predictive Control (SRMPC): Improving MPC with Reinforcement Learning for Motion Planning in Autonomous Driving","publication_year":2023,"publication_date":"2023-09-24","ids":{"openalex":"https://openalex.org/W4391768741","doi":"https://doi.org/10.1109/itsc57777.2023.10422605"},"language":"en","primary_location":{"id":"doi:10.1109/itsc57777.2023.10422605","is_oa":false,"landing_page_url":"https://doi.org/10.1109/itsc57777.2023.10422605","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE 26th International Conference on Intelligent Transportation Systems (ITSC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2512.03774","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5055443993","display_name":"Johannes Fischer","orcid":"https://orcid.org/0000-0002-3384-597X"},"institutions":[{"id":"https://openalex.org/I102335020","display_name":"Karlsruhe Institute of Technology","ror":"https://ror.org/04t3en479","country_code":"DE","type":"education","lineage":["https://openalex.org/I102335020","https://openalex.org/I1305996414"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Johannes Fischer","raw_affiliation_strings":["Institute of Measurement and Control Systems, Karlsruhe Institute of Technology (KIT),Karlsruhe,Germany","Institute of Measurement and Control Systems, Karlsruhe Institute of Technology (KIT), Karlsruhe, Germany"],"affiliations":[{"raw_affiliation_string":"Institute of Measurement and Control Systems, Karlsruhe Institute of Technology (KIT),Karlsruhe,Germany","institution_ids":["https://openalex.org/I102335020"]},{"raw_affiliation_string":"Institute of Measurement and Control Systems, Karlsruhe Institute of Technology (KIT), Karlsruhe, Germany","institution_ids":["https://openalex.org/I102335020"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011559098","display_name":"Marlon Steiner","orcid":"https://orcid.org/0009-0005-4025-9142"},"institutions":[{"id":"https://openalex.org/I102335020","display_name":"Karlsruhe Institute of Technology","ror":"https://ror.org/04t3en479","country_code":"DE","type":"education","lineage":["https://openalex.org/I102335020","https://openalex.org/I1305996414"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Marlon Steiner","raw_affiliation_strings":["Institute of Measurement and Control Systems, Karlsruhe Institute of Technology (KIT),Karlsruhe,Germany","Institute of Measurement and Control Systems, Karlsruhe Institute of Technology (KIT), Karlsruhe, Germany"],"affiliations":[{"raw_affiliation_string":"Institute of Measurement and Control Systems, Karlsruhe Institute of Technology (KIT),Karlsruhe,Germany","institution_ids":["https://openalex.org/I102335020"]},{"raw_affiliation_string":"Institute of Measurement and Control Systems, Karlsruhe Institute of Technology (KIT), Karlsruhe, Germany","institution_ids":["https://openalex.org/I102335020"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061681603","display_name":"\u00d6mer \u015eahin Ta\u015f","orcid":"https://orcid.org/0000-0002-1249-260X"},"institutions":[{"id":"https://openalex.org/I143379178","display_name":"FZI Research Center for Information Technology","ror":"https://ror.org/04kdh6x72","country_code":"DE","type":"nonprofit","lineage":["https://openalex.org/I143379178"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"\u00d6mer \u015eahin Ta\u015f","raw_affiliation_strings":["FZI Research Center for Information Technology,Karlsruhe,Germany","FZI Research Center for Information Technology, Karlsruhe, Germany"],"affiliations":[{"raw_affiliation_string":"FZI Research Center for Information Technology,Karlsruhe,Germany","institution_ids":["https://openalex.org/I143379178"]},{"raw_affiliation_string":"FZI Research Center for Information Technology, Karlsruhe, Germany","institution_ids":["https://openalex.org/I143379178"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5091574711","display_name":"Christoph Stiller","orcid":"https://orcid.org/0000-0003-4165-2075"},"institutions":[{"id":"https://openalex.org/I102335020","display_name":"Karlsruhe Institute of Technology","ror":"https://ror.org/04t3en479","country_code":"DE","type":"education","lineage":["https://openalex.org/I102335020","https://openalex.org/I1305996414"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Christoph Stiller","raw_affiliation_strings":["Institute of Measurement and Control Systems, Karlsruhe Institute of Technology (KIT),Karlsruhe,Germany","Institute of Measurement and Control Systems, Karlsruhe Institute of Technology (KIT), Karlsruhe, Germany"],"affiliations":[{"raw_affiliation_string":"Institute of Measurement and Control Systems, Karlsruhe Institute of Technology (KIT),Karlsruhe,Germany","institution_ids":["https://openalex.org/I102335020"]},{"raw_affiliation_string":"Institute of Measurement and Control Systems, Karlsruhe Institute of Technology (KIT), Karlsruhe, Germany","institution_ids":["https://openalex.org/I102335020"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5055443993"],"corresponding_institution_ids":["https://openalex.org/I102335020"],"apc_list":null,"apc_paid":null,"fwci":0.558,"has_fulltext":true,"cited_by_count":3,"citation_normalized_percentile":{"value":0.68551695,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"2811","last_page":"2818"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10791","display_name":"Advanced Control Systems Optimization","score":0.9930999875068665,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10791","display_name":"Advanced Control Systems Optimization","score":0.9930999875068665,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/model-predictive-control","display_name":"Model predictive control","score":0.8449923992156982},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8220345973968506},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.602378249168396},{"id":"https://openalex.org/keywords/motion","display_name":"Motion (physics)","score":0.5455259680747986},{"id":"https://openalex.org/keywords/motion-control","display_name":"Motion control","score":0.533906102180481},{"id":"https://openalex.org/keywords/motion-planning","display_name":"Motion planning","score":0.5193946957588196},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.4937938153743744},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.4457533657550812},{"id":"https://openalex.org/keywords/control-engineering","display_name":"Control engineering","score":0.40667372941970825},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.386574387550354},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.35656702518463135},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.24904930591583252},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.18327397108078003}],"concepts":[{"id":"https://openalex.org/C172205157","wikidata":"https://www.wikidata.org/wiki/Q1782962","display_name":"Model predictive control","level":3,"score":0.8449923992156982},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8220345973968506},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.602378249168396},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.5455259680747986},{"id":"https://openalex.org/C145565327","wikidata":"https://www.wikidata.org/wiki/Q852514","display_name":"Motion control","level":3,"score":0.533906102180481},{"id":"https://openalex.org/C81074085","wikidata":"https://www.wikidata.org/wiki/Q366872","display_name":"Motion planning","level":3,"score":0.5193946957588196},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.4937938153743744},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.4457533657550812},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.40667372941970825},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.386574387550354},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.35656702518463135},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.24904930591583252},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.18327397108078003},{"id":"https://openalex.org/C66938386","wikidata":"https://www.wikidata.org/wiki/Q633538","display_name":"Structural engineering","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/itsc57777.2023.10422605","is_oa":false,"landing_page_url":"https://doi.org/10.1109/itsc57777.2023.10422605","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE 26th International Conference on Intelligent Transportation Systems (ITSC)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2512.03774","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2512.03774","pdf_url":"https://arxiv.org/pdf/2512.03774","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2512.03774","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2512.03774","pdf_url":"https://arxiv.org/pdf/2512.03774","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"score":0.4300000071525574,"id":"https://metadata.un.org/sdg/13","display_name":"Climate action"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4391768741.pdf"},"referenced_works_count":40,"referenced_works":["https://openalex.org/W1568248713","https://openalex.org/W1845972764","https://openalex.org/W2006859604","https://openalex.org/W2088532626","https://openalex.org/W2217407546","https://openalex.org/W2396317032","https://openalex.org/W2616635592","https://openalex.org/W2736601468","https://openalex.org/W2738778707","https://openalex.org/W2769646558","https://openalex.org/W2782695576","https://openalex.org/W2791704483","https://openalex.org/W2889731659","https://openalex.org/W2897867013","https://openalex.org/W2910912045","https://openalex.org/W2963105220","https://openalex.org/W2970080264","https://openalex.org/W2972868310","https://openalex.org/W3011964880","https://openalex.org/W3049171653","https://openalex.org/W3101798601","https://openalex.org/W3101813639","https://openalex.org/W3120475579","https://openalex.org/W3164473225","https://openalex.org/W3179660843","https://openalex.org/W3193319380","https://openalex.org/W3197085773","https://openalex.org/W3199664591","https://openalex.org/W4205300464","https://openalex.org/W4206497039","https://openalex.org/W4221144246","https://openalex.org/W4293545785","https://openalex.org/W4297781990","https://openalex.org/W4308080966","https://openalex.org/W4311416708","https://openalex.org/W4313014766","https://openalex.org/W4390939851","https://openalex.org/W6701090783","https://openalex.org/W6743333067","https://openalex.org/W6804655846"],"related_works":["https://openalex.org/W2920061524","https://openalex.org/W4310083477","https://openalex.org/W1977959518","https://openalex.org/W2038908348","https://openalex.org/W2107890255","https://openalex.org/W2106552856","https://openalex.org/W1987513656","https://openalex.org/W2072376847","https://openalex.org/W2089013912","https://openalex.org/W2145821588"],"abstract_inverted_index":{"Model":[0],"predictive":[1],"control":[2,25],"(MPC)":[3],"is":[4],"widely":[5],"used":[6],"for":[7,28],"motion":[8],"planning,":[9],"particularly":[10],"in":[11,98,138,154],"autonomous":[12],"driving.":[13],"Real-time":[14],"capability":[15],"of":[16,23,81,146,156],"the":[17,29,35,44,72,78,82,109,128,133,144],"planner":[18],"requires":[19],"utilizing":[20],"convex":[21],"approximation":[22],"optimal":[24],"problems":[26],"(OCPs)":[27],"planner.":[30],"However,":[31],"such":[32],"approximations":[33],"confine":[34],"solution":[36],"to":[37,57,95,112,131],"a":[38,59,69,102,121,139],"subspace,":[39],"which":[40],"might":[41],"not":[42],"contain":[43],"global":[45,87],"optimum.":[46],"To":[47],"address":[48],"this,":[49],"we":[50,142],"propose":[51],"using":[52,101],"safe":[53,62,114,129],"reinforcement":[54,92],"learning":[55,93],"(SRL)":[56],"obtain":[58],"new":[60],"and":[61,115,152,158],"reference":[63],"trajectory":[64],"within":[65],"MPC.":[66],"By":[67],"employing":[68],"learning-based":[70],"approach,":[71],"MPC":[73,151],"can":[74],"explore":[75],"solutions":[76],"beyond":[77],"close":[79],"neighborhood":[80],"previous":[83],"one,":[84],"potentially":[85],"finding":[86],"optima.":[88],"We":[89],"incorporate":[90],"constrained":[91],"(CRL)":[94],"ensure":[96],"safety":[97,106,157],"automated":[99],"driving,":[100],"handcrafted":[103],"energy":[104],"function-based":[105],"index":[107],"as":[108],"constraint":[110],"objective":[111],"model":[113],"unsafe":[116],"regions.":[117],"Our":[118],"approach":[119,148],"utilizes":[120],"state-dependent":[122],"Lagrangian":[123],"multiplier,":[124],"learned":[125],"concurrently":[126],"with":[127],"policy,":[130],"solve":[132],"CRL":[134],"problem.":[135],"Through":[136],"experimentation":[137],"highway":[140],"scenario,":[141],"demonstrate":[143],"superiority":[145],"our":[147],"over":[149],"both":[150],"SRL":[153],"terms":[155],"performance":[159],"measures.":[160]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2}],"updated_date":"2026-03-14T08:43:22.919905","created_date":"2024-02-14T00:00:00"}
