{"id":"https://openalex.org/W3178194471","doi":"https://doi.org/10.1109/itsc48978.2021.9564898","title":"CommonRoad-RL: A Configurable Reinforcement Learning Environment for Motion Planning of Autonomous Vehicles","display_name":"CommonRoad-RL: A Configurable Reinforcement Learning Environment for Motion Planning of Autonomous Vehicles","publication_year":2021,"publication_date":"2021-09-19","ids":{"openalex":"https://openalex.org/W3178194471","doi":"https://doi.org/10.1109/itsc48978.2021.9564898","mag":"3178194471"},"language":"en","primary_location":{"id":"doi:10.1109/itsc48978.2021.9564898","is_oa":false,"landing_page_url":"https://doi.org/10.1109/itsc48978.2021.9564898","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE International Intelligent Transportation Systems Conference (ITSC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://mediatum.ub.tum.de/1616584","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101465691","display_name":"Xiao Wang","orcid":"https://orcid.org/0000-0003-4441-139X"},"institutions":[{"id":"https://openalex.org/I62916508","display_name":"Technical University of Munich","ror":"https://ror.org/02kkvpp62","country_code":"DE","type":"education","lineage":["https://openalex.org/I62916508"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Xiao Wang","raw_affiliation_strings":["Department of Informatics, Technical University of Munich, Garching, Germany"],"affiliations":[{"raw_affiliation_string":"Department of Informatics, Technical University of Munich, Garching, Germany","institution_ids":["https://openalex.org/I62916508"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065905965","display_name":"Hanna Krasowski","orcid":"https://orcid.org/0000-0002-6730-3802"},"institutions":[{"id":"https://openalex.org/I62916508","display_name":"Technical University of Munich","ror":"https://ror.org/02kkvpp62","country_code":"DE","type":"education","lineage":["https://openalex.org/I62916508"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Hanna Krasowski","raw_affiliation_strings":["Department of Informatics, Technical University of Munich, Garching, Germany"],"affiliations":[{"raw_affiliation_string":"Department of Informatics, Technical University of Munich, Garching, Germany","institution_ids":["https://openalex.org/I62916508"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5005383495","display_name":"Matthias Althoff","orcid":"https://orcid.org/0000-0003-3733-842X"},"institutions":[{"id":"https://openalex.org/I62916508","display_name":"Technical University of Munich","ror":"https://ror.org/02kkvpp62","country_code":"DE","type":"education","lineage":["https://openalex.org/I62916508"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Matthias Althoff","raw_affiliation_strings":["Department of Informatics, Technical University of Munich, Garching, Germany"],"affiliations":[{"raw_affiliation_string":"Department of Informatics, Technical University of Munich, Garching, Germany","institution_ids":["https://openalex.org/I62916508"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5101465691"],"corresponding_institution_ids":["https://openalex.org/I62916508"],"apc_list":null,"apc_paid":null,"fwci":2.405,"has_fulltext":false,"cited_by_count":35,"citation_normalized_percentile":{"value":0.88353632,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"466","last_page":"472"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10524","display_name":"Traffic control and management","score":0.9919999837875366,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9696999788284302,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.9086006283760071},{"id":"https://openalex.org/keywords/toolbox","display_name":"Toolbox","score":0.8768549561500549},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7574074864387512},{"id":"https://openalex.org/keywords/markov-decision-process","display_name":"Markov decision process","score":0.7161232233047485},{"id":"https://openalex.org/keywords/motion-planning","display_name":"Motion planning","score":0.6943166255950928},{"id":"https://openalex.org/keywords/robotics","display_name":"Robotics","score":0.6134694814682007},{"id":"https://openalex.org/keywords/modularity","display_name":"Modularity (biology)","score":0.5847804546356201},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.581454873085022},{"id":"https://openalex.org/keywords/motion","display_name":"Motion (physics)","score":0.5373664498329163},{"id":"https://openalex.org/keywords/stability","display_name":"Stability (learning theory)","score":0.5119789838790894},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.48053938150405884},{"id":"https://openalex.org/keywords/partially-observable-markov-decision-process","display_name":"Partially observable Markov decision process","score":0.4492378532886505},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.4172170162200928},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.38855642080307007},{"id":"https://openalex.org/keywords/markov-process","display_name":"Markov process","score":0.37165650725364685},{"id":"https://openalex.org/keywords/markov-chain","display_name":"Markov chain","score":0.3190242052078247},{"id":"https://openalex.org/keywords/markov-model","display_name":"Markov model","score":0.1768096685409546}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.9086006283760071},{"id":"https://openalex.org/C2777655017","wikidata":"https://www.wikidata.org/wiki/Q1501161","display_name":"Toolbox","level":2,"score":0.8768549561500549},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7574074864387512},{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.7161232233047485},{"id":"https://openalex.org/C81074085","wikidata":"https://www.wikidata.org/wiki/Q366872","display_name":"Motion planning","level":3,"score":0.6943166255950928},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.6134694814682007},{"id":"https://openalex.org/C2779478453","wikidata":"https://www.wikidata.org/wiki/Q6889748","display_name":"Modularity (biology)","level":2,"score":0.5847804546356201},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.581454873085022},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.5373664498329163},{"id":"https://openalex.org/C112972136","wikidata":"https://www.wikidata.org/wiki/Q7595718","display_name":"Stability (learning theory)","level":2,"score":0.5119789838790894},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.48053938150405884},{"id":"https://openalex.org/C17098449","wikidata":"https://www.wikidata.org/wiki/Q176814","display_name":"Partially observable Markov decision process","level":4,"score":0.4492378532886505},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.4172170162200928},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.38855642080307007},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.37165650725364685},{"id":"https://openalex.org/C98763669","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov chain","level":2,"score":0.3190242052078247},{"id":"https://openalex.org/C163836022","wikidata":"https://www.wikidata.org/wiki/Q6771326","display_name":"Markov model","level":3,"score":0.1768096685409546},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/itsc48978.2021.9564898","is_oa":false,"landing_page_url":"https://doi.org/10.1109/itsc48978.2021.9564898","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE International Intelligent Transportation Systems Conference (ITSC)","raw_type":"proceedings-article"},{"id":"pmh:oai:mediatum.ub.tum.de:node/1616584","is_oa":true,"landing_page_url":"https://mediatum.ub.tum.de/1616584","pdf_url":null,"source":{"id":"https://openalex.org/S4377196330","display_name":"mediaTUM  (Technical University of Munich)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I62916508","host_organization_name":"Technical University of Munich","host_organization_lineage":["https://openalex.org/I62916508"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"ConferencePaper"}],"best_oa_location":{"id":"pmh:oai:mediatum.ub.tum.de:node/1616584","is_oa":true,"landing_page_url":"https://mediatum.ub.tum.de/1616584","pdf_url":null,"source":{"id":"https://openalex.org/S4377196330","display_name":"mediaTUM  (Technical University of Munich)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I62916508","host_organization_name":"Technical University of Munich","host_organization_lineage":["https://openalex.org/I62916508"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"ConferencePaper"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/11","display_name":"Sustainable cities and communities","score":0.5199999809265137}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":41,"referenced_works":["https://openalex.org/W1558979968","https://openalex.org/W1989750313","https://openalex.org/W2120660345","https://openalex.org/W2520190918","https://openalex.org/W2561466143","https://openalex.org/W2727840223","https://openalex.org/W2736601468","https://openalex.org/W2740508249","https://openalex.org/W2896030454","https://openalex.org/W2896642734","https://openalex.org/W2903709398","https://openalex.org/W2905509562","https://openalex.org/W2910975058","https://openalex.org/W2952922765","https://openalex.org/W2962867954","https://openalex.org/W2980087597","https://openalex.org/W3090027660","https://openalex.org/W3112522408","https://openalex.org/W3115241155","https://openalex.org/W3115737827","https://openalex.org/W3116266826","https://openalex.org/W3117054268","https://openalex.org/W3117956005","https://openalex.org/W3118240751","https://openalex.org/W3132059329","https://openalex.org/W3201148029","https://openalex.org/W4285719527","https://openalex.org/W4295719664","https://openalex.org/W6726431988","https://openalex.org/W6741002519","https://openalex.org/W6745935785","https://openalex.org/W6764773821","https://openalex.org/W6769782826","https://openalex.org/W6774427560","https://openalex.org/W6780559895","https://openalex.org/W6781266601","https://openalex.org/W6787286649","https://openalex.org/W6787983614","https://openalex.org/W6788229631","https://openalex.org/W6791110036","https://openalex.org/W6801850594"],"related_works":["https://openalex.org/W2096013579","https://openalex.org/W1589140671","https://openalex.org/W1760611253","https://openalex.org/W52153049","https://openalex.org/W2951545791","https://openalex.org/W1515117609","https://openalex.org/W2294884454","https://openalex.org/W4323315247","https://openalex.org/W3169161914","https://openalex.org/W4321379664"],"abstract_inverted_index":{"Reinforcement":[0],"learning":[1],"(RL)":[2],"methods":[3],"have":[4],"gained":[5],"popularity":[6],"in":[7,20],"the":[8,36],"field":[9],"of":[10,64],"motion":[11,55],"planning":[12],"for":[13,57],"autonomous":[14,58],"vehicles":[15],"due":[16],"to":[17,31,50],"their":[18],"success":[19],"robotics":[21],"and":[22,52,62,82],"computer":[23],"games.":[24],"However,":[25],"no":[26],"existing":[27],"work":[28],"enables":[29],"researchers":[30],"conveniently":[32],"compare":[33],"different":[34,68,78],"underlying":[35],"Markov":[37],"decision":[38],"processes":[39],"(MDPs).":[40],"To":[41],"address":[42],"this":[43],"issue,":[44],"we":[45],"present":[46],"CommonRoad-RL-an":[47],"open-source":[48],"toolbox":[49,91],"train":[51],"evaluate":[53],"RL-based":[54],"planners":[56],"vehicles.":[59],"Configurability,":[60],"modularity,":[61],"stability":[63],"CommonRoad-RL":[65],"simplify":[66],"comparing":[67,74],"MDPs.":[69],"This":[70],"is":[71,92],"demonstrated":[72],"by":[73],"agents":[75],"trained":[76],"with":[77],"rewards,":[79],"action":[80],"spaces,":[81],"vehicle":[83],"models":[84],"on":[85],"a":[86],"real-world":[87],"highway":[88],"dataset.":[89],"Our":[90],"available":[93],"at":[94],"commonroad.in.tum.de.":[95]},"counts_by_year":[{"year":2025,"cited_by_count":9},{"year":2024,"cited_by_count":8},{"year":2023,"cited_by_count":11},{"year":2022,"cited_by_count":6},{"year":2021,"cited_by_count":1}],"updated_date":"2026-03-04T09:10:02.777135","created_date":"2021-07-19T00:00:00"}
