{"id":"https://openalex.org/W4400645643","doi":"https://doi.org/10.1109/iv55156.2024.10588652","title":"Test-Driven Inverse Reinforcement Learning Using Scenario-Based Testing","display_name":"Test-Driven Inverse Reinforcement Learning Using Scenario-Based Testing","publication_year":2024,"publication_date":"2024-06-02","ids":{"openalex":"https://openalex.org/W4400645643","doi":"https://doi.org/10.1109/iv55156.2024.10588652"},"language":"en","primary_location":{"id":"doi:10.1109/iv55156.2024.10588652","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iv55156.2024.10588652","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE Intelligent Vehicles Symposium (IV)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5055443993","display_name":"Johannes Fischer","orcid":"https://orcid.org/0000-0002-3384-597X"},"institutions":[{"id":"https://openalex.org/I102335020","display_name":"Karlsruhe Institute of Technology","ror":"https://ror.org/04t3en479","country_code":"DE","type":"education","lineage":["https://openalex.org/I102335020","https://openalex.org/I1305996414"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Johannes Fischer","raw_affiliation_strings":["Institute of Measurement and Control Systems, Karlsruhe Institute of Technology (KIT),Karlsruhe,Germany"],"affiliations":[{"raw_affiliation_string":"Institute of Measurement and Control Systems, Karlsruhe Institute of Technology (KIT),Karlsruhe,Germany","institution_ids":["https://openalex.org/I102335020"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027250190","display_name":"Moritz Werling","orcid":null},"institutions":[{"id":"https://openalex.org/I4210156768","display_name":"BMW Group (Germany)","ror":"https://ror.org/044kkbh92","country_code":"DE","type":"company","lineage":["https://openalex.org/I4210156768"]},{"id":"https://openalex.org/I4210145546","display_name":"Baxter (Germany)","ror":"https://ror.org/05jgtkc28","country_code":"DE","type":"company","lineage":["https://openalex.org/I4210145546","https://openalex.org/I99484792"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Moritz Werling","raw_affiliation_strings":["BMWGroup,Unterschleissheim,Germany"],"affiliations":[{"raw_affiliation_string":"BMWGroup,Unterschleissheim,Germany","institution_ids":["https://openalex.org/I4210145546","https://openalex.org/I4210156768"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008189468","display_name":"Martin Lauer","orcid":"https://orcid.org/0000-0003-4414-5722"},"institutions":[{"id":"https://openalex.org/I102335020","display_name":"Karlsruhe Institute of Technology","ror":"https://ror.org/04t3en479","country_code":"DE","type":"education","lineage":["https://openalex.org/I102335020","https://openalex.org/I1305996414"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Martin Lauer","raw_affiliation_strings":["Institute of Measurement and Control Systems, Karlsruhe Institute of Technology (KIT),Karlsruhe,Germany"],"affiliations":[{"raw_affiliation_string":"Institute of Measurement and Control Systems, Karlsruhe Institute of Technology (KIT),Karlsruhe,Germany","institution_ids":["https://openalex.org/I102335020"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5091574711","display_name":"Christoph Stiller","orcid":"https://orcid.org/0000-0003-4165-2075"},"institutions":[{"id":"https://openalex.org/I102335020","display_name":"Karlsruhe Institute of Technology","ror":"https://ror.org/04t3en479","country_code":"DE","type":"education","lineage":["https://openalex.org/I102335020","https://openalex.org/I1305996414"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Christoph Stiller","raw_affiliation_strings":["Institute of Measurement and Control Systems, Karlsruhe Institute of Technology (KIT),Karlsruhe,Germany"],"affiliations":[{"raw_affiliation_string":"Institute of Measurement and Control Systems, Karlsruhe Institute of Technology (KIT),Karlsruhe,Germany","institution_ids":["https://openalex.org/I102335020"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5055443993"],"corresponding_institution_ids":["https://openalex.org/I102335020"],"apc_list":null,"apc_paid":null,"fwci":0.3637,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.64548585,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"827","last_page":"834"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9724000096321106,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9724000096321106,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.9006999731063843,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6830347776412964},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6370288133621216},{"id":"https://openalex.org/keywords/test","display_name":"Test (biology)","score":0.5933738946914673},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.47698527574539185},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4331055283546448},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.38037070631980896},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.13886383175849915},{"id":"https://openalex.org/keywords/structural-engineering","display_name":"Structural engineering","score":0.07433217763900757}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6830347776412964},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6370288133621216},{"id":"https://openalex.org/C2777267654","wikidata":"https://www.wikidata.org/wiki/Q3519023","display_name":"Test (biology)","level":2,"score":0.5933738946914673},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.47698527574539185},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4331055283546448},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.38037070631980896},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.13886383175849915},{"id":"https://openalex.org/C66938386","wikidata":"https://www.wikidata.org/wiki/Q633538","display_name":"Structural engineering","level":1,"score":0.07433217763900757},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iv55156.2024.10588652","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iv55156.2024.10588652","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE Intelligent Vehicles Symposium (IV)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":36,"referenced_works":["https://openalex.org/W41554520","https://openalex.org/W316935178","https://openalex.org/W1424654272","https://openalex.org/W1583837637","https://openalex.org/W1594223874","https://openalex.org/W1995780830","https://openalex.org/W2073787051","https://openalex.org/W2135194391","https://openalex.org/W2156163138","https://openalex.org/W2471883051","https://openalex.org/W2492076227","https://openalex.org/W2735318784","https://openalex.org/W2842089854","https://openalex.org/W2913210897","https://openalex.org/W2914933231","https://openalex.org/W2964177756","https://openalex.org/W2980087597","https://openalex.org/W3003474222","https://openalex.org/W3039563104","https://openalex.org/W3118900686","https://openalex.org/W3193319380","https://openalex.org/W3205292576","https://openalex.org/W3210651683","https://openalex.org/W4212774754","https://openalex.org/W4282981328","https://openalex.org/W4297781990","https://openalex.org/W4383108453","https://openalex.org/W6635261211","https://openalex.org/W6674884181","https://openalex.org/W6696273291","https://openalex.org/W6746419623","https://openalex.org/W6749138962","https://openalex.org/W6768870957","https://openalex.org/W6771598146","https://openalex.org/W6781315541","https://openalex.org/W6811052944"],"related_works":["https://openalex.org/W2961085424","https://openalex.org/W4306674287","https://openalex.org/W3046775127","https://openalex.org/W3107602296","https://openalex.org/W4394896187","https://openalex.org/W3170094116","https://openalex.org/W4386462264","https://openalex.org/W4364306694","https://openalex.org/W4312192474","https://openalex.org/W4283697347"],"abstract_inverted_index":{"Automated":[0],"vehicles":[1],"require":[2],"carefully":[3],"designed":[4],"cost":[5,32,99,117,132,157,166],"functions,":[6,33],"which":[7,40],"are":[8,41,152],"challenging":[9],"to":[10,13,21,43,97,115,154],"specify":[11],"due":[12],"the":[14,17,69,90,122,130,165],"complexity":[15],"of":[16,56,92],"behavior":[18],"they":[19],"need":[20,70],"cover.":[22],"Inverse":[23,82],"reinforcement":[24],"learning":[25],"is":[26],"a":[27,51,64,173],"principled":[28],"methodology":[29,66],"for":[30,54,71,178],"deriving":[31],"but":[34,170],"it":[35],"requires":[36],"high-quality":[37],"expert":[38,73],"demonstrations,":[39],"expensive":[42],"obtain.":[44],"Recently,":[45],"scenario-based":[46,78],"testing":[47],"has":[48],"emerged":[49],"as":[50,95],"promising":[52],"approach":[53,85],"validation":[55,144],"driving":[57,74,181],"behavior.":[58],"In":[59],"this":[60],"paper,":[61],"we":[62],"introduce":[63],"novel":[65],"that":[67,119,129,148],"circumvents":[68],"costly":[72],"demonstrations":[75],"by":[76,136],"harnessing":[77],"testing.":[79],"Our":[80],"Test-Driven":[81],"Reinforcement":[83],"Learning":[84],"leverages":[86],"Bayesian":[87],"inference,":[88],"utilizing":[89],"outcomes":[91],"scenario":[93,124,139,150],"tests":[94,140,151],"observations":[96],"infer":[98],"functions.":[100,158],"We":[101,126],"rigorously":[102],"evaluate":[103],"our":[104],"method":[105],"on":[106],"simulated":[107],"and":[108,111,146,175],"real-world":[109],"scenarios":[110],"demonstrate":[112],"its":[113],"ability":[114],"learn":[116,155],"functions":[118],"successfully":[120],"pass":[121],"respective":[123],"tests.":[125],"also":[127,137,171],"show":[128],"learned":[131],"function":[133,167],"generalizes":[134],"well":[135],"passing":[138],"from":[141],"an":[142],"unseen":[143],"set":[145],"illustrate":[147],"few":[149],"sufficient":[153],"meaningful":[156],"This":[159],"innovative":[160],"framework":[161],"not":[162],"only":[163],"streamlines":[164],"specification":[168],"process":[169],"offers":[172],"cost-effective":[174],"practical":[176],"solution":[177],"advancing":[179],"automated":[180],"systems.":[182]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-12-26T23:08:49.675405","created_date":"2025-10-10T00:00:00"}
