{"id":"https://openalex.org/W4285601900","doi":"https://doi.org/10.24963/ijcai.2022/72","title":"Search-Based Testing of Reinforcement Learning","display_name":"Search-Based Testing of Reinforcement Learning","publication_year":2022,"publication_date":"2022-07-01","ids":{"openalex":"https://openalex.org/W4285601900","doi":"https://doi.org/10.24963/ijcai.2022/72"},"language":"en","primary_location":{"id":"doi:10.24963/ijcai.2022/72","is_oa":true,"landing_page_url":"https://doi.org/10.24963/ijcai.2022/72","pdf_url":"https://www.ijcai.org/proceedings/2022/0072.pdf","source":{"id":"https://openalex.org/S4363608755","display_name":"Proceedings of the Thirty-First International Joint Conference on Artificial Intelligence","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Thirty-First International Joint Conference on Artificial Intelligence","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://www.ijcai.org/proceedings/2022/0072.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5078635542","display_name":"Martin Tappler","orcid":"https://orcid.org/0000-0002-4193-5609"},"institutions":[{"id":"https://openalex.org/I4210123126","display_name":"Silicon Austria Labs (Austria)","ror":"https://ror.org/03b1qgn79","country_code":"AT","type":"company","lineage":["https://openalex.org/I4210123126"]},{"id":"https://openalex.org/I4092182","display_name":"Graz University of Technology","ror":"https://ror.org/00d7xrm67","country_code":"AT","type":"education","lineage":["https://openalex.org/I4092182"]},{"id":"https://openalex.org/I4210128818","display_name":"Institute of Software","ror":"https://ror.org/033dfsn42","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210128818"]}],"countries":["AT","CN"],"is_corresponding":true,"raw_author_name":"Martin Tappler","raw_affiliation_strings":["Institute of Software Technology, Graz University of Technology","TU Graz-SAL DES Lab,Silicon Austria Labs, Graz, Austria","Institute of Software Technology, Graz University of Technology; TU Graz-SAL DES Lab,Silicon Austria Labs, Graz, Austria"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute of Software Technology, Graz University of Technology","institution_ids":["https://openalex.org/I4092182","https://openalex.org/I4210128818"]},{"raw_affiliation_string":"TU Graz-SAL DES Lab,Silicon Austria Labs, Graz, Austria","institution_ids":["https://openalex.org/I4210123126","https://openalex.org/I4092182"]},{"raw_affiliation_string":"Institute of Software Technology, Graz University of Technology; TU Graz-SAL DES Lab,Silicon Austria Labs, Graz, Austria","institution_ids":["https://openalex.org/I4210123126","https://openalex.org/I4092182"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003307281","display_name":"Filip Cano C\u00f3rdoba","orcid":null},"institutions":[{"id":"https://openalex.org/I4092182","display_name":"Graz University of Technology","ror":"https://ror.org/00d7xrm67","country_code":"AT","type":"education","lineage":["https://openalex.org/I4092182"]}],"countries":["AT"],"is_corresponding":false,"raw_author_name":"Filip Cano C\u00f3rdoba","raw_affiliation_strings":["Institute of Applied Information Processing and Communications, Graz University of Technology"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute of Applied Information Processing and Communications, Graz University of Technology","institution_ids":["https://openalex.org/I4092182"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009450062","display_name":"Bernhard K. Aichernig","orcid":"https://orcid.org/0000-0002-3484-5584"},"institutions":[{"id":"https://openalex.org/I4210128818","display_name":"Institute of Software","ror":"https://ror.org/033dfsn42","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210128818"]},{"id":"https://openalex.org/I4210123126","display_name":"Silicon Austria Labs (Austria)","ror":"https://ror.org/03b1qgn79","country_code":"AT","type":"company","lineage":["https://openalex.org/I4210123126"]},{"id":"https://openalex.org/I4092182","display_name":"Graz University of Technology","ror":"https://ror.org/00d7xrm67","country_code":"AT","type":"education","lineage":["https://openalex.org/I4092182"]}],"countries":["AT","CN"],"is_corresponding":false,"raw_author_name":"Bernhard K. Aichernig","raw_affiliation_strings":["Institute of Software Technology, Graz University of Technology","TU Graz-SAL DES Lab,Silicon Austria Labs, Graz, Austria","Institute of Software Technology, Graz University of Technology; TU Graz-SAL DES Lab,Silicon Austria Labs, Graz, Austria"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute of Software Technology, Graz University of Technology","institution_ids":["https://openalex.org/I4092182","https://openalex.org/I4210128818"]},{"raw_affiliation_string":"TU Graz-SAL DES Lab,Silicon Austria Labs, Graz, Austria","institution_ids":["https://openalex.org/I4210123126","https://openalex.org/I4092182"]},{"raw_affiliation_string":"Institute of Software Technology, Graz University of Technology; TU Graz-SAL DES Lab,Silicon Austria Labs, Graz, Austria","institution_ids":["https://openalex.org/I4210123126","https://openalex.org/I4092182"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5042655793","display_name":"Bettina K\u00f6nighofer","orcid":"https://orcid.org/0000-0001-5183-5452"},"institutions":[{"id":"https://openalex.org/I4092182","display_name":"Graz University of Technology","ror":"https://ror.org/00d7xrm67","country_code":"AT","type":"education","lineage":["https://openalex.org/I4092182"]}],"countries":["AT"],"is_corresponding":false,"raw_author_name":"Bettina K\u00f6nighofer","raw_affiliation_strings":["Institute of Applied Information Processing and Communications, Graz University of Technology","Lamarr Security Research","Institute of Applied Information Processing and Communications, Graz University of Technology; Lamarr Security Research"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute of Applied Information Processing and Communications, Graz University of Technology","institution_ids":["https://openalex.org/I4092182"]},{"raw_affiliation_string":"Lamarr Security Research","institution_ids":[]},{"raw_affiliation_string":"Institute of Applied Information Processing and Communications, Graz University of Technology; Lamarr Security Research","institution_ids":["https://openalex.org/I4092182"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5078635542"],"corresponding_institution_ids":["https://openalex.org/I4092182","https://openalex.org/I4210123126","https://openalex.org/I4210128818"],"apc_list":null,"apc_paid":null,"fwci":2.4934,"has_fulltext":true,"cited_by_count":25,"citation_normalized_percentile":{"value":0.9109992,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"503","last_page":"510"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11574","display_name":"Artificial Intelligence in Games","score":0.9962000250816345,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11674","display_name":"Sports Analytics and Performance","score":0.9824000000953674,"subfield":{"id":"https://openalex.org/subfields/2002","display_name":"Economics and Econometrics"},"field":{"id":"https://openalex.org/fields/20","display_name":"Economics, Econometrics and Finance"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.848629355430603},{"id":"https://openalex.org/keywords/fuzz-testing","display_name":"Fuzz testing","score":0.8173365592956543},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.768873929977417},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5886972546577454},{"id":"https://openalex.org/keywords/trace","display_name":"TRACE (psycholinguistics)","score":0.5584118962287903},{"id":"https://openalex.org/keywords/variety","display_name":"Variety (cybernetics)","score":0.546563982963562},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.538598358631134},{"id":"https://openalex.org/keywords/backtracking","display_name":"Backtracking","score":0.5154550671577454},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5001335144042969},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.45115602016448975},{"id":"https://openalex.org/keywords/boundary","display_name":"Boundary (topology)","score":0.4416605532169342},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.1709733009338379},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.13316544890403748},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.10960763692855835},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.10006481409072876}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.848629355430603},{"id":"https://openalex.org/C111065885","wikidata":"https://www.wikidata.org/wiki/Q1189053","display_name":"Fuzz testing","level":3,"score":0.8173365592956543},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.768873929977417},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5886972546577454},{"id":"https://openalex.org/C75291252","wikidata":"https://www.wikidata.org/wiki/Q1315756","display_name":"TRACE (psycholinguistics)","level":2,"score":0.5584118962287903},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.546563982963562},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.538598358631134},{"id":"https://openalex.org/C156884757","wikidata":"https://www.wikidata.org/wiki/Q798554","display_name":"Backtracking","level":2,"score":0.5154550671577454},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5001335144042969},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.45115602016448975},{"id":"https://openalex.org/C62354387","wikidata":"https://www.wikidata.org/wiki/Q875399","display_name":"Boundary (topology)","level":2,"score":0.4416605532169342},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.1709733009338379},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.13316544890403748},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.10960763692855835},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.10006481409072876},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.24963/ijcai.2022/72","is_oa":true,"landing_page_url":"https://doi.org/10.24963/ijcai.2022/72","pdf_url":"https://www.ijcai.org/proceedings/2022/0072.pdf","source":{"id":"https://openalex.org/S4363608755","display_name":"Proceedings of the Thirty-First International Joint Conference on Artificial Intelligence","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Thirty-First International Joint Conference on Artificial Intelligence","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.24963/ijcai.2022/72","is_oa":true,"landing_page_url":"https://doi.org/10.24963/ijcai.2022/72","pdf_url":"https://www.ijcai.org/proceedings/2022/0072.pdf","source":{"id":"https://openalex.org/S4363608755","display_name":"Proceedings of the Thirty-First International Joint Conference on Artificial Intelligence","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Thirty-First International Joint Conference on Artificial Intelligence","raw_type":"proceedings-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions","score":0.5199999809265137}],"awards":[{"id":"https://openalex.org/G1364539167","display_name":"FOUNDATIONS FOR CONTINUOUS ENGINEERING OF TRUSTWORTHY AUTONOMY","funder_award_id":"956123","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"},{"id":"https://openalex.org/G7842005466","display_name":null,"funder_award_id":"Horizon 2020","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"}],"funders":[{"id":"https://openalex.org/F4320310430","display_name":"TU Graz, Internationale Beziehungen und Mobilit\u00e4tsprogramme","ror":"https://ror.org/00d7xrm67"},{"id":"https://openalex.org/F4320320300","display_name":"European Commission","ror":"https://ror.org/00k4n6c32"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4285601900.pdf","grobid_xml":"https://content.openalex.org/works/W4285601900.grobid-xml"},"referenced_works_count":38,"referenced_works":["https://openalex.org/W41554520","https://openalex.org/W1524053243","https://openalex.org/W1845972764","https://openalex.org/W2115668428","https://openalex.org/W2138076011","https://openalex.org/W2150468603","https://openalex.org/W2257979135","https://openalex.org/W2744647809","https://openalex.org/W2751422670","https://openalex.org/W2753704268","https://openalex.org/W2781585732","https://openalex.org/W2804337238","https://openalex.org/W2885847999","https://openalex.org/W2888307014","https://openalex.org/W2963054787","https://openalex.org/W2963064278","https://openalex.org/W2963575966","https://openalex.org/W2989847975","https://openalex.org/W2994987245","https://openalex.org/W3003533476","https://openalex.org/W3037871539","https://openalex.org/W3046946156","https://openalex.org/W3091816902","https://openalex.org/W3099444373","https://openalex.org/W3100935330","https://openalex.org/W3103780890","https://openalex.org/W3118210634","https://openalex.org/W3127561923","https://openalex.org/W3185656037","https://openalex.org/W3194351501","https://openalex.org/W3197485521","https://openalex.org/W3208566226","https://openalex.org/W3213434944","https://openalex.org/W4214717370","https://openalex.org/W4287018575","https://openalex.org/W4394666657","https://openalex.org/W6791858558","https://openalex.org/W6864014924"],"related_works":["https://openalex.org/W2511770387","https://openalex.org/W3120811337","https://openalex.org/W2766647240","https://openalex.org/W4385301282","https://openalex.org/W2990186179","https://openalex.org/W3203597304","https://openalex.org/W4248424560","https://openalex.org/W4210660460","https://openalex.org/W3119380829","https://openalex.org/W4288084466"],"abstract_inverted_index":{"Evaluation":[0],"of":[1,12,19,28,44,54,81,117,135,144,153],"deep":[2,29,55],"reinforcement":[3],"learning":[4],"(RL)":[5],"is":[6,147],"inherently":[7],"challenging.":[8],"Especially":[9],"the":[10,16,26,50,75,82,98,129,141,145,150,154],"opaqueness":[11],"learned":[13],"policies":[14],"and":[15,22,52],"stochastic":[17],"nature":[18],"both":[20],"agents":[21,31],"environments":[23],"make":[24],"testing":[25,37,161],"behavior":[27],"RL":[30,56,76,99,164],"difficult.":[32],"We":[33,90,157],"present":[34],"a":[35,41,64,70,114,132],"search-based":[36,160],"framework":[38,62],"that":[39,67,73,94],"enables":[40],"wide":[42,133],"range":[43],"novel":[45],"analysis":[46],"capabilities":[47],"for":[48,69,165],"evaluating":[49],"safety":[51,59,92],"performance":[53,110,143,152],"agents.":[57],"For":[58,108],"testing,":[60,111],"our":[61,159],"utilizes":[63],"search":[65],"algorithm":[66],"searches":[68],"reference":[71],"trace":[72],"solves":[74],"task.":[77],"The":[78],"backtracking":[79],"states":[80,138],"search,":[83],"called":[84],"boundary":[85,106],"states,":[86],"pose":[87],"safety-critical":[88,102],"situations.":[89],"create":[91,113],"test-suites":[93],"evaluate":[95],"how":[96],"well":[97],"agent":[100,130,146],"escapes":[101],"situations":[103],"near":[104],"these":[105],"states.":[107],"robust":[109],"we":[112],"diverse":[115],"set":[116],"traces":[118,124],"via":[119],"fuzz":[120,123,155],"testing.":[121],"These":[122],"are":[125],"used":[126],"to":[127,149],"bring":[128],"into":[131],"variety":[134],"potentially":[136],"unknown":[137],"from":[139],"which":[140],"average":[142,151],"compared":[148],"traces.":[156],"apply":[158],"approach":[162],"on":[163],"Nintendo's":[166],"Super":[167],"Mario":[168],"Bros.":[169]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":5},{"year":2024,"cited_by_count":9},{"year":2023,"cited_by_count":8},{"year":2022,"cited_by_count":2}],"updated_date":"2026-05-19T08:33:51.333923","created_date":"2025-10-10T00:00:00"}
