{"id":"https://openalex.org/W4391871279","doi":"https://doi.org/10.1109/tiv.2024.3400597","title":"Provable Traffic Rule Compliance in Safe Reinforcement Learning on the Open Sea","display_name":"Provable Traffic Rule Compliance in Safe Reinforcement Learning on the Open Sea","publication_year":2024,"publication_date":"2024-05-13","ids":{"openalex":"https://openalex.org/W4391871279","doi":"https://doi.org/10.1109/tiv.2024.3400597"},"language":"en","primary_location":{"id":"doi:10.1109/tiv.2024.3400597","is_oa":true,"landing_page_url":"https://doi.org/10.1109/tiv.2024.3400597","pdf_url":"https://ieeexplore.ieee.org/ielx7/7274857/7448921/10530091.pdf","source":{"id":"https://openalex.org/S4210199657","display_name":"IEEE Transactions on Intelligent Vehicles","issn_l":"2379-8858","issn":["2379-8858","2379-8904"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Intelligent Vehicles","raw_type":"journal-article"},"type":"preprint","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://ieeexplore.ieee.org/ielx7/7274857/7448921/10530091.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5065905965","display_name":"Hanna Krasowski","orcid":"https://orcid.org/0000-0002-6730-3802"},"institutions":[{"id":"https://openalex.org/I62916508","display_name":"Technical University of Munich","ror":"https://ror.org/02kkvpp62","country_code":"DE","type":"education","lineage":["https://openalex.org/I62916508"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Hanna Krasowski","raw_affiliation_strings":["Technical University of Munich, Munich, Germany"],"affiliations":[{"raw_affiliation_string":"Technical University of Munich, Munich, Germany","institution_ids":["https://openalex.org/I62916508"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5005383495","display_name":"Matthias Althoff","orcid":"https://orcid.org/0000-0003-3733-842X"},"institutions":[{"id":"https://openalex.org/I62916508","display_name":"Technical University of Munich","ror":"https://ror.org/02kkvpp62","country_code":"DE","type":"education","lineage":["https://openalex.org/I62916508"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Matthias Althoff","raw_affiliation_strings":["Technical University of Munich, Munich, Germany"],"affiliations":[{"raw_affiliation_string":"Technical University of Munich, Munich, Germany","institution_ids":["https://openalex.org/I62916508"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5065905965"],"corresponding_institution_ids":["https://openalex.org/I62916508"],"apc_list":null,"apc_paid":null,"fwci":1.3165,"has_fulltext":true,"cited_by_count":4,"citation_normalized_percentile":{"value":0.7689079,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":99},"biblio":{"volume":"9","issue":"12","first_page":"7617","last_page":"7634"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11622","display_name":"Maritime Navigation and Safety","score":0.9257000088691711,"subfield":{"id":"https://openalex.org/subfields/2212","display_name":"Ocean Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11622","display_name":"Maritime Navigation and Safety","score":0.9257000088691711,"subfield":{"id":"https://openalex.org/subfields/2212","display_name":"Ocean Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7355509400367737},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7161069512367249},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.6259419918060303},{"id":"https://openalex.org/keywords/software-deployment","display_name":"Software deployment","score":0.5735130310058594},{"id":"https://openalex.org/keywords/autonomous-agent","display_name":"Autonomous agent","score":0.41260552406311035},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.40463632345199585},{"id":"https://openalex.org/keywords/operations-research","display_name":"Operations research","score":0.35063546895980835},{"id":"https://openalex.org/keywords/software-engineering","display_name":"Software engineering","score":0.16057711839675903},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.13467463850975037},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.0817006528377533}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7355509400367737},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7161069512367249},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.6259419918060303},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.5735130310058594},{"id":"https://openalex.org/C13687954","wikidata":"https://www.wikidata.org/wiki/Q4826847","display_name":"Autonomous agent","level":2,"score":0.41260552406311035},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.40463632345199585},{"id":"https://openalex.org/C42475967","wikidata":"https://www.wikidata.org/wiki/Q194292","display_name":"Operations research","level":1,"score":0.35063546895980835},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.16057711839675903},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.13467463850975037},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0817006528377533}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/tiv.2024.3400597","is_oa":true,"landing_page_url":"https://doi.org/10.1109/tiv.2024.3400597","pdf_url":"https://ieeexplore.ieee.org/ielx7/7274857/7448921/10530091.pdf","source":{"id":"https://openalex.org/S4210199657","display_name":"IEEE Transactions on Intelligent Vehicles","issn_l":"2379-8858","issn":["2379-8858","2379-8904"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Intelligent Vehicles","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:2402.08502","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2402.08502","pdf_url":"https://arxiv.org/pdf/2402.08502","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"pmh:oai:mediatum.ub.tum.de:node/1743072","is_oa":true,"landing_page_url":"https://mediatum.ub.tum.de/1743072","pdf_url":null,"source":{"id":"https://openalex.org/S4377196330","display_name":"mediaTUM  (Technical University of Munich)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I62916508","host_organization_name":"Technical University of Munich","host_organization_lineage":["https://openalex.org/I62916508"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/tiv.2024.3400597","is_oa":true,"landing_page_url":"https://doi.org/10.1109/tiv.2024.3400597","pdf_url":"https://ieeexplore.ieee.org/ielx7/7274857/7448921/10530091.pdf","source":{"id":"https://openalex.org/S4210199657","display_name":"IEEE Transactions on Intelligent Vehicles","issn_l":"2379-8858","issn":["2379-8858","2379-8904"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Intelligent Vehicles","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/14","display_name":"Life below water","score":0.6700000166893005}],"awards":[{"id":"https://openalex.org/G2398295961","display_name":null,"funder_award_id":"GRK 2428","funder_id":"https://openalex.org/F4320320879","funder_display_name":"Deutsche Forschungsgemeinschaft"}],"funders":[{"id":"https://openalex.org/F4320320879","display_name":"Deutsche Forschungsgemeinschaft","ror":"https://ror.org/018mejw64"},{"id":"https://openalex.org/F4320321114","display_name":"Bundesministerium f\u00fcr Bildung und Forschung","ror":"https://ror.org/04pz7b180"}],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4391871279.pdf"},"referenced_works_count":67,"referenced_works":["https://openalex.org/W2002440441","https://openalex.org/W2042225474","https://openalex.org/W2074547849","https://openalex.org/W2086124410","https://openalex.org/W2139289091","https://openalex.org/W2317713946","https://openalex.org/W2484617215","https://openalex.org/W2492811885","https://openalex.org/W2560882727","https://openalex.org/W2617376550","https://openalex.org/W2737479107","https://openalex.org/W2787908307","https://openalex.org/W2789862859","https://openalex.org/W2790472381","https://openalex.org/W2904263972","https://openalex.org/W2912757393","https://openalex.org/W2954211265","https://openalex.org/W2962702177","https://openalex.org/W2963575966","https://openalex.org/W2967516159","https://openalex.org/W2968120782","https://openalex.org/W2969218722","https://openalex.org/W2974556546","https://openalex.org/W2979089101","https://openalex.org/W2995074243","https://openalex.org/W2999840070","https://openalex.org/W3025711725","https://openalex.org/W3038904154","https://openalex.org/W3065468121","https://openalex.org/W3083914918","https://openalex.org/W3090211586","https://openalex.org/W3093055384","https://openalex.org/W3115737827","https://openalex.org/W3121030992","https://openalex.org/W3127561923","https://openalex.org/W3149053487","https://openalex.org/W3168204680","https://openalex.org/W3173679721","https://openalex.org/W3174398482","https://openalex.org/W3195604129","https://openalex.org/W3206041612","https://openalex.org/W3206889533","https://openalex.org/W3207668814","https://openalex.org/W3210162825","https://openalex.org/W3210290940","https://openalex.org/W3215237054","https://openalex.org/W3215910331","https://openalex.org/W4205368732","https://openalex.org/W4225615381","https://openalex.org/W4303712138","https://openalex.org/W4308080454","https://openalex.org/W4308080772","https://openalex.org/W4312532193","https://openalex.org/W4312726780","https://openalex.org/W4312788366","https://openalex.org/W4324116431","https://openalex.org/W4360868502","https://openalex.org/W4362672763","https://openalex.org/W4382119883","https://openalex.org/W4383112775","https://openalex.org/W4386615302","https://openalex.org/W4388919353","https://openalex.org/W4392030711","https://openalex.org/W6741002519","https://openalex.org/W6743558609","https://openalex.org/W6804601995","https://openalex.org/W6838633502"],"related_works":["https://openalex.org/W2770234245","https://openalex.org/W96612179","https://openalex.org/W4229499248","https://openalex.org/W2566006169","https://openalex.org/W1567818861","https://openalex.org/W2987774938","https://openalex.org/W4256492088","https://openalex.org/W632915154","https://openalex.org/W4206233823","https://openalex.org/W2494202692"],"abstract_inverted_index":{"For":[0],"safe":[1],"operation,":[2],"autonomous":[3,61],"vehicles":[4],"have":[5],"to":[6,27,43,56,106,148],"obey":[7],"traffic":[8,30,78,161,189,195],"rules":[9,35,137,171,196],"that":[10,40],"are":[11,41,67],"set":[12,150],"forth":[13],"in":[14,18,38],"legal":[15,170],"documents":[16],"formulated":[17],"natural":[19],"language.":[20],"Temporal":[21],"logic":[22,34,88],"is":[23,52],"a":[24,53,132,177],"suitable":[25],"concept":[26],"formalize":[28],"such":[29],"rules.":[31,79],"Still,":[32],"temporal":[33,87],"often":[36],"result":[37],"constraints":[39],"hard":[42],"solve":[44],"using":[45],"optimization-based":[46],"motion":[47,58],"planners.":[48],"Reinforcement":[49],"learning":[50],"(RL)":[51],"promising":[54],"method":[55],"find":[57],"plans":[59],"for":[60,113],"vehicles.":[62],"However,":[63],"vanilla":[64,187],"RL":[65,146,191],"algorithms":[66],"based":[68,127],"on":[69,99,109,128,158],"random":[70],"exploration":[71],"and":[72,138,172,183,188,197],"do":[73],"not":[74],"automatically":[75],"comply":[76],"with":[77,131,167],"Our":[80],"approach":[81],"accomplishes":[82],"guaranteed":[83],"rule-compliance":[84],"by":[85],"integrating":[86],"specifications":[89],"into":[90],"RL.":[91],"Specifically,":[92],"we":[93,124],"consider":[94],"the":[95,100,107,110,145,168],"application":[96],"of":[97,151],"vessels":[98],"open":[101],"sea,":[102],"which":[103],"must":[104],"adhere":[105],"Convention":[108],"International":[111],"Regulations":[112],"Preventing":[114],"Collisions":[115],"at":[116],"Sea":[117],"(COLREGS).":[118],"To":[119],"efficiently":[120],"synthesize":[121],"rule-compliant":[122,153],"actions,":[123],"combine":[125],"predicates":[126],"set-based":[129],"prediction":[130],"statechart":[133],"representing":[134],"our":[135,163],"formalized":[136,169],"their":[139],"priorities.":[140],"Action":[141],"masking":[142],"then":[143],"restricts":[144],"agent":[147,164],"this":[149],"verified":[152],"actions.":[154],"In":[155,185],"numerical":[156],"evaluations":[157],"critical":[159],"maritime":[160],"situations,":[162],"always":[165],"complies":[166],"never":[173],"collides":[174],"while":[175],"achieving":[176],"high":[178],"goal-reaching":[179],"rate":[180],"during":[181],"training":[182],"deployment.":[184],"contrast,":[186],"rule-informed":[190],"agents":[192],"frequently":[193],"violate":[194],"collide":[198],"even":[199],"after":[200],"training.":[201]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":2}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
