{"id":"https://openalex.org/W4403678596","doi":"https://doi.org/10.1109/case59546.2024.10711661","title":"Safe Value Functions: Learned Critics as Hard Safety Constraints","display_name":"Safe Value Functions: Learned Critics as Hard Safety Constraints","publication_year":2024,"publication_date":"2024-08-28","ids":{"openalex":"https://openalex.org/W4403678596","doi":"https://doi.org/10.1109/case59546.2024.10711661"},"language":"en","primary_location":{"id":"doi:10.1109/case59546.2024.10711661","is_oa":false,"landing_page_url":"https://doi.org/10.1109/case59546.2024.10711661","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE 20th International Conference on Automation Science and Engineering (CASE)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://discovery.ucl.ac.uk/10201038/1/C49.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5058173109","display_name":"Daniel C. H. Tan","orcid":null},"institutions":[{"id":"https://openalex.org/I45129253","display_name":"University College London","ror":"https://ror.org/02jx3x895","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I45129253"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Daniel C.H. Tan","raw_affiliation_strings":["University College London,Department of Computer Science,London,UK,WC1E 6BT"],"affiliations":[{"raw_affiliation_string":"University College London,Department of Computer Science,London,UK,WC1E 6BT","institution_ids":["https://openalex.org/I45129253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101403836","display_name":"Robert McCarthy","orcid":"https://orcid.org/0000-0002-2140-6988"},"institutions":[{"id":"https://openalex.org/I45129253","display_name":"University College London","ror":"https://ror.org/02jx3x895","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I45129253"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Robert McCarthy","raw_affiliation_strings":["University College London,Department of Computer Science,London,UK,WC1E 6BT"],"affiliations":[{"raw_affiliation_string":"University College London,Department of Computer Science,London,UK,WC1E 6BT","institution_ids":["https://openalex.org/I45129253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079915517","display_name":"Fernando Acero","orcid":null},"institutions":[{"id":"https://openalex.org/I45129253","display_name":"University College London","ror":"https://ror.org/02jx3x895","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I45129253"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Fernando Acero","raw_affiliation_strings":["University College London,Department of Computer Science,London,UK,WC1E 6BT"],"affiliations":[{"raw_affiliation_string":"University College London,Department of Computer Science,London,UK,WC1E 6BT","institution_ids":["https://openalex.org/I45129253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5093900200","display_name":"Andromachi Maria Delfaki","orcid":null},"institutions":[{"id":"https://openalex.org/I45129253","display_name":"University College London","ror":"https://ror.org/02jx3x895","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I45129253"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Andromachi Maria Delfaki","raw_affiliation_strings":["University College London,Department of Computer Science,London,UK,WC1E 6BT"],"affiliations":[{"raw_affiliation_string":"University College London,Department of Computer Science,London,UK,WC1E 6BT","institution_ids":["https://openalex.org/I45129253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100351560","display_name":"Zhibin Li","orcid":"https://orcid.org/0000-0002-6357-7419"},"institutions":[{"id":"https://openalex.org/I45129253","display_name":"University College London","ror":"https://ror.org/02jx3x895","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I45129253"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Zhibin Li","raw_affiliation_strings":["University College London,Department of Computer Science,London,UK,WC1E 6BT"],"affiliations":[{"raw_affiliation_string":"University College London,Department of Computer Science,London,UK,WC1E 6BT","institution_ids":["https://openalex.org/I45129253"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5048122691","display_name":"Dimitrios Kanoulas","orcid":"https://orcid.org/0000-0002-3684-1472"},"institutions":[{"id":"https://openalex.org/I45129253","display_name":"University College London","ror":"https://ror.org/02jx3x895","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I45129253"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Dimitrios Kanoulas","raw_affiliation_strings":["University College London,Department of Computer Science,London,UK,WC1E 6BT"],"affiliations":[{"raw_affiliation_string":"University College London,Department of Computer Science,London,UK,WC1E 6BT","institution_ids":["https://openalex.org/I45129253"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5058173109"],"corresponding_institution_ids":["https://openalex.org/I45129253"],"apc_list":null,"apc_paid":null,"fwci":1.1184,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.84125933,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"2441","last_page":"2448"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11573","display_name":"Risk Perception and Management","score":0.2240999937057495,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11573","display_name":"Risk Perception and Management","score":0.2240999937057495,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10809","display_name":"Occupational Health and Safety Research","score":0.2037999927997589,"subfield":{"id":"https://openalex.org/subfields/3614","display_name":"Radiological and Ultrasound Technology"},"field":{"id":"https://openalex.org/fields/36","display_name":"Health Professions"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T11810","display_name":"Complex Systems and Decision Making","score":0.19499999284744263,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/value","display_name":"Value (mathematics)","score":0.6108124256134033},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.49250373244285583},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.10414868593215942}],"concepts":[{"id":"https://openalex.org/C2776291640","wikidata":"https://www.wikidata.org/wiki/Q2912517","display_name":"Value (mathematics)","level":2,"score":0.6108124256134033},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.49250373244285583},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.10414868593215942}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/case59546.2024.10711661","is_oa":false,"landing_page_url":"https://doi.org/10.1109/case59546.2024.10711661","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE 20th International Conference on Automation Science and Engineering (CASE)","raw_type":"proceedings-article"},{"id":"pmh:oai:eprints.ucl.ac.uk.OAI2:10201038","is_oa":true,"landing_page_url":"https://discovery.ucl.ac.uk/id/eprint/10201038/","pdf_url":"https://discovery.ucl.ac.uk/10201038/1/C49.pdf","source":{"id":"https://openalex.org/S4306400024","display_name":"UCL Discovery (University College London)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I45129253","host_organization_name":"University College London","host_organization_lineage":["https://openalex.org/I45129253"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"In:  2024 IEEE 20th International Conference on Automation Science and Engineering (CASE).  (pp. pp. 2441-2448).  IEEE: Bari, Italy. (2024)","raw_type":"Proceedings paper"}],"best_oa_location":{"id":"pmh:oai:eprints.ucl.ac.uk.OAI2:10201038","is_oa":true,"landing_page_url":"https://discovery.ucl.ac.uk/id/eprint/10201038/","pdf_url":"https://discovery.ucl.ac.uk/10201038/1/C49.pdf","source":{"id":"https://openalex.org/S4306400024","display_name":"UCL Discovery (University College London)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I45129253","host_organization_name":"University College London","host_organization_lineage":["https://openalex.org/I45129253"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"In:  2024 IEEE 20th International Conference on Automation Science and Engineering (CASE).  (pp. pp. 2441-2448).  IEEE: Bari, Italy. (2024)","raw_type":"Proceedings paper"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4403678596.pdf"},"referenced_works_count":76,"referenced_works":["https://openalex.org/W41554520","https://openalex.org/W1518931405","https://openalex.org/W1980569135","https://openalex.org/W2068997299","https://openalex.org/W2158782408","https://openalex.org/W2325770295","https://openalex.org/W2443711627","https://openalex.org/W2531894595","https://openalex.org/W2736601468","https://openalex.org/W2781726626","https://openalex.org/W2784465508","https://openalex.org/W2804791273","https://openalex.org/W2927638312","https://openalex.org/W2966735560","https://openalex.org/W2970795963","https://openalex.org/W2993433457","https://openalex.org/W2996975825","https://openalex.org/W2999905431","https://openalex.org/W3016525976","https://openalex.org/W3033324992","https://openalex.org/W3120475579","https://openalex.org/W3121024268","https://openalex.org/W3131411499","https://openalex.org/W3135239772","https://openalex.org/W3172360140","https://openalex.org/W3195968524","https://openalex.org/W3207110310","https://openalex.org/W4206318793","https://openalex.org/W4221161274","https://openalex.org/W4235396164","https://openalex.org/W4289709949","https://openalex.org/W4292103799","https://openalex.org/W4293545785","https://openalex.org/W4294562617","https://openalex.org/W4298857966","https://openalex.org/W4306311916","https://openalex.org/W4309800374","https://openalex.org/W4315606134","https://openalex.org/W4366458941","https://openalex.org/W4376988891","https://openalex.org/W4387447989","https://openalex.org/W6637967152","https://openalex.org/W6643032878","https://openalex.org/W6684921986","https://openalex.org/W6737893269","https://openalex.org/W6741002519","https://openalex.org/W6747473740","https://openalex.org/W6747790125","https://openalex.org/W6751535212","https://openalex.org/W6751725685","https://openalex.org/W6753691991","https://openalex.org/W6757105609","https://openalex.org/W6767277667","https://openalex.org/W6772931863","https://openalex.org/W6773002119","https://openalex.org/W6776601253","https://openalex.org/W6779265984","https://openalex.org/W6780241948","https://openalex.org/W6780559895","https://openalex.org/W6780587392","https://openalex.org/W6788898170","https://openalex.org/W6795253412","https://openalex.org/W6796589144","https://openalex.org/W6798407072","https://openalex.org/W6801006633","https://openalex.org/W6801971982","https://openalex.org/W6802092367","https://openalex.org/W6803800456","https://openalex.org/W6803914020","https://openalex.org/W6805457603","https://openalex.org/W6805807127","https://openalex.org/W6841950565","https://openalex.org/W6846345420","https://openalex.org/W6847069214","https://openalex.org/W6852522985","https://openalex.org/W6853523444"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"In":[0],"the":[1,35,92,95,103,113,128,138,150,159,195,206],"domain":[2],"of":[3,97,105,116,152,161,165,197],"safety-critical":[4,215],"applications,":[5],"there":[6],"is":[7],"a":[8,55,61,122,133,174],"pressing":[9],"need":[10],"for":[11,75,94,208],"control":[12,23,154,179,199],"methods":[13,180],"that":[14,64,83,125,181],"are":[15,182],"not":[16],"only":[17],"scalable":[18,184],"but":[19],"also":[20],"verifiable.":[21],"Traditional":[22],"strategies,":[24],"which":[25],"rely":[26],"on":[27,72,86],"certification":[28],"processes,":[29],"often":[30],"struggle":[31],"to":[32,34,120,131,141,146,185,190],"adapt":[33],"complexity":[36],"inherent":[37],"in":[38,49,149,214],"these":[39],"systems.":[40],"Conversely,":[41],"while":[42],"reinforcement":[43],"learning":[44],"(RL)":[45],"techniques":[46],"show":[47],"promise":[48],"scaling":[50],"effectively,":[51],"their":[52],"verifiability":[53],"remains":[54],"significant":[56,175],"challenge.":[57],"Our":[58,88,135],"research":[59,172],"introduces":[60],"novel":[62],"approach":[63,136],"bridges":[65],"this":[66],"gap":[67],"by":[68,167],"offering":[69],"strong":[70],"guarantees":[71],"constraint":[73],"satisfaction":[74],"general":[76],"dynamical":[77],"systems,":[78],"diverging":[79],"from":[80],"previous":[81],"works":[82],"primarily":[84],"focus":[85],"certification.":[87],"study":[89],"delves":[90],"into":[91],"prerequisites":[93],"verification":[96,164,192],"learned":[98],"Value":[99],"Functions":[100],"(VFs)":[101],"through":[102],"lens":[104],"Control":[106],"Barrier":[107],"Function":[108],"(CBF)":[109],"attributes.":[110],"We":[111],"leverage":[112],"foundational":[114],"principles":[115],"safe":[117,147],"VFs":[118,166],"(SVFs)":[119],"design":[121],"reward":[123],"mechanism":[124],"inherently":[126],"guides":[127],"optimal":[129],"VF":[130,140],"embody":[132],"CBF.":[134],"allows":[137],"resulting":[139],"restrict":[142],"subsequent":[143],"policy":[144],"actions":[145],"trajectories,":[148],"context":[151],"complex":[153,186],"problems.":[155],"Furthermore,":[156],"we":[157,204],"investigate":[158],"feasibility":[160],"conducting":[162],"formal":[163],"exploiting":[168],"CBF":[169],"properties.":[170],"This":[171],"marks":[173],"advancement":[176],"towards":[177],"achieving":[178],"both":[183],"systems":[187],"and":[188,211,219],"amenable":[189],"rigorous":[191],"processes.":[193],"Through":[194],"integration":[196],"learning-based":[198],"with":[200],"traditional":[201],"safety":[202],"guarantees,":[203],"pave":[205],"way":[207],"more":[209],"reliable":[210],"efficient":[212],"solutions":[213],"applications.":[216],"The":[217],"code":[218],"supplementary":[220],"video":[221],"can":[222],"be":[223],"found":[224],"under":[225],"our":[226],"webpage<sup":[227],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[228],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">1</sup>.":[229]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
