{"id":"https://openalex.org/W4285190300","doi":"https://doi.org/10.1007/978-3-031-06773-0_10","title":"Verified Probabilistic Policies for\u00a0Deep Reinforcement Learning","display_name":"Verified Probabilistic Policies for\u00a0Deep Reinforcement Learning","publication_year":2022,"publication_date":"2022-01-01","ids":{"openalex":"https://openalex.org/W4285190300","doi":"https://doi.org/10.1007/978-3-031-06773-0_10"},"language":"en","primary_location":{"id":"doi:10.1007/978-3-031-06773-0_10","is_oa":false,"landing_page_url":"https://doi.org/10.1007/978-3-031-06773-0_10","pdf_url":null,"source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://research.birmingham.ac.uk/en/publications/6cac3992-ce64-4986-8320-22695d114a46","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5081767752","display_name":"Edoardo Bacci","orcid":"https://orcid.org/0000-0002-0367-898X"},"institutions":[{"id":"https://openalex.org/I79619799","display_name":"University of Birmingham","ror":"https://ror.org/03angcq70","country_code":"GB","type":"education","lineage":["https://openalex.org/I79619799"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Edoardo Bacci","raw_affiliation_strings":["University of Birmingham, Birmingham, UK"],"affiliations":[{"raw_affiliation_string":"University of Birmingham, Birmingham, UK","institution_ids":["https://openalex.org/I79619799"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5036097359","display_name":"David Parker","orcid":"https://orcid.org/0000-0003-4137-8862"},"institutions":[{"id":"https://openalex.org/I79619799","display_name":"University of Birmingham","ror":"https://ror.org/03angcq70","country_code":"GB","type":"education","lineage":["https://openalex.org/I79619799"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"David Parker","raw_affiliation_strings":["University of Birmingham, Birmingham, UK"],"affiliations":[{"raw_affiliation_string":"University of Birmingham, Birmingham, UK","institution_ids":["https://openalex.org/I79619799"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5081767752"],"corresponding_institution_ids":["https://openalex.org/I79619799"],"apc_list":{"value":5000,"currency":"EUR","value_usd":5392},"apc_paid":null,"fwci":5.3105,"has_fulltext":false,"cited_by_count":9,"citation_normalized_percentile":{"value":0.96158117,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"193","last_page":"212"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10142","display_name":"Formal Methods in Verification","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10142","display_name":"Formal Methods in Verification","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9735999703407288,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8764429092407227},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.7711215019226074},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7493160367012024},{"id":"https://openalex.org/keywords/markov-decision-process","display_name":"Markov decision process","score":0.7317680716514587},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5935627818107605},{"id":"https://openalex.org/keywords/abstraction","display_name":"Abstraction","score":0.5552864074707031},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.4578913152217865},{"id":"https://openalex.org/keywords/adversarial-system","display_name":"Adversarial system","score":0.4515588879585266},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3905593752861023},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.34251055121421814},{"id":"https://openalex.org/keywords/markov-process","display_name":"Markov process","score":0.3215912878513336},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.08394932746887207}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8764429092407227},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.7711215019226074},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7493160367012024},{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.7317680716514587},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5935627818107605},{"id":"https://openalex.org/C124304363","wikidata":"https://www.wikidata.org/wiki/Q673661","display_name":"Abstraction","level":2,"score":0.5552864074707031},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.4578913152217865},{"id":"https://openalex.org/C37736160","wikidata":"https://www.wikidata.org/wiki/Q1801315","display_name":"Adversarial system","level":2,"score":0.4515588879585266},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3905593752861023},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.34251055121421814},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.3215912878513336},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.08394932746887207},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1007/978-3-031-06773-0_10","is_oa":false,"landing_page_url":"https://doi.org/10.1007/978-3-031-06773-0_10","pdf_url":null,"source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"},{"id":"pmh:oai:pure.atira.dk:openaire_cris_publications/6cac3992-ce64-4986-8320-22695d114a46","is_oa":true,"landing_page_url":"https://research.birmingham.ac.uk/en/publications/6cac3992-ce64-4986-8320-22695d114a46","pdf_url":null,"source":{"id":"https://openalex.org/S4306402634","display_name":"University of Birmingham Research Portal (University of Birmingham)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I79619799","host_organization_name":"University of Birmingham","host_organization_lineage":["https://openalex.org/I79619799"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Bacci, E & Parker, D 2022, Verified probabilistic policies for deep reinforcement learning. in J V Deshmukh, K Havelund & I Perez (eds), NASA Formal Methods - 14th International Symposium, NFM 2022, Proceedings : 14th International Symposium, NFM 2022, Pasadena, CA, USA, May 24\u201327, 2022, Proceedings. vol. 13260, Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics), vol. 13260 LNCS, Springer, Cham, pp. 193-212, NASA Formal Methods 2022, Pasadena, California, United States, 24/05/22. https://doi.org/10.1007/978-3-031-06773-0_10","raw_type":"contributionToPeriodical"}],"best_oa_location":{"id":"pmh:oai:pure.atira.dk:openaire_cris_publications/6cac3992-ce64-4986-8320-22695d114a46","is_oa":true,"landing_page_url":"https://research.birmingham.ac.uk/en/publications/6cac3992-ce64-4986-8320-22695d114a46","pdf_url":null,"source":{"id":"https://openalex.org/S4306402634","display_name":"University of Birmingham Research Portal (University of Birmingham)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I79619799","host_organization_name":"University of Birmingham","host_organization_lineage":["https://openalex.org/I79619799"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Bacci, E & Parker, D 2022, Verified probabilistic policies for deep reinforcement learning. in J V Deshmukh, K Havelund & I Perez (eds), NASA Formal Methods - 14th International Symposium, NFM 2022, Proceedings : 14th International Symposium, NFM 2022, Pasadena, CA, USA, May 24\u201327, 2022, Proceedings. vol. 13260, Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics), vol. 13260 LNCS, Springer, Cham, pp. 193-212, NASA Formal Methods 2022, Pasadena, California, United States, 24/05/22. https://doi.org/10.1007/978-3-031-06773-0_10","raw_type":"contributionToPeriodical"},"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.7300000190734863,"id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":39,"referenced_works":["https://openalex.org/W1497573972","https://openalex.org/W1507199453","https://openalex.org/W1834963927","https://openalex.org/W1862398452","https://openalex.org/W1972910244","https://openalex.org/W1975219867","https://openalex.org/W2052092737","https://openalex.org/W2125299871","https://openalex.org/W2157807654","https://openalex.org/W2260756217","https://openalex.org/W2575705757","https://openalex.org/W2602950602","https://openalex.org/W2787908307","https://openalex.org/W2798694585","https://openalex.org/W2811374584","https://openalex.org/W2883622352","https://openalex.org/W2906997088","https://openalex.org/W2921516508","https://openalex.org/W2953466973","https://openalex.org/W2963575966","https://openalex.org/W2963600714","https://openalex.org/W2966735560","https://openalex.org/W2967595108","https://openalex.org/W2968983352","https://openalex.org/W2981739602","https://openalex.org/W3082528606","https://openalex.org/W3093055384","https://openalex.org/W3099114572","https://openalex.org/W3104371626","https://openalex.org/W3152346276","https://openalex.org/W3159199672","https://openalex.org/W3165816975","https://openalex.org/W3173598197","https://openalex.org/W3215640983","https://openalex.org/W3216656735","https://openalex.org/W4230164823","https://openalex.org/W4283819375","https://openalex.org/W6675354045","https://openalex.org/W6814003322"],"related_works":["https://openalex.org/W3096874164","https://openalex.org/W2937181779","https://openalex.org/W2386410636","https://openalex.org/W1985560493","https://openalex.org/W2357975469","https://openalex.org/W2145363145","https://openalex.org/W1626977535","https://openalex.org/W2341346307","https://openalex.org/W4225269853","https://openalex.org/W3168977894"],"abstract_inverted_index":null,"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":3},{"year":2022,"cited_by_count":2}],"updated_date":"2026-04-18T07:56:08.524223","created_date":"2025-10-10T00:00:00"}
