{"id":"https://openalex.org/W3130386886","doi":"https://doi.org/10.1109/iros45743.2020.9341589","title":"Markov Decision Processes with Unknown State Feature Values for Safe Exploration using Gaussian Processes","display_name":"Markov Decision Processes with Unknown State Feature Values for Safe Exploration using Gaussian Processes","publication_year":2020,"publication_date":"2020-10-24","ids":{"openalex":"https://openalex.org/W3130386886","doi":"https://doi.org/10.1109/iros45743.2020.9341589","mag":"3130386886"},"language":"en","primary_location":{"id":"doi:10.1109/iros45743.2020.9341589","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros45743.2020.9341589","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://research.manchester.ac.uk/en/publications/ae2bc1d9-65f5-4114-b4f5-39d74f89fede","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5086516575","display_name":"Matthew Budd","orcid":"https://orcid.org/0000-0002-7798-8438"},"institutions":[{"id":"https://openalex.org/I40120149","display_name":"University of Oxford","ror":"https://ror.org/052gg0110","country_code":"GB","type":"education","lineage":["https://openalex.org/I40120149"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Matthew Budd","raw_affiliation_strings":["Dept. of Engineering Science, University of Oxford"],"affiliations":[{"raw_affiliation_string":"Dept. of Engineering Science, University of Oxford","institution_ids":["https://openalex.org/I40120149"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053556869","display_name":"Bruno Lacerda","orcid":"https://orcid.org/0000-0003-0862-331X"},"institutions":[{"id":"https://openalex.org/I40120149","display_name":"University of Oxford","ror":"https://ror.org/052gg0110","country_code":"GB","type":"education","lineage":["https://openalex.org/I40120149"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Bruno Lacerda","raw_affiliation_strings":["Dept. of Engineering Science, University of Oxford"],"affiliations":[{"raw_affiliation_string":"Dept. of Engineering Science, University of Oxford","institution_ids":["https://openalex.org/I40120149"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063524295","display_name":"Paul Duckworth","orcid":"https://orcid.org/0000-0001-9052-6919"},"institutions":[{"id":"https://openalex.org/I40120149","display_name":"University of Oxford","ror":"https://ror.org/052gg0110","country_code":"GB","type":"education","lineage":["https://openalex.org/I40120149"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Paul Duckworth","raw_affiliation_strings":["Dept. of Engineering Science, University of Oxford"],"affiliations":[{"raw_affiliation_string":"Dept. of Engineering Science, University of Oxford","institution_ids":["https://openalex.org/I40120149"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102970482","display_name":"Andrew West","orcid":"https://orcid.org/0000-0003-4553-8640"},"institutions":[{"id":"https://openalex.org/I28407311","display_name":"University of Manchester","ror":"https://ror.org/027m9bs27","country_code":"GB","type":"education","lineage":["https://openalex.org/I28407311"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Andrew West","raw_affiliation_strings":["Dept. of Electrical and Electronic Engineering, University of Manchester"],"affiliations":[{"raw_affiliation_string":"Dept. of Electrical and Electronic Engineering, University of Manchester","institution_ids":["https://openalex.org/I28407311"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011590665","display_name":"Barry Lennox","orcid":"https://orcid.org/0000-0003-0905-8324"},"institutions":[{"id":"https://openalex.org/I28407311","display_name":"University of Manchester","ror":"https://ror.org/027m9bs27","country_code":"GB","type":"education","lineage":["https://openalex.org/I28407311"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Barry Lennox","raw_affiliation_strings":["Dept. of Electrical and Electronic Engineering, University of Manchester"],"affiliations":[{"raw_affiliation_string":"Dept. of Electrical and Electronic Engineering, University of Manchester","institution_ids":["https://openalex.org/I28407311"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5059686746","display_name":"Nick Hawes","orcid":"https://orcid.org/0000-0002-7556-6098"},"institutions":[{"id":"https://openalex.org/I40120149","display_name":"University of Oxford","ror":"https://ror.org/052gg0110","country_code":"GB","type":"education","lineage":["https://openalex.org/I40120149"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Nick Hawes","raw_affiliation_strings":["Dept. of Engineering Science, University of Oxford"],"affiliations":[{"raw_affiliation_string":"Dept. of Engineering Science, University of Oxford","institution_ids":["https://openalex.org/I40120149"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5086516575"],"corresponding_institution_ids":["https://openalex.org/I40120149"],"apc_list":null,"apc_paid":null,"fwci":1.2234,"has_fulltext":false,"cited_by_count":14,"citation_normalized_percentile":{"value":0.8475232,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"7344","last_page":"7350"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12814","display_name":"Gaussian Processes and Bayesian Inference","score":0.9973000288009644,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12814","display_name":"Gaussian Processes and Bayesian Inference","score":0.9973000288009644,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10711","display_name":"Target Tracking and Data Fusion in Sensor Networks","score":0.9799000024795532,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10876","display_name":"Fault Detection and Control Systems","score":0.9764999747276306,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6238037347793579},{"id":"https://openalex.org/keywords/markov-process","display_name":"Markov process","score":0.5520209074020386},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5503409504890442},{"id":"https://openalex.org/keywords/markov-chain","display_name":"Markov chain","score":0.5252330303192139},{"id":"https://openalex.org/keywords/state","display_name":"State (computer science)","score":0.5206717252731323},{"id":"https://openalex.org/keywords/gaussian","display_name":"Gaussian","score":0.5146361589431763},{"id":"https://openalex.org/keywords/gaussian-process","display_name":"Gaussian process","score":0.5130630731582642},{"id":"https://openalex.org/keywords/markov-decision-process","display_name":"Markov decision process","score":0.48630771040916443},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.46507737040519714},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.36332035064697266},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3522570729255676},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.32746434211730957},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.27356892824172974},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.19699198007583618},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.14698761701583862}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6238037347793579},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.5520209074020386},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5503409504890442},{"id":"https://openalex.org/C98763669","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov chain","level":2,"score":0.5252330303192139},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.5206717252731323},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.5146361589431763},{"id":"https://openalex.org/C61326573","wikidata":"https://www.wikidata.org/wiki/Q1496376","display_name":"Gaussian process","level":3,"score":0.5130630731582642},{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.48630771040916443},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.46507737040519714},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.36332035064697266},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3522570729255676},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.32746434211730957},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.27356892824172974},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.19699198007583618},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.14698761701583862},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1109/iros45743.2020.9341589","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros45743.2020.9341589","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},{"id":"pmh:oai:pure.atira.dk:openaire/ae2bc1d9-65f5-4114-b4f5-39d74f89fede","is_oa":true,"landing_page_url":"https://research.manchester.ac.uk/en/publications/ae2bc1d9-65f5-4114-b4f5-39d74f89fede","pdf_url":null,"source":{"id":"https://openalex.org/S4306400662","display_name":"Research Explorer (The University of Manchester)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I28407311","host_organization_name":"University of Manchester","host_organization_lineage":["https://openalex.org/I28407311"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Budd, M, Lacerda, B, Duckworth, P, West, A, Lennox, B & Hawes, N 2020, Markov Decision Processes with Unknown State Feature Values for Safe Exploration using Gaussian Processes. in 2020 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS). IEEE, pp. 7344-7350. https://doi.org/10.1109/IROS45743.2020.9341589","raw_type":"info:eu-repo/semantics/publishedVersion"},{"id":"pmh:oai:ora.ox.ac.uk:uuid:f790bb7f-5f16-4aa2-af7f-43f759a57648","is_oa":false,"landing_page_url":"https://ora.ox.ac.uk/objects/uuid:f790bb7f-5f16-4aa2-af7f-43f759a57648","pdf_url":null,"source":{"id":"https://openalex.org/S4306402636","display_name":"Oxford University Research Archive (ORA) (University of Oxford)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I40120149","host_organization_name":"University of Oxford","host_organization_lineage":["https://openalex.org/I40120149"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Symplectic Elements","raw_type":"Conference item"},{"id":"pmh:oai:pure.atira.dk:publications/ae2bc1d9-65f5-4114-b4f5-39d74f89fede","is_oa":false,"landing_page_url":"https://www.research.manchester.ac.uk/portal/en/publications/markov-decision-processes-with-unknown-state-feature-values-for-safe-exploration-using-gaussian-processes(ae2bc1d9-65f5-4114-b4f5-39d74f89fede).html","pdf_url":null,"source":{"id":"https://openalex.org/S4306400662","display_name":"Research Explorer (The University of Manchester)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I28407311","host_organization_name":"University of Manchester","host_organization_lineage":["https://openalex.org/I28407311"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":""}],"best_oa_location":{"id":"pmh:oai:pure.atira.dk:openaire/ae2bc1d9-65f5-4114-b4f5-39d74f89fede","is_oa":true,"landing_page_url":"https://research.manchester.ac.uk/en/publications/ae2bc1d9-65f5-4114-b4f5-39d74f89fede","pdf_url":null,"source":{"id":"https://openalex.org/S4306400662","display_name":"Research Explorer (The University of Manchester)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I28407311","host_organization_name":"University of Manchester","host_organization_lineage":["https://openalex.org/I28407311"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Budd, M, Lacerda, B, Duckworth, P, West, A, Lennox, B & Hawes, N 2020, Markov Decision Processes with Unknown State Feature Values for Safe Exploration using Gaussian Processes. in 2020 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS). IEEE, pp. 7344-7350. https://doi.org/10.1109/IROS45743.2020.9341589","raw_type":"info:eu-repo/semantics/publishedVersion"},"sustainable_development_goals":[{"score":0.4399999976158142,"display_name":"Life in Land","id":"https://metadata.un.org/sdg/15"}],"awards":[{"id":"https://openalex.org/G2513151266","display_name":null,"funder_award_id":"EP/R026084","funder_id":"https://openalex.org/F4320314731","funder_display_name":"UK Research and Innovation"},{"id":"https://openalex.org/G2838024195","display_name":"UK Robotics and Artificial Intelligence Hub for Offshore Energy Asset Integrity Management","funder_award_id":"EP/R026173/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G2898516364","display_name":null,"funder_award_id":"EP/R026084","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G4483049737","display_name":null,"funder_award_id":"EP/R026173/1","funder_id":"https://openalex.org/F4320334245","funder_display_name":"Offshore Robotics for Certification of Assets"},{"id":"https://openalex.org/G6465377262","display_name":"Robotics and Artificial Intelligence for Nuclear (RAIN)","funder_award_id":"EP/R026084/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G6732448074","display_name":null,"funder_award_id":"EP/R026084/1","funder_id":"https://openalex.org/F4320314731","funder_display_name":"UK Research and Innovation"},{"id":"https://openalex.org/G8602921712","display_name":null,"funder_award_id":"EP/R026173","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"}],"funders":[{"id":"https://openalex.org/F4320314731","display_name":"UK Research and Innovation","ror":"https://ror.org/001aqnf71"},{"id":"https://openalex.org/F4320334245","display_name":"Offshore Robotics for Certification of Assets","ror":null},{"id":"https://openalex.org/F4320334627","display_name":"Engineering and Physical Sciences Research Council","ror":"https://ror.org/0439y7842"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":35,"referenced_works":["https://openalex.org/W202180931","https://openalex.org/W1746819321","https://openalex.org/W1862398452","https://openalex.org/W1984338812","https://openalex.org/W2120034667","https://openalex.org/W2151237105","https://openalex.org/W2168359464","https://openalex.org/W2221184070","https://openalex.org/W2427917354","https://openalex.org/W2540189295","https://openalex.org/W2594930926","https://openalex.org/W2606818146","https://openalex.org/W2758731390","https://openalex.org/W2788084076","https://openalex.org/W2883481555","https://openalex.org/W2917643801","https://openalex.org/W2951796861","https://openalex.org/W2963958573","https://openalex.org/W2964150011","https://openalex.org/W2971013032","https://openalex.org/W2982550324","https://openalex.org/W3104558707","https://openalex.org/W4211049957","https://openalex.org/W4230164823","https://openalex.org/W4288560619","https://openalex.org/W4297780563","https://openalex.org/W4301091646","https://openalex.org/W6638944184","https://openalex.org/W6677959772","https://openalex.org/W6682367392","https://openalex.org/W6689175234","https://openalex.org/W6717915398","https://openalex.org/W6759668376","https://openalex.org/W6767408606","https://openalex.org/W6845059051"],"related_works":["https://openalex.org/W2379651310","https://openalex.org/W2113019827","https://openalex.org/W1541249122","https://openalex.org/W2413828414","https://openalex.org/W2315999538","https://openalex.org/W2367222340","https://openalex.org/W187740018","https://openalex.org/W2162286586","https://openalex.org/W4255368532","https://openalex.org/W1964286703"],"abstract_inverted_index":{"When":[0],"exploring":[1,26,204],"an":[2,73,118,143,205],"unknown":[3,208],"environment,":[4],"a":[5,67,70,77,102,123,190,199,206],"mobile":[6],"robot":[7,41,58,71,203],"must":[8,15],"decide":[9],"where":[10,45,69],"to":[11,31,39,61,82,105,148,176],"observe":[12],"next.":[13],"It":[14],"do":[16],"this":[17,35,139],"whilst":[18],"minimising":[19],"the":[20,40,57,85,107,110,127,132,158,161,169,181,196],"risk":[21],"of":[22,87,109,171,198],"failure,":[23],"by":[24,173],"only":[25,95],"areas":[27],"that":[28,125],"it":[29],"expects":[30],"be":[32,96],"safe.":[33],"In":[34],"context,":[36],"safety":[37],"refers":[38],"remaining":[42],"in":[43,113],"regions":[44],"critical":[46],"environment":[47,74,91,111,133],"features":[48,92],"(e.g.":[49],"terrain":[50],"steepness,":[51],"radiation":[52,193],"levels)":[53],"are":[54],"within":[55],"ranges":[56],"is":[59],"able":[60],"tolerate.":[62],"More":[63],"specifically,":[64],"we":[65,141],"consider":[66],"setting":[68],"explores":[72],"modelled":[75],"with":[76,131],"Markov":[78,120],"decision":[79,121],"process,":[80,122],"subject":[81],"bounds":[83],"on":[84,138,189],"values":[86],"one":[88],"or":[89],"more":[90],"which":[93],"can":[94],"sensed":[97],"at":[98],"runtime.":[99],"We":[100,185],"use":[101],"Gaussian":[103,128,162],"process":[104,129,163],"predict":[106],"value":[108],"feature":[112],"unvisited":[114],"regions,":[115],"and":[116,154],"propose":[117,142],"estimated":[119],"model":[124,134],"integrates":[126],"predictions":[130],"transition":[135],"probabilities.":[136],"Building":[137],"model,":[140],"exploration":[144,172],"algorithm":[145],"that,":[146],"contrary":[147],"previous":[149],"approaches,":[150],"considers":[151],"probabilistic":[152],"transitions":[153],"explicitly":[155],"reasons":[156],"about":[157],"uncertainty":[159],"over":[160],"predictions.":[164],"Furthermore,":[165],"our":[166,187],"approach":[167,188],"increases":[168],"speed":[170],"selecting":[174],"locations":[175],"visit":[177],"further":[178],"away":[179],"from":[180],"currently":[182],"explored":[183],"area.":[184,209],"evaluate":[186],"real-world":[191],"gamma":[192],"dataset,":[194],"tackling":[195],"challenge":[197],"nuclear":[200],"material":[201],"inspection":[202],"priori":[207]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":1}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
