{"id":"https://openalex.org/W4389157012","doi":"https://doi.org/10.48550/arxiv.2311.16838","title":"Increasing Transparency of Reinforcement Learning using Shielding for Human Preferences and Explanations","display_name":"Increasing Transparency of Reinforcement Learning using Shielding for Human Preferences and Explanations","publication_year":2023,"publication_date":"2023-11-28","ids":{"openalex":"https://openalex.org/W4389157012","doi":"https://doi.org/10.48550/arxiv.2311.16838"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2311.16838","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2311.16838","pdf_url":"https://arxiv.org/pdf/2311.16838","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2311.16838","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5022428889","display_name":"Georgios Angelopoulos","orcid":"https://orcid.org/0000-0001-9866-8719"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Angelopoulos, Georgios","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067221718","display_name":"Luigi Mangiacapra","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mangiacapra, Luigi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031968626","display_name":"Alessandra Rossi","orcid":"https://orcid.org/0000-0003-1362-8799"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rossi, Alessandra","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079088287","display_name":"Claudia Di Napoli","orcid":"https://orcid.org/0000-0002-8626-5805"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Di Napoli, Claudia","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5046630253","display_name":"Silvia Rossi","orcid":"https://orcid.org/0000-0002-3379-1756"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rossi, Silvia","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5022428889"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.965499997138977,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.965499997138977,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9200000166893005,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10883","display_name":"Ethics and Social Impacts of AI","score":0.9197999835014343,"subfield":{"id":"https://openalex.org/subfields/3311","display_name":"Safety Research"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/transparency","display_name":"Transparency (behavior)","score":0.8860176801681519},{"id":"https://openalex.org/keywords/legibility","display_name":"Legibility","score":0.7715516090393066},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7291818261146545},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.6887438297271729},{"id":"https://openalex.org/keywords/adaptability","display_name":"Adaptability","score":0.5963389873504639},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5641103982925415},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.5339803695678711},{"id":"https://openalex.org/keywords/human\u2013robot-interaction","display_name":"Human\u2013robot interaction","score":0.5330592393875122},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5122115015983582},{"id":"https://openalex.org/keywords/robot-learning","display_name":"Robot learning","score":0.48443010449409485},{"id":"https://openalex.org/keywords/human-in-the-loop","display_name":"Human-in-the-loop","score":0.4194953739643097},{"id":"https://openalex.org/keywords/risk-analysis","display_name":"Risk analysis (engineering)","score":0.34292322397232056},{"id":"https://openalex.org/keywords/mobile-robot","display_name":"Mobile robot","score":0.20976626873016357},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.1639658510684967},{"id":"https://openalex.org/keywords/business","display_name":"Business","score":0.12259477376937866},{"id":"https://openalex.org/keywords/economics","display_name":"Economics","score":0.08440268039703369}],"concepts":[{"id":"https://openalex.org/C2780233690","wikidata":"https://www.wikidata.org/wiki/Q535347","display_name":"Transparency (behavior)","level":2,"score":0.8860176801681519},{"id":"https://openalex.org/C2779332521","wikidata":"https://www.wikidata.org/wiki/Q1820694","display_name":"Legibility","level":2,"score":0.7715516090393066},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7291818261146545},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.6887438297271729},{"id":"https://openalex.org/C177606310","wikidata":"https://www.wikidata.org/wiki/Q5674297","display_name":"Adaptability","level":2,"score":0.5963389873504639},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5641103982925415},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.5339803695678711},{"id":"https://openalex.org/C145460709","wikidata":"https://www.wikidata.org/wiki/Q859951","display_name":"Human\u2013robot interaction","level":3,"score":0.5330592393875122},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5122115015983582},{"id":"https://openalex.org/C188888258","wikidata":"https://www.wikidata.org/wiki/Q7353390","display_name":"Robot learning","level":4,"score":0.48443010449409485},{"id":"https://openalex.org/C2780626000","wikidata":"https://www.wikidata.org/wiki/Q5936775","display_name":"Human-in-the-loop","level":2,"score":0.4194953739643097},{"id":"https://openalex.org/C112930515","wikidata":"https://www.wikidata.org/wiki/Q4389547","display_name":"Risk analysis (engineering)","level":1,"score":0.34292322397232056},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.20976626873016357},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.1639658510684967},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.12259477376937866},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.08440268039703369},{"id":"https://openalex.org/C112698675","wikidata":"https://www.wikidata.org/wiki/Q37038","display_name":"Advertising","level":1,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2311.16838","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2311.16838","pdf_url":"https://arxiv.org/pdf/2311.16838","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2311.16838","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2311.16838","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2311.16838","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2311.16838","pdf_url":"https://arxiv.org/pdf/2311.16838","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[{"score":0.8199999928474426,"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4389157012.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W565076200","https://openalex.org/W2473574490","https://openalex.org/W2406065423","https://openalex.org/W1989753795","https://openalex.org/W3133699834","https://openalex.org/W4388430323","https://openalex.org/W4377866454","https://openalex.org/W2113355126","https://openalex.org/W2542622692","https://openalex.org/W3113143399"],"abstract_inverted_index":{"The":[0],"adoption":[1],"of":[2,22,90,133,191,199],"Reinforcement":[3],"Learning":[4],"(RL)":[5],"in":[6,77,102,131,138,179,185,212],"several":[7],"human-centred":[8],"applications":[9,209],"provides":[10],"robots":[11,59],"with":[12,151,161,210],"autonomous":[13],"decision-making":[14],"capabilities":[15],"and":[16,38,46,110,136,157,189,203],"adaptability":[17],"based":[18],"on":[19],"the":[20,23,30,66,80,82,88,103,113,128,164,167,186,192,197,213],"observations":[21],"operating":[24],"environment.":[25],"In":[26,68],"such":[27],"scenarios,":[28],"however,":[29],"learning":[31,114,148,202],"process":[32],"can":[33],"make":[34],"robots'":[35],"behaviours":[36],"unclear":[37,64],"unpredictable":[39],"to":[40,57,65,106,111,126,153,182],"humans,":[41],"thus":[42],"preventing":[43],"a":[44,52,91,97,120,205],"smooth":[45],"effective":[47],"Human-Robot":[48],"Interaction":[49],"(HRI).":[50],"As":[51],"consequence,":[53],"it":[54],"becomes":[55],"crucial":[56],"avoid":[58],"performing":[60],"actions":[61,81],"that":[62,143,176],"are":[63],"user.":[67],"this":[69,95],"work,":[70],"we":[71],"investigate":[72],"whether":[73],"including":[74],"human":[75,108,145,159,211],"preferences":[76,109,146,160],"RL":[78,104],"(concerning":[79],"robot":[83],"performs":[84],"during":[85,147,201],"learning)":[86],"improves":[87,149],"transparency":[89,130,180,200],"robot's":[92,129,168],"behaviours.":[93],"For":[94],"purpose,":[96],"shielding":[98],"mechanism":[99],"is":[100],"included":[101],"algorithm":[105],"include":[107],"monitor":[112],"agent's":[115],"decisions.":[116],"We":[117],"carried":[118],"out":[119],"within-subjects":[121],"study":[122],"involving":[123],"26":[124],"participants":[125],"evaluate":[127],"terms":[132],"Legibility,":[134],"Predictability,":[135],"Expectability":[137],"different":[139],"settings.":[140],"Results":[141,173],"indicate":[142],"considering":[144],"Legibility":[150],"respect":[152],"providing":[154],"only":[155],"Explanations,":[156],"combining":[158],"explanations":[162],"elucidating":[163],"rationale":[165],"behind":[166],"decisions":[169],"further":[170],"amplifies":[171],"transparency.":[172],"also":[174],"confirm":[175],"an":[177,183],"increase":[178,184],"leads":[181],"safety,":[187],"comfort,":[188],"reliability":[190],"robot.":[193],"These":[194],"findings":[195],"show":[196],"importance":[198],"suggest":[204],"paradigm":[206],"for":[207],"robotic":[208],"loop.":[214]},"counts_by_year":[],"updated_date":"2026-02-09T09:26:11.010843","created_date":"2023-11-30T00:00:00"}
