{"id":"https://openalex.org/W4408439373","doi":"https://doi.org/10.1016/j.engappai.2025.110520","title":"What is behind the curtain? Increasing transparency in reinforcement learning with human preferences and explanations","display_name":"What is behind the curtain? Increasing transparency in reinforcement learning with human preferences and explanations","publication_year":2025,"publication_date":"2025-03-14","ids":{"openalex":"https://openalex.org/W4408439373","doi":"https://doi.org/10.1016/j.engappai.2025.110520"},"language":"en","primary_location":{"id":"doi:10.1016/j.engappai.2025.110520","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.engappai.2025.110520","pdf_url":null,"source":{"id":"https://openalex.org/S900972176","display_name":"Engineering Applications of Artificial Intelligence","issn_l":"0952-1976","issn":["0952-1976","1873-6769"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Engineering Applications of Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://doi.org/10.1016/j.engappai.2025.110520","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5022428889","display_name":"Georgios Angelopoulos","orcid":"https://orcid.org/0000-0001-9866-8719"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Georgios Angelopoulos","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067221718","display_name":"Luigi Mangiacapra","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Luigi Mangiacapra","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031968626","display_name":"Alessandra Rossi","orcid":"https://orcid.org/0000-0003-1362-8799"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Alessandra Rossi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079088287","display_name":"Claudia Di Napoli","orcid":"https://orcid.org/0000-0002-8626-5805"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Claudia Di Napoli","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5046630253","display_name":"Silvia Rossi","orcid":"https://orcid.org/0000-0002-3379-1756"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Silvia Rossi","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5022428889"],"corresponding_institution_ids":[],"apc_list":{"value":3170,"currency":"USD","value_usd":3170},"apc_paid":{"value":3170,"currency":"USD","value_usd":3170},"fwci":2.8599,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.89896931,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"149","issue":null,"first_page":"110520","last_page":"110520"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10042","display_name":"Neural and Behavioral Psychology Studies","score":0.930899977684021,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.9203000068664551,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8723165988922119},{"id":"https://openalex.org/keywords/transparency","display_name":"Transparency (behavior)","score":0.7398947477340698},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7233537435531616},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.48893919587135315},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3529456555843353},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.22821980714797974}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8723165988922119},{"id":"https://openalex.org/C2780233690","wikidata":"https://www.wikidata.org/wiki/Q535347","display_name":"Transparency (behavior)","level":2,"score":0.7398947477340698},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7233537435531616},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.48893919587135315},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3529456555843353},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.22821980714797974}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1016/j.engappai.2025.110520","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.engappai.2025.110520","pdf_url":null,"source":{"id":"https://openalex.org/S900972176","display_name":"Engineering Applications of Artificial Intelligence","issn_l":"0952-1976","issn":["0952-1976","1873-6769"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Engineering Applications of Artificial Intelligence","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1016/j.engappai.2025.110520","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.engappai.2025.110520","pdf_url":null,"source":{"id":"https://openalex.org/S900972176","display_name":"Engineering Applications of Artificial Intelligence","issn_l":"0952-1976","issn":["0952-1976","1873-6769"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Engineering Applications of Artificial Intelligence","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":61,"referenced_works":["https://openalex.org/W1967441381","https://openalex.org/W2054908983","https://openalex.org/W2515293759","https://openalex.org/W2574287525","https://openalex.org/W2608389450","https://openalex.org/W2746969613","https://openalex.org/W2803451925","https://openalex.org/W2898227854","https://openalex.org/W2902263534","https://openalex.org/W2952799618","https://openalex.org/W2963575966","https://openalex.org/W2968357651","https://openalex.org/W2978550519","https://openalex.org/W2995473109","https://openalex.org/W3026623972","https://openalex.org/W3037826640","https://openalex.org/W3095030303","https://openalex.org/W3119077469","https://openalex.org/W3121647461","https://openalex.org/W3128013500","https://openalex.org/W3152787394","https://openalex.org/W3164011142","https://openalex.org/W3181692234","https://openalex.org/W3188815642","https://openalex.org/W3208134787","https://openalex.org/W3213330367","https://openalex.org/W4210718321","https://openalex.org/W4220654348","https://openalex.org/W4245423772","https://openalex.org/W4285194984","https://openalex.org/W4294147137","https://openalex.org/W4307593158","https://openalex.org/W4310429478","https://openalex.org/W4312747053","https://openalex.org/W4319162364","https://openalex.org/W4321780050","https://openalex.org/W4322503739","https://openalex.org/W4323870299","https://openalex.org/W4388666651","https://openalex.org/W4392634027","https://openalex.org/W4403225923","https://openalex.org/W6644367652","https://openalex.org/W6680185541","https://openalex.org/W6731773099","https://openalex.org/W6743368274","https://openalex.org/W6774623367","https://openalex.org/W6784533164","https://openalex.org/W6786122292","https://openalex.org/W6803459319","https://openalex.org/W6803686803","https://openalex.org/W6805162643","https://openalex.org/W6809337039","https://openalex.org/W6846317009","https://openalex.org/W6848290183","https://openalex.org/W6850102032","https://openalex.org/W6857161875","https://openalex.org/W6858555477","https://openalex.org/W6858710369","https://openalex.org/W6858783343","https://openalex.org/W6873522973","https://openalex.org/W6892495207"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W3081288631","https://openalex.org/W3152382318","https://openalex.org/W3004686567","https://openalex.org/W2738656338","https://openalex.org/W2603787370","https://openalex.org/W2555400967","https://openalex.org/W3214759741"],"abstract_inverted_index":null,"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-12-19T19:40:27.379048","created_date":"2025-10-10T00:00:00"}
