{"id":"https://openalex.org/W6924371658","doi":"https://doi.org/10.15168/11572_375447","title":"Evolutionary Optimization of Decision Trees for Interpretable Reinforcement Learning","display_name":"Evolutionary Optimization of Decision Trees for Interpretable Reinforcement Learning","publication_year":2023,"publication_date":"2023-04-27","ids":{"openalex":"https://openalex.org/W6924371658","doi":"https://doi.org/10.15168/11572_375447"},"language":"en","primary_location":{"id":"pmh:oai:iris.unitn.it:11572/375447","is_oa":true,"landing_page_url":"https://hdl.handle.net/11572/375447","pdf_url":null,"source":{"id":"https://openalex.org/S4306401913","display_name":"Institutional Research Information System (Universit\u00e0 degli Studi di Trento)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I193223587","host_organization_name":"University of Trento","host_organization_lineage":["https://openalex.org/I193223587"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/doctoralThesis"},"type":"other","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://hdl.handle.net/11572/375447","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Custode, Leonardo Lucio","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Custode, Leonardo Lucio","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":true,"primary_topic":null,"topics":[],"keywords":[{"id":"https://openalex.org/keywords/decision-tree","display_name":"Decision tree","score":0.5123000144958496},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.45890000462532043},{"id":"https://openalex.org/keywords/evolutionary-algorithm","display_name":"Evolutionary algorithm","score":0.32910001277923584},{"id":"https://openalex.org/keywords/stability","display_name":"Stability (learning theory)","score":0.30809998512268066},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.2935999929904938},{"id":"https://openalex.org/keywords/genetic-programming","display_name":"Genetic programming","score":0.28060001134872437}],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6349999904632568},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5263000130653381},{"id":"https://openalex.org/C84525736","wikidata":"https://www.wikidata.org/wiki/Q831366","display_name":"Decision tree","level":2,"score":0.5123000144958496},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.48339998722076416},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.45890000462532043},{"id":"https://openalex.org/C159149176","wikidata":"https://www.wikidata.org/wiki/Q14489129","display_name":"Evolutionary algorithm","level":2,"score":0.32910001277923584},{"id":"https://openalex.org/C112972136","wikidata":"https://www.wikidata.org/wiki/Q7595718","display_name":"Stability (learning theory)","level":2,"score":0.30809998512268066},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.2935999929904938},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2872999906539917},{"id":"https://openalex.org/C110332635","wikidata":"https://www.wikidata.org/wiki/Q629498","display_name":"Genetic programming","level":2,"score":0.28060001134872437},{"id":"https://openalex.org/C113174947","wikidata":"https://www.wikidata.org/wiki/Q2859736","display_name":"Tree (set theory)","level":2,"score":0.27570000290870667},{"id":"https://openalex.org/C105902424","wikidata":"https://www.wikidata.org/wiki/Q1197129","display_name":"Evolutionary computation","level":2,"score":0.2687000036239624},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.25529998540878296},{"id":"https://openalex.org/C5481197","wikidata":"https://www.wikidata.org/wiki/Q16766476","display_name":"Decision tree learning","level":3,"score":0.25519999861717224}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:iris.unitn.it:11572/375447","is_oa":true,"landing_page_url":"https://hdl.handle.net/11572/375447","pdf_url":null,"source":{"id":"https://openalex.org/S4306401913","display_name":"Institutional Research Information System (Universit\u00e0 degli Studi di Trento)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I193223587","host_organization_name":"University of Trento","host_organization_lineage":["https://openalex.org/I193223587"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/doctoralThesis"},{"id":"doi:10.15168/11572_375447","is_oa":true,"landing_page_url":"https://doi.org/10.15168/11572_375447","pdf_url":null,"source":{"id":"https://openalex.org/S7407051007","display_name":"Universit\u00e0 degli Studi di Trento","issn_l":null,"issn":[],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:iris.unitn.it:11572/375447","is_oa":true,"landing_page_url":"https://hdl.handle.net/11572/375447","pdf_url":null,"source":{"id":"https://openalex.org/S4306401913","display_name":"Institutional Research Information System (Universit\u00e0 degli Studi di Trento)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I193223587","host_organization_name":"University of Trento","host_organization_lineage":["https://openalex.org/I193223587"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/doctoralThesis"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"While":[0],"Artificial":[1],"Intelligence":[2],"(AI)":[3],"is":[4,9,40,80],"making":[5],"giant":[6],"steps,":[7],"it":[8],"also":[10],"raising":[11],"concerns":[12],"about":[13],"its":[14],"trustworthiness,":[15],"due":[16],"to":[17,34,41,72,133,140,165],"the":[18,32,92,137,158,170,179,183],"fact":[19],"that":[20,48,152],"widely-used":[21],"black-box":[22,77],"models":[23,47,61],"cannot":[24],"be":[25,50,73],"exactly":[26],"understood":[27,52],"by":[28,53,122,176],"humans.":[29],"One":[30],"of":[31,94,136,173,182],"ways":[33],"improve":[35],"humans\u2019":[36],"trust":[37],"towards":[38],"AI":[39,44,60,175],"use":[42],"interpretable":[43,59,100],"models,":[45],"i.e.,":[46],"can":[49],"thoroughly":[51],"humans,":[54],"and":[55],"thus":[56],"trusted.":[57],"However,":[58],"are":[62,70,155],"not":[63],"typically":[64],"used":[65],"in":[66,83,144],"practice,":[67],"as":[68],"they":[69],"thought":[71],"less":[74],"performing":[75,95],"than":[76],"models.":[78,101],"This":[79],"more":[81],"evident":[82],"Reinforce-":[84,96],"ment":[85,97],"Learning,":[86],"where":[87],"relatively":[88],"little":[89],"work":[90],"addresses":[91],"problem":[93],"Learning":[98,125,146],"with":[99,126,157],"In":[102],"this":[103,107,116],"thesis,":[104],"we":[105,118,168],"address":[106],"gap,":[108],"proposing":[109],"methods":[110],"for":[111],"Interpretable":[112,174],"Reinforcement":[113,124,145],"Learning.":[114],"For":[115],"purpose,":[117],"optimize":[119],"Decision":[120,142],"Trees":[121,143],"combining":[123],"Evolutionary":[127],"Computation":[128],"techniques,":[129],"which":[130],"allows":[131],"us":[132],"overcome":[134],"some":[135],"challenges":[138],"tied":[139],"optimizing":[141],"scenarios.":[147],"The":[148],"experimental":[149],"results":[150],"show":[151,169],"these":[153],"approaches":[154],"competitive":[156],"state-of-the-art":[159],"score":[160],"while":[161],"being":[162],"extremely":[163],"easier":[164],"interpret.":[166],"Finally,":[167],"practical":[171],"importance":[172],"digging":[177],"into":[178],"inner":[180],"working":[181],"solutions":[184],"obtained.":[185]},"counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2026-03-10T16:38:18.471706","created_date":"2025-10-10T00:00:00"}