{"id":"https://openalex.org/W2948994298","doi":"https://doi.org/10.1109/devlrn.2019.8850713","title":"Autonomous Reinforcement Learning of Multiple Interrelated Tasks","display_name":"Autonomous Reinforcement Learning of Multiple Interrelated Tasks","publication_year":2019,"publication_date":"2019-08-01","ids":{"openalex":"https://openalex.org/W2948994298","doi":"https://doi.org/10.1109/devlrn.2019.8850713","mag":"2948994298"},"language":"en","primary_location":{"id":"doi:10.1109/devlrn.2019.8850713","is_oa":false,"landing_page_url":"https://doi.org/10.1109/devlrn.2019.8850713","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 Joint IEEE 9th International Conference on Development and Learning and Epigenetic Robotics (ICDL-EpiRob)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/1906.01374","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5012368267","display_name":"Vieri Giuliano Santucci","orcid":"https://orcid.org/0000-0002-8748-9632"},"institutions":[{"id":"https://openalex.org/I4210166865","display_name":"Institute of Cognitive Sciences and Technologies","ror":"https://ror.org/05w9g2j85","country_code":"IT","type":"facility","lineage":["https://openalex.org/I4210155236","https://openalex.org/I4210166865"]},{"id":"https://openalex.org/I4210155236","display_name":"National Research Council","ror":"https://ror.org/04zaypm56","country_code":"IT","type":"funder","lineage":["https://openalex.org/I4210155236"]}],"countries":["IT"],"is_corresponding":true,"raw_author_name":"Vieri Giuliano Santucci","raw_affiliation_strings":["Istituto di Scienze e Tecnologie della Cognizione (ISTC), Consiglio Nazionale delle Ricerche (CNR), Rome, Italy","National Research Council - Italy#TAB#"],"affiliations":[{"raw_affiliation_string":"Istituto di Scienze e Tecnologie della Cognizione (ISTC), Consiglio Nazionale delle Ricerche (CNR), Rome, Italy","institution_ids":["https://openalex.org/I4210166865","https://openalex.org/I4210155236"]},{"raw_affiliation_string":"National Research Council - Italy#TAB#","institution_ids":["https://openalex.org/I4210155236"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076711458","display_name":"Gianluca Baldassarre","orcid":"https://orcid.org/0000-0002-1277-4447"},"institutions":[{"id":"https://openalex.org/I4210155236","display_name":"National Research Council","ror":"https://ror.org/04zaypm56","country_code":"IT","type":"funder","lineage":["https://openalex.org/I4210155236"]},{"id":"https://openalex.org/I4210166865","display_name":"Institute of Cognitive Sciences and Technologies","ror":"https://ror.org/05w9g2j85","country_code":"IT","type":"facility","lineage":["https://openalex.org/I4210155236","https://openalex.org/I4210166865"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Gianluca Baldassarre","raw_affiliation_strings":["Istituto di Scienze e Tecnologie della Cognizione (ISTC), Consiglio Nazionale delle Ricerche (CNR), Rome, Italy","National Research Council - Italy#TAB#"],"affiliations":[{"raw_affiliation_string":"Istituto di Scienze e Tecnologie della Cognizione (ISTC), Consiglio Nazionale delle Ricerche (CNR), Rome, Italy","institution_ids":["https://openalex.org/I4210166865","https://openalex.org/I4210155236"]},{"raw_affiliation_string":"National Research Council - Italy#TAB#","institution_ids":["https://openalex.org/I4210155236"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5011429131","display_name":"Emilio Cartoni","orcid":"https://orcid.org/0000-0001-8026-5145"},"institutions":[{"id":"https://openalex.org/I4210166865","display_name":"Institute of Cognitive Sciences and Technologies","ror":"https://ror.org/05w9g2j85","country_code":"IT","type":"facility","lineage":["https://openalex.org/I4210155236","https://openalex.org/I4210166865"]},{"id":"https://openalex.org/I4210155236","display_name":"National Research Council","ror":"https://ror.org/04zaypm56","country_code":"IT","type":"funder","lineage":["https://openalex.org/I4210155236"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Emilio Cartoni","raw_affiliation_strings":["Istituto di Scienze e Tecnologie della Cognizione (ISTC), Consiglio Nazionale delle Ricerche (CNR), Rome, Italy","National Research Council - Italy#TAB#"],"affiliations":[{"raw_affiliation_string":"Istituto di Scienze e Tecnologie della Cognizione (ISTC), Consiglio Nazionale delle Ricerche (CNR), Rome, Italy","institution_ids":["https://openalex.org/I4210166865","https://openalex.org/I4210155236"]},{"raw_affiliation_string":"National Research Council - Italy#TAB#","institution_ids":["https://openalex.org/I4210155236"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5012368267"],"corresponding_institution_ids":["https://openalex.org/I4210155236","https://openalex.org/I4210166865"],"apc_list":null,"apc_paid":null,"fwci":0.289,"has_fulltext":true,"cited_by_count":4,"citation_normalized_percentile":{"value":0.65704499,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"221","last_page":"227"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9962000250816345,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12784","display_name":"Modular Robots and Swarm Intelligence","score":0.9916999936103821,"subfield":{"id":"https://openalex.org/subfields/2210","display_name":"Mechanical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7047408819198608},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6793920397758484},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6728882193565369},{"id":"https://openalex.org/keywords/robotics","display_name":"Robotics","score":0.6231865286827087},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5975642800331116},{"id":"https://openalex.org/keywords/robot-learning","display_name":"Robot learning","score":0.5337819457054138},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.5080907344818115},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.49303385615348816},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.46068599820137024},{"id":"https://openalex.org/keywords/competence","display_name":"Competence (human resources)","score":0.4378894567489624},{"id":"https://openalex.org/keywords/autonomous-agent","display_name":"Autonomous agent","score":0.4355964660644531},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.4279128313064575},{"id":"https://openalex.org/keywords/autonomous-learning","display_name":"Autonomous learning","score":0.4182230234146118},{"id":"https://openalex.org/keywords/mobile-robot","display_name":"Mobile robot","score":0.2128620445728302},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.12992313504219055},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.07176125049591064},{"id":"https://openalex.org/keywords/mathematics-education","display_name":"Mathematics education","score":0.06627500057220459},{"id":"https://openalex.org/keywords/systems-engineering","display_name":"Systems engineering","score":0.06588304042816162}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7047408819198608},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6793920397758484},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6728882193565369},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.6231865286827087},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5975642800331116},{"id":"https://openalex.org/C188888258","wikidata":"https://www.wikidata.org/wiki/Q7353390","display_name":"Robot learning","level":4,"score":0.5337819457054138},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.5080907344818115},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.49303385615348816},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.46068599820137024},{"id":"https://openalex.org/C100521375","wikidata":"https://www.wikidata.org/wiki/Q2015382","display_name":"Competence (human resources)","level":2,"score":0.4378894567489624},{"id":"https://openalex.org/C13687954","wikidata":"https://www.wikidata.org/wiki/Q4826847","display_name":"Autonomous agent","level":2,"score":0.4355964660644531},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.4279128313064575},{"id":"https://openalex.org/C2983271839","wikidata":"https://www.wikidata.org/wiki/Q29644074","display_name":"Autonomous learning","level":2,"score":0.4182230234146118},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.2128620445728302},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.12992313504219055},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.07176125049591064},{"id":"https://openalex.org/C145420912","wikidata":"https://www.wikidata.org/wiki/Q853077","display_name":"Mathematics education","level":1,"score":0.06627500057220459},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.06588304042816162},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":5,"locations":[{"id":"doi:10.1109/devlrn.2019.8850713","is_oa":false,"landing_page_url":"https://doi.org/10.1109/devlrn.2019.8850713","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 Joint IEEE 9th International Conference on Development and Learning and Epigenetic Robotics (ICDL-EpiRob)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:1906.01374","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1906.01374","pdf_url":"https://arxiv.org/pdf/1906.01374","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"mag:2948994298","is_oa":true,"landing_page_url":"https://arxiv.org/pdf/1906.01374v1","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},{"id":"doi:10.48550/arxiv.1906.01374","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.1906.01374","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"},{"id":"doi:10.57702/hhpuzat1","is_oa":true,"landing_page_url":"https://doi.org/10.57702/hhpuzat1","pdf_url":null,"source":{"id":"https://openalex.org/S7407053387","display_name":"TIB Data Manager","issn_l":null,"issn":[],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"dataset"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:1906.01374","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1906.01374","pdf_url":"https://arxiv.org/pdf/1906.01374","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G5880680131","display_name":null,"funder_award_id":"713010","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"},{"id":"https://openalex.org/G8051717526","display_name":null,"funder_award_id":"Grant","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"},{"id":"https://openalex.org/G8318064016","display_name":null,"funder_award_id":"Horizon","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"}],"funders":[{"id":"https://openalex.org/F4320320300","display_name":"European Commission","ror":"https://ror.org/00k4n6c32"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2948994298.pdf","grobid_xml":"https://content.openalex.org/works/W2948994298.grobid-xml"},"referenced_works_count":46,"referenced_works":["https://openalex.org/W355724390","https://openalex.org/W1578521162","https://openalex.org/W1592847719","https://openalex.org/W1952489873","https://openalex.org/W1975744985","https://openalex.org/W2004303440","https://openalex.org/W2007813200","https://openalex.org/W2022163520","https://openalex.org/W2034806191","https://openalex.org/W2036930518","https://openalex.org/W2101524054","https://openalex.org/W2110525007","https://openalex.org/W2113501460","https://openalex.org/W2121863487","https://openalex.org/W2122480991","https://openalex.org/W2220413658","https://openalex.org/W2313007200","https://openalex.org/W2334036380","https://openalex.org/W2401657790","https://openalex.org/W2540177913","https://openalex.org/W2562000796","https://openalex.org/W2734477678","https://openalex.org/W2744921630","https://openalex.org/W2750611126","https://openalex.org/W2768837692","https://openalex.org/W2787066086","https://openalex.org/W2787257245","https://openalex.org/W2788489172","https://openalex.org/W2795520063","https://openalex.org/W2802613770","https://openalex.org/W2804392443","https://openalex.org/W2897673281","https://openalex.org/W2912646464","https://openalex.org/W2963099939","https://openalex.org/W2963262099","https://openalex.org/W2963293881","https://openalex.org/W4214717370","https://openalex.org/W6634579893","https://openalex.org/W6703271639","https://openalex.org/W6728924199","https://openalex.org/W6737937804","https://openalex.org/W6743822824","https://openalex.org/W6748186125","https://openalex.org/W6750013982","https://openalex.org/W7020075990","https://openalex.org/W7026642341"],"related_works":["https://openalex.org/W2979165213","https://openalex.org/W2944701639","https://openalex.org/W3110170303","https://openalex.org/W2591592925","https://openalex.org/W3209494879","https://openalex.org/W3166801429","https://openalex.org/W2123412355","https://openalex.org/W3116833835","https://openalex.org/W2470629089","https://openalex.org/W1975865536","https://openalex.org/W2990208804","https://openalex.org/W1832605823","https://openalex.org/W3110720663","https://openalex.org/W2312863950","https://openalex.org/W2583372322","https://openalex.org/W2314200514","https://openalex.org/W3135612216","https://openalex.org/W3090775013","https://openalex.org/W2980712743","https://openalex.org/W3125778298"],"abstract_inverted_index":{"Autonomous":[0],"multiple":[1,118],"tasks":[2,22,120],"learning":[3,46,73],"is":[4,79,128],"a":[5,30],"fundamental":[6],"capability":[7],"to":[8,33,36,41,58,130],"develop":[9],"versatile":[10],"artificial":[11],"agents":[12],"that":[13,29],"can":[14,104],"act":[15],"in":[16,56,65,74,88,96,114],"complex":[17],"environments.":[18],"In":[19],"real-world":[20],"scenarios,":[21],"may":[23],"be":[24,105],"interrelated":[25,63,119],"(or":[26],"\u201chierarchical\u201d)":[27],"so":[28],"robot":[31],"has":[32],"first":[34],"learn":[35],"achieve":[37],"some":[38],"of":[39,62,77,91,111],"them":[40],"set":[42],"the":[43,60,68,89,109,117,126,136],"preconditions":[44],"for":[45],"other":[47],"ones.":[48],"Even":[49],"though":[50],"different":[51],"strategies":[52],"have":[53],"been":[54],"used":[55],"robotics":[57,70],"tackle":[59],"acquisition":[61],"tasks,":[64],"particular":[66,115],"within":[67],"developmental":[69],"framework,":[71],"autonomous":[72],"this":[75,97,102],"kind":[76],"scenarios":[78],"still":[80],"an":[81,123],"open":[82],"question.":[83],"Building":[84],"on":[85,108],"previous":[86],"research":[87],"framework":[90],"intrinsically":[92],"motivated":[93],"open-ended":[94],"learning,":[95],"work":[98],"we":[99],"describe":[100],"how":[101],"question":[103],"addressed":[106],"working":[107],"level":[110],"task":[112],"selection,":[113],"considering":[116],"scenario":[121],"as":[122],"MDP":[124],"where":[125],"system":[127],"trying":[129],"maximise":[131],"its":[132],"competence":[133],"over":[134],"all":[135],"tasks.":[137]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":1}],"updated_date":"2026-04-13T07:58:08.660418","created_date":"2025-10-10T00:00:00"}
