{"id":"https://openalex.org/W2021865944","doi":"https://doi.org/10.7148/2014-0352","title":"Reusable Reinforcement Learning for Modular Self Motivated Agents","display_name":"Reusable Reinforcement Learning for Modular Self Motivated Agents","publication_year":2014,"publication_date":"2014-05-27","ids":{"openalex":"https://openalex.org/W2021865944","doi":"https://doi.org/10.7148/2014-0352","mag":"2021865944"},"language":"en","primary_location":{"id":"doi:10.7148/2014-0352","is_oa":false,"landing_page_url":"https://doi.org/10.7148/2014-0352","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ECMS 2014 Proceedings edited by: Flaminio Squazzoni, Fabio Baronio, Claudia Archetti, Marco Castellani","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5053986921","display_name":"Jaroslav V\u00edtk\u016f","orcid":"https://orcid.org/0000-0002-8928-4104"},"institutions":[{"id":"https://openalex.org/I44504214","display_name":"Czech Technical University in Prague","ror":"https://ror.org/03kqpb082","country_code":"CZ","type":"education","lineage":["https://openalex.org/I44504214"]}],"countries":["CZ"],"is_corresponding":true,"raw_author_name":"Jaroslav Vitku","raw_affiliation_strings":["Czech Technical Univ. in Prague"],"affiliations":[{"raw_affiliation_string":"Czech Technical Univ. in Prague","institution_ids":["https://openalex.org/I44504214"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5058831673","display_name":"Pavel Nahodil","orcid":null},"institutions":[{"id":"https://openalex.org/I44504214","display_name":"Czech Technical University in Prague","ror":"https://ror.org/03kqpb082","country_code":"CZ","type":"education","lineage":["https://openalex.org/I44504214"]}],"countries":["CZ"],"is_corresponding":false,"raw_author_name":"Pavel Nahodil","raw_affiliation_strings":["Czech Technical Univ. in Prague"],"affiliations":[{"raw_affiliation_string":"Czech Technical Univ. in Prague","institution_ids":["https://openalex.org/I44504214"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5053986921"],"corresponding_institution_ids":["https://openalex.org/I44504214"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.07145459,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"352","last_page":"358"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9894999861717224,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9894999861717224,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11975","display_name":"Evolutionary Algorithms and Applications","score":0.9850999712944031,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.968500018119812,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8678276538848877},{"id":"https://openalex.org/keywords/modular-design","display_name":"Modular design","score":0.8086612224578857},{"id":"https://openalex.org/keywords/modularity","display_name":"Modularity (biology)","score":0.773064136505127},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.771715521812439},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5434198379516602},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.4979732036590576},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.47720298171043396},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.37958231568336487},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.33674734830856323},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.17757800221443176}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8678276538848877},{"id":"https://openalex.org/C101468663","wikidata":"https://www.wikidata.org/wiki/Q1620158","display_name":"Modular design","level":2,"score":0.8086612224578857},{"id":"https://openalex.org/C2779478453","wikidata":"https://www.wikidata.org/wiki/Q6889748","display_name":"Modularity (biology)","level":2,"score":0.773064136505127},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.771715521812439},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5434198379516602},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.4979732036590576},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.47720298171043396},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.37958231568336487},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.33674734830856323},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.17757800221443176},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.7148/2014-0352","is_oa":false,"landing_page_url":"https://doi.org/10.7148/2014-0352","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ECMS 2014 Proceedings edited by: Flaminio Squazzoni, Fabio Baronio, Claudia Archetti, Marco Castellani","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":11,"referenced_works":["https://openalex.org/W101771737","https://openalex.org/W639309485","https://openalex.org/W1502872058","https://openalex.org/W1986871538","https://openalex.org/W1999925021","https://openalex.org/W2045257906","https://openalex.org/W2117502083","https://openalex.org/W2141458086","https://openalex.org/W2164653071","https://openalex.org/W2170942403","https://openalex.org/W2901136733"],"related_works":["https://openalex.org/W2297768894","https://openalex.org/W2378076731","https://openalex.org/W3109014690","https://openalex.org/W2122405502","https://openalex.org/W2114254072","https://openalex.org/W2127721729","https://openalex.org/W2884798239","https://openalex.org/W1531253727","https://openalex.org/W2366669483","https://openalex.org/W2333635112"],"abstract_inverted_index":{"Presented":[0],"topic":[1],"is":[2,18,31,89,108,121],"from":[3],"the":[4,83,97],"research":[5],"fields":[6],"called":[7],"Artificial":[8,11],"Life":[9],"and":[10,39,117],"Intelligence":[12],"(AI).":[13],"In":[14],"this":[15],"paper,":[16],"there":[17],"presented":[19],"novel":[20,84],"approach":[21,30],"to":[22],"designing":[23],"agent":[24,40,106],"architectures":[25,41,88,107],"with":[26,92],"its":[27],"requirements.":[28],"The":[29,71],"inspired":[32],"by":[33],"inherited":[34],"modularity":[35],"of":[36,47,60,99,105,113],"biological":[37],"brains":[38],"are":[42,73],"represented":[43],"here":[44],"as":[45],"set":[46],"given":[48],"reusable":[49,102],"modules":[50,63,72],"connected":[51],"into":[52],"a":[53,93],"particular":[54,62],"topology.":[55],"This":[56],"paper":[57],"presents":[58],"design":[59,98],"two":[61,100],"for":[64,75,86],"future":[65,119],"use":[66,120],"in":[67],"more":[68],"complex":[69],"architectures.":[70],"used":[74,94],"implementing":[76],"model-free":[77],"motivation-driven":[78],"Reinforcement":[79],"Learning":[80],"(RL).":[81],"First,":[82],"framework":[85],"these":[87,114],"described":[90],"together":[91],"simulator.":[95],"Then,":[96],"new":[101,115],"domain-independent":[103],"components":[104,116],"described.":[109],"Finally,":[110],"experimental":[111],"validation":[112],"their":[118],"mentioned.":[122]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
