{"id":"https://openalex.org/W2164424353","doi":"https://doi.org/10.1109/tamd.2010.2051031","title":"Intrinsically Motivated Reinforcement Learning: An Evolutionary Perspective","display_name":"Intrinsically Motivated Reinforcement Learning: An Evolutionary Perspective","publication_year":2010,"publication_date":"2010-05-28","ids":{"openalex":"https://openalex.org/W2164424353","doi":"https://doi.org/10.1109/tamd.2010.2051031","mag":"2164424353"},"language":"en","primary_location":{"id":"doi:10.1109/tamd.2010.2051031","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tamd.2010.2051031","pdf_url":null,"source":{"id":"https://openalex.org/S108448409","display_name":"IEEE Transactions on Autonomous Mental Development","issn_l":"1943-0604","issn":["1943-0604","1943-0612"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Autonomous Mental Development","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5065366930","display_name":"Satinder Singh","orcid":"https://orcid.org/0000-0002-2736-7641"},"institutions":[{"id":"https://openalex.org/I27837315","display_name":"University of Michigan\u2013Ann Arbor","ror":"https://ror.org/00jmfr291","country_code":"US","type":"education","lineage":["https://openalex.org/I27837315"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Satinder Singh","raw_affiliation_strings":["Division of Computer Science and Engineering, University of Michigan, Ann Arbor, MI, USA"],"affiliations":[{"raw_affiliation_string":"Division of Computer Science and Engineering, University of Michigan, Ann Arbor, MI, USA","institution_ids":["https://openalex.org/I27837315"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077109450","display_name":"Richard L. Lewis","orcid":"https://orcid.org/0000-0001-6403-489X"},"institutions":[{"id":"https://openalex.org/I27837315","display_name":"University of Michigan\u2013Ann Arbor","ror":"https://ror.org/00jmfr291","country_code":"US","type":"education","lineage":["https://openalex.org/I27837315"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Richard L. Lewis","raw_affiliation_strings":["Division of Computer Science and Engineering, University of Michigan, Ann Arbor, MI, USA"],"affiliations":[{"raw_affiliation_string":"Division of Computer Science and Engineering, University of Michigan, Ann Arbor, MI, USA","institution_ids":["https://openalex.org/I27837315"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089808068","display_name":"Andrew G. Barto","orcid":null},"institutions":[{"id":"https://openalex.org/I24603500","display_name":"University of Massachusetts Amherst","ror":"https://ror.org/0072zz521","country_code":"US","type":"education","lineage":["https://openalex.org/I24603500"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Andrew G. Barto","raw_affiliation_strings":["Division of Computer Science and Engineering, University of Massachusetts, Amherst, MA, USA"],"affiliations":[{"raw_affiliation_string":"Division of Computer Science and Engineering, University of Massachusetts, Amherst, MA, USA","institution_ids":["https://openalex.org/I24603500"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5039371251","display_name":"Jonathan Sorg","orcid":null},"institutions":[{"id":"https://openalex.org/I27837315","display_name":"University of Michigan\u2013Ann Arbor","ror":"https://ror.org/00jmfr291","country_code":"US","type":"education","lineage":["https://openalex.org/I27837315"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jonathan Sorg","raw_affiliation_strings":["Division of Computer Science and Engineering, University of Michigan, Ann Arbor, MI, USA"],"affiliations":[{"raw_affiliation_string":"Division of Computer Science and Engineering, University of Michigan, Ann Arbor, MI, USA","institution_ids":["https://openalex.org/I27837315"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5065366930"],"corresponding_institution_ids":["https://openalex.org/I27837315"],"apc_list":null,"apc_paid":null,"fwci":31.2518,"has_fulltext":false,"cited_by_count":410,"citation_normalized_percentile":{"value":0.99737952,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":"2","issue":"2","first_page":"70","last_page":"82"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11975","display_name":"Evolutionary Algorithms and Applications","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10581","display_name":"Neural dynamics and brain function","score":0.992900013923645,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8207132816314697},{"id":"https://openalex.org/keywords/perspective","display_name":"Perspective (graphical)","score":0.7132381200790405},{"id":"https://openalex.org/keywords/intrinsic-motivation","display_name":"Intrinsic motivation","score":0.6235812902450562},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5215601921081543},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5015859603881836},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.47828444838523865},{"id":"https://openalex.org/keywords/evolutionary-robotics","display_name":"Evolutionary robotics","score":0.46652042865753174},{"id":"https://openalex.org/keywords/evolutionary-dynamics","display_name":"Evolutionary dynamics","score":0.4143507480621338},{"id":"https://openalex.org/keywords/evolutionary-algorithm","display_name":"Evolutionary algorithm","score":0.3826788663864136},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.33844220638275146},{"id":"https://openalex.org/keywords/social-psychology","display_name":"Social psychology","score":0.16251340508460999}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8207132816314697},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.7132381200790405},{"id":"https://openalex.org/C2985564149","wikidata":"https://www.wikidata.org/wiki/Q644302","display_name":"Intrinsic motivation","level":2,"score":0.6235812902450562},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5215601921081543},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5015859603881836},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.47828444838523865},{"id":"https://openalex.org/C199505168","wikidata":"https://www.wikidata.org/wiki/Q3267529","display_name":"Evolutionary robotics","level":3,"score":0.46652042865753174},{"id":"https://openalex.org/C171578705","wikidata":"https://www.wikidata.org/wiki/Q5418700","display_name":"Evolutionary dynamics","level":3,"score":0.4143507480621338},{"id":"https://openalex.org/C159149176","wikidata":"https://www.wikidata.org/wiki/Q14489129","display_name":"Evolutionary algorithm","level":2,"score":0.3826788663864136},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.33844220638275146},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.16251340508460999},{"id":"https://openalex.org/C149923435","wikidata":"https://www.wikidata.org/wiki/Q37732","display_name":"Demography","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C2908647359","wikidata":"https://www.wikidata.org/wiki/Q2625603","display_name":"Population","level":2,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/tamd.2010.2051031","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tamd.2010.2051031","pdf_url":null,"source":{"id":"https://openalex.org/S108448409","display_name":"IEEE Transactions on Autonomous Mental Development","issn_l":"1943-0604","issn":["1943-0604","1943-0612"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Autonomous Mental Development","raw_type":"journal-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.180.1045","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.180.1045","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www-personal.umich.edu/%7Erickl/pubs/singh-lewis-barto-sorg-2010-ieee-draft.pdf","raw_type":"text"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.363.6310","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.363.6310","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www-personal.umich.edu/~rickl/pubs/singh-lewis-barto-2010-ieee.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":69,"referenced_works":["https://openalex.org/W91121345","https://openalex.org/W172298727","https://openalex.org/W341910993","https://openalex.org/W1486707268","https://openalex.org/W1488197128","https://openalex.org/W1491843047","https://openalex.org/W1499408472","https://openalex.org/W1534035591","https://openalex.org/W1557517019","https://openalex.org/W1572462007","https://openalex.org/W1588195558","https://openalex.org/W1592847719","https://openalex.org/W1777239053","https://openalex.org/W1819200667","https://openalex.org/W1823666162","https://openalex.org/W1890753574","https://openalex.org/W1964986634","https://openalex.org/W1974142402","https://openalex.org/W1989616852","https://openalex.org/W2000514530","https://openalex.org/W2025440394","https://openalex.org/W2034248365","https://openalex.org/W2035737909","https://openalex.org/W2045154514","https://openalex.org/W2052729098","https://openalex.org/W2060066549","https://openalex.org/W2079247031","https://openalex.org/W2091565802","https://openalex.org/W2097381042","https://openalex.org/W2100677568","https://openalex.org/W2101524054","https://openalex.org/W2107726111","https://openalex.org/W2121863487","https://openalex.org/W2122480991","https://openalex.org/W2130750514","https://openalex.org/W2132057084","https://openalex.org/W2135209725","https://openalex.org/W2135995480","https://openalex.org/W2139612737","https://openalex.org/W2148228571","https://openalex.org/W2155511972","https://openalex.org/W2163533082","https://openalex.org/W2164424353","https://openalex.org/W2167815629","https://openalex.org/W2170899200","https://openalex.org/W2236326974","https://openalex.org/W2317722949","https://openalex.org/W2503173364","https://openalex.org/W2592535843","https://openalex.org/W2798944292","https://openalex.org/W2802872143","https://openalex.org/W2998349125","https://openalex.org/W3011120880","https://openalex.org/W3019273456","https://openalex.org/W3041202696","https://openalex.org/W3103379718","https://openalex.org/W3122539908","https://openalex.org/W3168937714","https://openalex.org/W4214717370","https://openalex.org/W4243355778","https://openalex.org/W4247135518","https://openalex.org/W4249441547","https://openalex.org/W4285719527","https://openalex.org/W6607097208","https://openalex.org/W6611564366","https://openalex.org/W6630125228","https://openalex.org/W6638088447","https://openalex.org/W6680368475","https://openalex.org/W6684935223"],"related_works":["https://openalex.org/W4306904969","https://openalex.org/W2138720691","https://openalex.org/W4362501864","https://openalex.org/W4380318855","https://openalex.org/W4385188875","https://openalex.org/W4381586542","https://openalex.org/W2011837598","https://openalex.org/W1976294505","https://openalex.org/W2095960527","https://openalex.org/W4212806423"],"abstract_inverted_index":{"There":[0],"is":[1],"great":[2],"interest":[3],"in":[4],"building":[5],"intrinsic":[6,18,85,112],"motivation":[7,19],"into":[8],"artificial":[9],"systems":[10],"using":[11],"the":[12,54,93,101,118,121],"reinforcement":[13],"learning":[14],"framework.":[15],"Yet,":[16],"what":[17],"may":[20,26,81],"mean":[21],"computationally,":[22],"and":[23,34,45,86,92,108,113,126],"how":[24],"it":[25],"differ":[27],"from":[28],"extrinsic":[29,87,114],"motivation,":[30],"remains":[31],"a":[32,47,131],"murky":[33],"controversial":[35],"subject.":[36],"In":[37],"this":[38],"paper,":[39],"we":[40],"adopt":[41],"an":[42],"evolutionary":[43,65,90,127],"perspective":[44,91],"define":[46],"new":[48],"optimal":[49,77,95],"reward":[50,60,79,96,115],"framework":[51,97],"that":[52,62,76,103],"captures":[53],"pressure":[55],"to":[56,64,100],"design":[57],"good":[58],"primary":[59,78],"functions":[61],"lead":[63,99],"success":[66,128],"across":[67],"environments.":[68],"The":[69,89],"results":[70],"of":[71,120],"two":[72],"computational":[73],"experiments":[74],"show":[75],"signals":[80],"yield":[82],"both":[83],"emergent":[84],"motivation.":[88],"associated":[94],"thus":[98],"conclusion":[102],"there":[104],"are":[105],"no":[106],"hard":[107],"fast":[109],"features":[110],"distinguishing":[111],"computationally.":[116],"Rather,":[117],"directness":[119],"relationship":[122],"between":[123],"rewarding":[124],"behavior":[125],"varies":[129],"along":[130],"continuum.":[132]},"counts_by_year":[{"year":2026,"cited_by_count":7},{"year":2025,"cited_by_count":14},{"year":2024,"cited_by_count":21},{"year":2023,"cited_by_count":30},{"year":2022,"cited_by_count":30},{"year":2021,"cited_by_count":54},{"year":2020,"cited_by_count":34},{"year":2019,"cited_by_count":40},{"year":2018,"cited_by_count":28},{"year":2017,"cited_by_count":17},{"year":2016,"cited_by_count":21},{"year":2015,"cited_by_count":14},{"year":2014,"cited_by_count":29},{"year":2013,"cited_by_count":26},{"year":2012,"cited_by_count":19}],"updated_date":"2026-04-22T08:38:42.863108","created_date":"2025-10-10T00:00:00"}
