{"id":"https://openalex.org/W6910786293","doi":"https://doi.org/10.48550/arxiv.2507.11482","title":"Illuminating the Three Dogmas of Reinforcement Learning under Evolutionary Light","display_name":"Illuminating the Three Dogmas of Reinforcement Learning under Evolutionary Light","publication_year":2025,"publication_date":"2025-07-15","ids":{"openalex":"https://openalex.org/W6910786293","doi":"https://doi.org/10.48550/arxiv.2507.11482"},"language":"en","primary_location":{"id":"doi:10.48550/arxiv.2507.11482","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2507.11482","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2507.11482","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Hamidi, Mani","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hamidi, Mani","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Deacon, Terrence W.","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Deacon, Terrence W.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":true,"primary_topic":{"id":"https://openalex.org/T11883","display_name":"Embodied and Extended Cognition","score":0.28700000047683716,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T11883","display_name":"Embodied and Extended Cognition","score":0.28700000047683716,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11252","display_name":"Evolutionary Game Theory and Cooperation","score":0.18240000307559967,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.14380000531673431,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6991999745368958},{"id":"https://openalex.org/keywords/agency","display_name":"Agency (philosophy)","score":0.5216000080108643},{"id":"https://openalex.org/keywords/sustenance","display_name":"Sustenance","score":0.5164999961853027},{"id":"https://openalex.org/keywords/scope","display_name":"Scope (computer science)","score":0.46810001134872437},{"id":"https://openalex.org/keywords/evolutionary-theory","display_name":"Evolutionary theory","score":0.44200000166893005},{"id":"https://openalex.org/keywords/artificial-life","display_name":"Artificial life","score":0.43790000677108765},{"id":"https://openalex.org/keywords/mechanism","display_name":"Mechanism (biology)","score":0.3982999920845032},{"id":"https://openalex.org/keywords/evolutionary-dynamics","display_name":"Evolutionary dynamics","score":0.37959998846054077},{"id":"https://openalex.org/keywords/niche-construction","display_name":"Niche construction","score":0.35040000081062317}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6991999745368958},{"id":"https://openalex.org/C188147891","wikidata":"https://www.wikidata.org/wiki/Q147638","display_name":"Cognitive science","level":1,"score":0.5539000034332275},{"id":"https://openalex.org/C108170787","wikidata":"https://www.wikidata.org/wiki/Q3951828","display_name":"Agency (philosophy)","level":2,"score":0.5216000080108643},{"id":"https://openalex.org/C2776351498","wikidata":"https://www.wikidata.org/wiki/Q1434188","display_name":"Sustenance","level":2,"score":0.5164999961853027},{"id":"https://openalex.org/C2778012447","wikidata":"https://www.wikidata.org/wiki/Q1034415","display_name":"Scope (computer science)","level":2,"score":0.46810001134872437},{"id":"https://openalex.org/C2989147100","wikidata":"https://www.wikidata.org/wiki/Q1063","display_name":"Evolutionary theory","level":2,"score":0.44200000166893005},{"id":"https://openalex.org/C19273510","wikidata":"https://www.wikidata.org/wiki/Q263847","display_name":"Artificial life","level":2,"score":0.43790000677108765},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4036000072956085},{"id":"https://openalex.org/C89611455","wikidata":"https://www.wikidata.org/wiki/Q6804646","display_name":"Mechanism (biology)","level":2,"score":0.3982999920845032},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.38960000872612},{"id":"https://openalex.org/C171578705","wikidata":"https://www.wikidata.org/wiki/Q5418700","display_name":"Evolutionary dynamics","level":3,"score":0.37959998846054077},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.362199991941452},{"id":"https://openalex.org/C10437067","wikidata":"https://www.wikidata.org/wiki/Q1139192","display_name":"Niche construction","level":2,"score":0.35040000081062317},{"id":"https://openalex.org/C2164484","wikidata":"https://www.wikidata.org/wiki/Q5170150","display_name":"Core (optical fiber)","level":2,"score":0.3481000065803528},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3418999910354614},{"id":"https://openalex.org/C2988562018","wikidata":"https://www.wikidata.org/wiki/Q1063","display_name":"Biological evolution","level":2,"score":0.33799999952316284},{"id":"https://openalex.org/C199505168","wikidata":"https://www.wikidata.org/wiki/Q3267529","display_name":"Evolutionary robotics","level":3,"score":0.33649998903274536},{"id":"https://openalex.org/C72362118","wikidata":"https://www.wikidata.org/wiki/Q1356572","display_name":"Exaptation","level":2,"score":0.3257000148296356},{"id":"https://openalex.org/C92150231","wikidata":"https://www.wikidata.org/wiki/Q219695","display_name":"Evolutionary psychology","level":2,"score":0.3197000026702881},{"id":"https://openalex.org/C20249471","wikidata":"https://www.wikidata.org/wiki/Q2298789","display_name":"Evolutionary game theory","level":3,"score":0.311599999666214},{"id":"https://openalex.org/C137583809","wikidata":"https://www.wikidata.org/wiki/Q1096404","display_name":"Modern evolutionary synthesis","level":2,"score":0.31049999594688416},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.2989000082015991},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.29809999465942383},{"id":"https://openalex.org/C159149176","wikidata":"https://www.wikidata.org/wiki/Q14489129","display_name":"Evolutionary algorithm","level":2,"score":0.2919999957084656},{"id":"https://openalex.org/C2776184637","wikidata":"https://www.wikidata.org/wiki/Q6506039","display_name":"Living systems","level":2,"score":0.27480000257492065},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.2718000113964081},{"id":"https://openalex.org/C154848440","wikidata":"https://www.wikidata.org/wiki/Q1382559","display_name":"Evolutionary economics","level":2,"score":0.26820001006126404},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.2669000029563904},{"id":"https://openalex.org/C132010649","wikidata":"https://www.wikidata.org/wiki/Q189222","display_name":"Intuition","level":2,"score":0.2574999928474426},{"id":"https://openalex.org/C7955714","wikidata":"https://www.wikidata.org/wiki/Q12056630","display_name":"Structure and agency","level":2,"score":0.2563999891281128},{"id":"https://openalex.org/C92393732","wikidata":"https://www.wikidata.org/wiki/Q1790374","display_name":"Learning theory","level":2,"score":0.2540999948978424},{"id":"https://openalex.org/C196187386","wikidata":"https://www.wikidata.org/wiki/Q1050187","display_name":"Sociocultural evolution","level":2,"score":0.25360000133514404}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2507.11482","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2507.11482","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2507.11482","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2507.11482","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Three":[0],"core":[1],"tenets":[2],"of":[3,9,13,18,72,114,125,160,164,200],"reinforcement":[4,212],"learning":[5,213],"(RL)--concerning":[6],"the":[7,11,16,19,102,111,119,123,126,136,153,158,170,174,180,198],"definition":[8],"agency,":[10],"objective":[12],"learning,":[14,74],"and":[15,35,55,91,202,210],"scope":[17],"reward":[20,127,138],"hypothesis--have":[21],"been":[22],"highlighted":[23],"as":[24,69],"key":[25],"targets":[26],"for":[27,33,146,207],"conceptual":[28],"revision,":[29],"with":[30],"major":[31],"implications":[32,145],"theory":[34],"application.":[36],"We":[37,51,98,116,166,190],"propose":[38],"a":[39,70,161,187],"framework,":[40],"inspired":[41],"by":[42,100],"open-ended":[43],"evolutionary":[44,79,107,132,175],"theory,":[45,196],"to":[46,67,95,109,134,152],"reconsider":[47],"these":[48],"three":[49],"\"dogmas.\"":[50],"revisit":[52],"each":[53],"assumption":[54],"address":[56,118],"related":[57],"concerns":[58],"raised":[59],"alongside":[60],"them.":[61],"To":[62],"make":[63],"our":[64],"arguments":[65],"relevant":[66],"RL":[68],"model":[71],"biological":[73,215],"we":[75,150],"first":[76],"establish":[77],"that":[78,168],"dynamics":[80],"can":[81],"plausibly":[82],"operate":[83],"within":[84],"living":[85],"brains":[86],"over":[87],"an":[88],"individual's":[89],"lifetime,":[90],"are":[92],"not":[93],"confined":[94],"cross-generational":[96],"processes.":[97],"begin":[99],"revisiting":[101],"second":[103],"dogma,":[104],"drawing":[105],"on":[106],"insights":[108],"enrich":[110],"\"adaptation-rather-than-search\"":[112],"view":[113],"learning.":[115],"then":[117],"third":[120],"dogma":[121],"regarding":[122],"limits":[124],"hypothesis,":[128],"using":[129],"analogies":[130],"from":[131,194],"fitness":[133],"illuminate":[135],"scalar":[137],"vs.":[139],"multi-objective":[140],"debate.":[141],"After":[142],"discussing":[143],"practical":[144],"exploration":[147],"in":[148,186,214],"RL,":[149],"turn":[151],"first--and":[154],"arguably":[155],"most":[156],"fundamental--issue:":[157],"absence":[159],"formal":[162],"account":[163],"agency.":[165],"argue":[167],"unlike":[169],"other":[171],"two":[172],"problems,":[173],"paradigm":[176],"alone":[177],"cannot":[178],"resolve":[179],"agency":[181,209],"question,":[182],"though":[183],"it":[184],"gestures":[185],"productive":[188],"direction.":[189],"advocate":[191],"integrating":[192],"ideas":[193],"origins-of-life":[195],"where":[197],"thermodynamics":[199],"sustenance":[201],"replication":[203],"offer":[204],"promising":[205],"foundations":[206],"understanding":[208],"resource-constrained":[211],"systems.":[216]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
