{"id":"https://openalex.org/W2107992190","doi":"https://doi.org/10.1109/cec.2011.5949655","title":"Revisiting the Acrobot &amp;#x2018;height&amp;#x2019; task: An example of efficient evolutionary policy search under an episodic goal seeking task","display_name":"Revisiting the Acrobot &amp;#x2018;height&amp;#x2019; task: An example of efficient evolutionary policy search under an episodic goal seeking task","publication_year":2011,"publication_date":"2011-06-01","ids":{"openalex":"https://openalex.org/W2107992190","doi":"https://doi.org/10.1109/cec.2011.5949655","mag":"2107992190"},"language":"en","primary_location":{"id":"doi:10.1109/cec.2011.5949655","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cec.2011.5949655","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2011 IEEE Congress of Evolutionary Computation (CEC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5015078188","display_name":"John A. Doucette","orcid":"https://orcid.org/0000-0003-4916-6258"},"institutions":[{"id":"https://openalex.org/I151746483","display_name":"University of Waterloo","ror":"https://ror.org/01aff2v68","country_code":"CA","type":"education","lineage":["https://openalex.org/I151746483"]}],"countries":["CA"],"is_corresponding":true,"raw_author_name":"John Doucette","raw_affiliation_strings":["Department of Computer Science, Waterloo University, ONT, Canada","Department of Computer Science, Waterloo University, ON. Canada"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, Waterloo University, ONT, Canada","institution_ids":["https://openalex.org/I151746483"]},{"raw_affiliation_string":"Department of Computer Science, Waterloo University, ON. Canada","institution_ids":["https://openalex.org/I151746483"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5003699164","display_name":"Malcolm I. Heywood","orcid":"https://orcid.org/0000-0002-1521-0671"},"institutions":[{"id":"https://openalex.org/I129902397","display_name":"Dalhousie University","ror":"https://ror.org/01e6qks80","country_code":"CA","type":"education","lineage":["https://openalex.org/I129902397"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Malcolm I. Heywood","raw_affiliation_strings":["Faculty of Computer Science, Dalhousie University, Halifax, NS, Canada","[Faculty of Computer Science, Dalhousie University, Halifax, NS, Canada]"],"affiliations":[{"raw_affiliation_string":"Faculty of Computer Science, Dalhousie University, Halifax, NS, Canada","institution_ids":["https://openalex.org/I129902397"]},{"raw_affiliation_string":"[Faculty of Computer Science, Dalhousie University, Halifax, NS, Canada]","institution_ids":["https://openalex.org/I129902397"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5015078188"],"corresponding_institution_ids":["https://openalex.org/I151746483"],"apc_list":null,"apc_paid":null,"fwci":1.2827,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.84093794,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":"9","issue":null,"first_page":"468","last_page":"475"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11975","display_name":"Evolutionary Algorithms and Applications","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11975","display_name":"Evolutionary Algorithms and Applications","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10100","display_name":"Metaheuristic Optimization Algorithms Research","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6680915355682373},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6546261310577393},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6299002170562744},{"id":"https://openalex.org/keywords/evolutionary-algorithm","display_name":"Evolutionary algorithm","score":0.5873143076896667},{"id":"https://openalex.org/keywords/heuristic","display_name":"Heuristic","score":0.5845296382904053},{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.519555389881134},{"id":"https://openalex.org/keywords/outcome","display_name":"Outcome (game theory)","score":0.5119792222976685},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5011320114135742},{"id":"https://openalex.org/keywords/population","display_name":"Population","score":0.47877824306488037},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.4479526877403259},{"id":"https://openalex.org/keywords/evolutionary-computation","display_name":"Evolutionary computation","score":0.44342130422592163},{"id":"https://openalex.org/keywords/genetic-algorithm","display_name":"Genetic algorithm","score":0.42931652069091797},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4146215319633484},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.3878452181816101},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1835000216960907},{"id":"https://openalex.org/keywords/economics","display_name":"Economics","score":0.1328166425228119},{"id":"https://openalex.org/keywords/microeconomics","display_name":"Microeconomics","score":0.10867691040039062}],"concepts":[{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6680915355682373},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6546261310577393},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6299002170562744},{"id":"https://openalex.org/C159149176","wikidata":"https://www.wikidata.org/wiki/Q14489129","display_name":"Evolutionary algorithm","level":2,"score":0.5873143076896667},{"id":"https://openalex.org/C173801870","wikidata":"https://www.wikidata.org/wiki/Q201413","display_name":"Heuristic","level":2,"score":0.5845296382904053},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.519555389881134},{"id":"https://openalex.org/C148220186","wikidata":"https://www.wikidata.org/wiki/Q7111912","display_name":"Outcome (game theory)","level":2,"score":0.5119792222976685},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5011320114135742},{"id":"https://openalex.org/C2908647359","wikidata":"https://www.wikidata.org/wiki/Q2625603","display_name":"Population","level":2,"score":0.47877824306488037},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.4479526877403259},{"id":"https://openalex.org/C105902424","wikidata":"https://www.wikidata.org/wiki/Q1197129","display_name":"Evolutionary computation","level":2,"score":0.44342130422592163},{"id":"https://openalex.org/C8880873","wikidata":"https://www.wikidata.org/wiki/Q187787","display_name":"Genetic algorithm","level":2,"score":0.42931652069091797},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4146215319633484},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.3878452181816101},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1835000216960907},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.1328166425228119},{"id":"https://openalex.org/C175444787","wikidata":"https://www.wikidata.org/wiki/Q39072","display_name":"Microeconomics","level":1,"score":0.10867691040039062},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C149923435","wikidata":"https://www.wikidata.org/wiki/Q37732","display_name":"Demography","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C78458016","wikidata":"https://www.wikidata.org/wiki/Q840400","display_name":"Evolutionary biology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cec.2011.5949655","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cec.2011.5949655","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2011 IEEE Congress of Evolutionary Computation (CEC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320334593","display_name":"Natural Sciences and Engineering Research Council of Canada","ror":"https://ror.org/01h531d29"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":30,"referenced_works":["https://openalex.org/W1583031142","https://openalex.org/W1914583973","https://openalex.org/W1983384754","https://openalex.org/W1984987629","https://openalex.org/W2018500972","https://openalex.org/W2058843673","https://openalex.org/W2089052147","https://openalex.org/W2098879935","https://openalex.org/W2100948575","https://openalex.org/W2107726111","https://openalex.org/W2111935653","https://openalex.org/W2121863487","https://openalex.org/W2142484475","https://openalex.org/W2142592520","https://openalex.org/W2148067905","https://openalex.org/W2154022540","https://openalex.org/W2163467402","https://openalex.org/W2285110183","https://openalex.org/W2492412168","https://openalex.org/W2610826712","https://openalex.org/W2997026295","https://openalex.org/W4214717370","https://openalex.org/W4232217679","https://openalex.org/W4253354958","https://openalex.org/W6640071088","https://openalex.org/W6675078049","https://openalex.org/W6676007687","https://openalex.org/W6681804199","https://openalex.org/W6682701150","https://openalex.org/W6696157080"],"related_works":["https://openalex.org/W2130703626","https://openalex.org/W4297582752","https://openalex.org/W4285805405","https://openalex.org/W2391924736","https://openalex.org/W3133779647","https://openalex.org/W1560122427","https://openalex.org/W1993493607","https://openalex.org/W2021957875","https://openalex.org/W2802808995","https://openalex.org/W2787833928"],"abstract_inverted_index":{"Evolutionary":[0],"methods":[1],"for":[2,63,112],"addressing":[3],"the":[4,27,30,48,82,89,164,169],"temporal":[5],"sequence":[6],"learning":[7],"problem":[8],"generally":[9],"fall":[10],"into":[11],"policy":[12,31,102,125],"search":[13,32,126],"as":[14,147,149],"opposed":[15],"to":[16,52,76,88,96],"value":[17,154],"function":[18,155],"optimization":[19],"approaches.":[20],"Various":[21],"re":[22],"cent":[23],"results":[24],"have":[25,60],"made":[26],"claim":[28],"that":[29,70],"approach":[33],"is":[34,50,74,119,159],"at":[35,38],"best":[36],"inefficient":[37],"solving":[39],"episodic":[40],"'goal":[41],"seeking'":[42],"tasks":[43,45],"i.e.,":[44],"under":[46,142],"which":[47],"reward":[49],"limited":[51],"describing":[53],"properties":[54],"associated":[55],"with":[56],"a":[57,72,77,106,114],"successful":[58],"outcome":[59],"no":[61],"qualification":[62],"degrees":[64],"of":[65,79,116,131],"failure.":[66],"This":[67,104],"work":[68],"demonstrates":[69,145],"such":[71],"conclusion":[73],"due":[75],"lack":[78],"diversity":[80],"in":[81,100],"training":[83,117],"scenarios.":[84],"We":[85],"therefore":[86],"return":[87],"Acrobot":[90],"'height'":[91],"task":[92],"domain":[93],"originally":[94],"used":[95],"demonstrate":[97],"complete":[98],"failure":[99],"evolutionary":[101,124],"search.":[103],"time":[105],"very":[107],"simple":[108],"stochastic":[109],"sampling":[110],"heuristic":[111],"defining":[113],"population":[115],"configurations":[118],"introduced.":[120],"Benchmarking":[121],"two":[122],"recent":[123],"algorithms":[127],"-":[128,141],"Neural":[129],"Evolution":[130],"Augmented":[132],"Topologies":[133],"(NEAT)":[134],"and":[135],"Symbiotic":[136],"Bid-Based":[137],"(SBB)":[138],"Genetic":[139],"Programming":[140],"this":[143,158],"condition":[144],"solutions":[146],"effective":[148],"those":[150],"returned":[151],"by":[152,168],"advanced":[153],"methods.":[156],"Moreover":[157],"achieved":[160],"while":[161],"remaining":[162],"within":[163],"evaluation":[165],"limit":[166],"imposed":[167],"original":[170],"study.":[171]},"counts_by_year":[{"year":2019,"cited_by_count":1},{"year":2015,"cited_by_count":1},{"year":2013,"cited_by_count":1},{"year":2012,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
