{"id":"https://openalex.org/W3091795298","doi":"https://doi.org/10.1109/tnnls.2022.3160173","title":"Instance Weighted Incremental Evolution Strategies for Reinforcement Learning in Dynamic Environments","display_name":"Instance Weighted Incremental Evolution Strategies for Reinforcement Learning in Dynamic Environments","publication_year":2022,"publication_date":"2022-03-29","ids":{"openalex":"https://openalex.org/W3091795298","doi":"https://doi.org/10.1109/tnnls.2022.3160173","mag":"3091795298","pmid":"https://pubmed.ncbi.nlm.nih.gov/35349452"},"language":"en","primary_location":{"id":"doi:10.1109/tnnls.2022.3160173","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2022.3160173","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},"type":"article","indexed_in":["arxiv","crossref","pubmed"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2010.04605","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100376415","display_name":"Zhi Wang","orcid":"https://orcid.org/0000-0003-0304-3965"},"institutions":[{"id":"https://openalex.org/I188329596","display_name":"University of Canberra","ror":"https://ror.org/04s1nv328","country_code":"AU","type":"education","lineage":["https://openalex.org/I188329596"]},{"id":"https://openalex.org/I31746571","display_name":"UNSW Sydney","ror":"https://ror.org/03r8z3t63","country_code":"AU","type":"education","lineage":["https://openalex.org/I31746571"]},{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["AU","CN"],"is_corresponding":true,"raw_author_name":"Zhi Wang","raw_affiliation_strings":["Department of Control and Systems Engineering, Nanjing University, Nanjing, China","School of Engineering and Information Technology, University of New South Wales, Canberra, ACT, Australia"],"affiliations":[{"raw_affiliation_string":"Department of Control and Systems Engineering, Nanjing University, Nanjing, China","institution_ids":["https://openalex.org/I881766915"]},{"raw_affiliation_string":"School of Engineering and Information Technology, University of New South Wales, Canberra, ACT, Australia","institution_ids":["https://openalex.org/I188329596","https://openalex.org/I31746571"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100697167","display_name":"Chunlin Chen","orcid":"https://orcid.org/0000-0003-3929-4707"},"institutions":[{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chunlin Chen","raw_affiliation_strings":["Department of Control and Systems Engineering, Nanjing University, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"Department of Control and Systems Engineering, Nanjing University, Nanjing, China","institution_ids":["https://openalex.org/I881766915"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5000582423","display_name":"Daoyi Dong","orcid":"https://orcid.org/0000-0002-7425-3559"},"institutions":[{"id":"https://openalex.org/I188329596","display_name":"University of Canberra","ror":"https://ror.org/04s1nv328","country_code":"AU","type":"education","lineage":["https://openalex.org/I188329596"]},{"id":"https://openalex.org/I31746571","display_name":"UNSW Sydney","ror":"https://ror.org/03r8z3t63","country_code":"AU","type":"education","lineage":["https://openalex.org/I31746571"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Daoyi Dong","raw_affiliation_strings":["School of Engineering and Information Technology, University of New South Wales, Canberra, ACT, Australia"],"affiliations":[{"raw_affiliation_string":"School of Engineering and Information Technology, University of New South Wales, Canberra, ACT, Australia","institution_ids":["https://openalex.org/I188329596","https://openalex.org/I31746571"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5100376415"],"corresponding_institution_ids":["https://openalex.org/I188329596","https://openalex.org/I31746571","https://openalex.org/I881766915"],"apc_list":null,"apc_paid":null,"fwci":2.0823,"has_fulltext":false,"cited_by_count":19,"citation_normalized_percentile":{"value":0.88441361,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"34","issue":"12","first_page":"9742","last_page":"9756"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11975","display_name":"Evolutionary Algorithms and Applications","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11975","display_name":"Evolutionary Algorithms and Applications","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10100","display_name":"Metaheuristic Optimization Algorithms Research","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8455126285552979},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8086063861846924},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.7520785331726074},{"id":"https://openalex.org/keywords/weighting","display_name":"Weighting","score":0.6197762489318848},{"id":"https://openalex.org/keywords/novelty","display_name":"Novelty","score":0.6078059673309326},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.5832988619804382},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5583330988883972},{"id":"https://openalex.org/keywords/incremental-learning","display_name":"Incremental learning","score":0.5017766952514648},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.46876734495162964}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8455126285552979},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8086063861846924},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.7520785331726074},{"id":"https://openalex.org/C183115368","wikidata":"https://www.wikidata.org/wiki/Q856577","display_name":"Weighting","level":2,"score":0.6197762489318848},{"id":"https://openalex.org/C2778738651","wikidata":"https://www.wikidata.org/wiki/Q16546687","display_name":"Novelty","level":2,"score":0.6078059673309326},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.5832988619804382},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5583330988883972},{"id":"https://openalex.org/C2780735816","wikidata":"https://www.wikidata.org/wiki/Q28324931","display_name":"Incremental learning","level":2,"score":0.5017766952514648},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.46876734495162964},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.0},{"id":"https://openalex.org/C27206212","wikidata":"https://www.wikidata.org/wiki/Q34178","display_name":"Theology","level":1,"score":0.0},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.0},{"id":"https://openalex.org/C126838900","wikidata":"https://www.wikidata.org/wiki/Q77604","display_name":"Radiology","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/tnnls.2022.3160173","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2022.3160173","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},{"id":"pmid:35349452","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/35349452","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on neural networks and learning systems","raw_type":null},{"id":"pmh:oai:arXiv.org:2010.04605","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2010.04605","pdf_url":"https://arxiv.org/pdf/2010.04605","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2010.04605","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2010.04605","pdf_url":"https://arxiv.org/pdf/2010.04605","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3174144325","display_name":null,"funder_award_id":"DP190101566","funder_id":"https://openalex.org/F4320334704","funder_display_name":"Australian Research Council"},{"id":"https://openalex.org/G4904587412","display_name":null,"funder_award_id":"62006111","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6081884918","display_name":null,"funder_award_id":"BK20200330","funder_id":"https://openalex.org/F4320322769","funder_display_name":"Natural Science Foundation of Jiangsu Province"},{"id":"https://openalex.org/G7996831764","display_name":null,"funder_award_id":"62073160","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320322769","display_name":"Natural Science Foundation of Jiangsu Province","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320334704","display_name":"Australian Research Council","ror":"https://ror.org/05mmh0f86"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":76,"referenced_works":["https://openalex.org/W1498178627","https://openalex.org/W1674110665","https://openalex.org/W1985602045","https://openalex.org/W1994955764","https://openalex.org/W2032277247","https://openalex.org/W2059654640","https://openalex.org/W2101524054","https://openalex.org/W2117539524","https://openalex.org/W2118556122","https://openalex.org/W2119717200","https://openalex.org/W2121863487","https://openalex.org/W2124175081","https://openalex.org/W2139047213","https://openalex.org/W2145339207","https://openalex.org/W2147585405","https://openalex.org/W2149933564","https://openalex.org/W2151083897","https://openalex.org/W2151965738","https://openalex.org/W2158782408","https://openalex.org/W2160512933","https://openalex.org/W2259258048","https://openalex.org/W2462102501","https://openalex.org/W2583496274","https://openalex.org/W2596367596","https://openalex.org/W2604763608","https://openalex.org/W2605102758","https://openalex.org/W2766447205","https://openalex.org/W2767050701","https://openalex.org/W2789543555","https://openalex.org/W2791387407","https://openalex.org/W2792645523","https://openalex.org/W2803180393","https://openalex.org/W2889970038","https://openalex.org/W2898585845","https://openalex.org/W2904998808","https://openalex.org/W2912681837","https://openalex.org/W2955616331","https://openalex.org/W2960705509","https://openalex.org/W2962974944","https://openalex.org/W2963305465","https://openalex.org/W2963446085","https://openalex.org/W2963614114","https://openalex.org/W2963641140","https://openalex.org/W2963790038","https://openalex.org/W2963859851","https://openalex.org/W2964043796","https://openalex.org/W2964227899","https://openalex.org/W2965407115","https://openalex.org/W2966477753","https://openalex.org/W2969189176","https://openalex.org/W2990747716","https://openalex.org/W2995627493","https://openalex.org/W2999912861","https://openalex.org/W3007384386","https://openalex.org/W3046093665","https://openalex.org/W3099100043","https://openalex.org/W3101442004","https://openalex.org/W4214717370","https://openalex.org/W6678114464","https://openalex.org/W6682132143","https://openalex.org/W6682262322","https://openalex.org/W6687681856","https://openalex.org/W6692846177","https://openalex.org/W6704571135","https://openalex.org/W6713348437","https://openalex.org/W6735641298","https://openalex.org/W6736057607","https://openalex.org/W6739193204","https://openalex.org/W6747092830","https://openalex.org/W6748317118","https://openalex.org/W6751617248","https://openalex.org/W6754782557","https://openalex.org/W6755353450","https://openalex.org/W6755903938","https://openalex.org/W6756463683","https://openalex.org/W6768560635"],"related_works":["https://openalex.org/W2381242807","https://openalex.org/W3126131230","https://openalex.org/W2347541121","https://openalex.org/W2080951048","https://openalex.org/W4288804799","https://openalex.org/W3032237421","https://openalex.org/W2390346111","https://openalex.org/W3011883280","https://openalex.org/W2369082698","https://openalex.org/W2401808953"],"abstract_inverted_index":{"Evolution":[0],"strategies":[1,170],"(ESs),":[2],"as":[3,12,22],"a":[4,13,48,67,193],"family":[5,194],"of":[6,91,118,195],"black-box":[7],"optimization":[8],"algorithms,":[9],"recently":[10],"emerge":[11],"scalable":[14,196],"alternative":[15],"to":[16,40,61,66,83,100,112,126,153,174,187,207],"reinforcement":[17],"learning":[18,51,86,205],"(RL)":[19],"approaches":[20],"such":[21],"Q-learning":[23],"or":[24],"policy":[25,65],"gradient":[26],"and":[27,132],"are":[28,37,98],"much":[29],"faster":[30],"when":[31],"many":[32],"central":[33],"processing":[34],"units":[35],"(CPUs)":[36],"available":[38],"due":[39],"better":[41],"parallelization.":[42],"In":[43],"this":[44],"article,":[45],"we":[46],"propose":[47,122],"systematic":[49],"incremental":[50,168],"method":[52],"for":[53,199],"ES":[54,82,197],"in":[55,145,159],"dynamic":[56,208],"environments.":[57,209],"The":[58,163],"goal":[59],"is":[60,172],"adjust":[62],"previously":[63],"learned":[64],"new":[68,105,115,161],"one":[69],"incrementally":[70],"whenever":[71],"the":[72,109,128,142,146,160],"environment":[73],"changes.":[74],"We":[75,121],"incorporate":[76],"an":[77,138,156],"instance":[78,130,133,150,157,166],"weighting":[79],"mechanism":[80],"with":[81],"facilitate":[84],"its":[85],"adaptation":[87,206],"while":[88,149],"retaining":[89],"scalability":[90],"ES.":[92],"During":[93],"parameter":[94,119],"updating,":[95],"higher":[96],"weights":[97],"assigned":[99],"instances":[101],"that":[102,202],"contain":[103],"more":[104],"knowledge,":[106],"thus":[107,191],"encouraging":[108],"search":[110],"distribution":[111],"move":[113],"toward":[114],"promising":[116],"areas":[117],"space.":[120],"two":[123],"easy-to-implement":[124],"metrics":[125],"calculate":[127],"weights:":[129],"novelty":[131,136],"quality.":[134],"Instance":[135],"measures":[137],"instance's":[139],"difference":[140],"from":[141,184],"previous":[143],"optimum":[144],"original":[147],"environment,":[148],"quality":[151],"corresponds":[152],"how":[154],"well":[155],"performs":[158],"environment.":[162],"resulting":[164],"algorithm,":[165],"weighted":[167],"evolution":[169],"(IW-IESs),":[171],"verified":[173],"achieve":[175],"significantly":[176],"improved":[177],"performance":[178],"on":[179],"challenging":[180],"RL":[181,200],"tasks":[182],"ranging":[183],"robot":[185],"navigation":[186],"locomotion.":[188],"This":[189],"article":[190],"introduces":[192],"algorithms":[198],"domains":[201],"enables":[203],"rapid":[204]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":9},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":3}],"updated_date":"2026-04-11T08:14:18.477133","created_date":"2025-10-10T00:00:00"}
