{"id":"https://openalex.org/W2791696004","doi":"https://doi.org/10.1109/cig.2018.8490448","title":"Automated Curriculum Learning by Rewarding Temporally Rare Events","display_name":"Automated Curriculum Learning by Rewarding Temporally Rare Events","publication_year":2018,"publication_date":"2018-08-01","ids":{"openalex":"https://openalex.org/W2791696004","doi":"https://doi.org/10.1109/cig.2018.8490448","mag":"2791696004"},"language":"en","primary_location":{"id":"doi:10.1109/cig.2018.8490448","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cig.2018.8490448","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 IEEE Conference on Computational Intelligence and Games (CIG)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://pure.itu.dk/portal/da/publications/0eaa5511-f8a3-4b04-88e6-85fb89437c0d","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5043102938","display_name":"Niels Justesen","orcid":"https://orcid.org/0000-0001-5381-5498"},"institutions":[{"id":"https://openalex.org/I83467386","display_name":"IT University of Copenhagen","ror":"https://ror.org/02309jg23","country_code":"DK","type":"education","lineage":["https://openalex.org/I83467386"]}],"countries":["DK"],"is_corresponding":true,"raw_author_name":"Niels Justesen","raw_affiliation_strings":["IT University of Copenhagen, Copenhagen, Denmark","[IT University of Copenhagen, Copenhagen, Denmark]"],"affiliations":[{"raw_affiliation_string":"IT University of Copenhagen, Copenhagen, Denmark","institution_ids":["https://openalex.org/I83467386"]},{"raw_affiliation_string":"[IT University of Copenhagen, Copenhagen, Denmark]","institution_ids":["https://openalex.org/I83467386"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5020511097","display_name":"Sebastian Risi","orcid":"https://orcid.org/0000-0003-3607-8400"},"institutions":[{"id":"https://openalex.org/I83467386","display_name":"IT University of Copenhagen","ror":"https://ror.org/02309jg23","country_code":"DK","type":"education","lineage":["https://openalex.org/I83467386"]}],"countries":["DK"],"is_corresponding":false,"raw_author_name":"Sebastian Risi","raw_affiliation_strings":["IT University of Copenhagen, Copenhagen, Denmark","[IT University of Copenhagen, Copenhagen, Denmark]"],"affiliations":[{"raw_affiliation_string":"IT University of Copenhagen, Copenhagen, Denmark","institution_ids":["https://openalex.org/I83467386"]},{"raw_affiliation_string":"[IT University of Copenhagen, Copenhagen, Denmark]","institution_ids":["https://openalex.org/I83467386"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5043102938"],"corresponding_institution_ids":["https://openalex.org/I83467386"],"apc_list":null,"apc_paid":null,"fwci":0.39712492,"has_fulltext":true,"cited_by_count":2,"citation_normalized_percentile":{"value":0.65544261,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9833999872207642,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11975","display_name":"Evolutionary Algorithms and Applications","score":0.9782999753952026,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7735906839370728},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7220795750617981},{"id":"https://openalex.org/keywords/event","display_name":"Event (particle physics)","score":0.6110211610794067},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.5597408413887024},{"id":"https://openalex.org/keywords/simple","display_name":"Simple (philosophy)","score":0.5373062491416931},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4779786467552185},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.35289663076400757},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.35073578357696533},{"id":"https://openalex.org/keywords/cognitive-psychology","display_name":"Cognitive psychology","score":0.3227250277996063},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.2635209560394287}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7735906839370728},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7220795750617981},{"id":"https://openalex.org/C2779662365","wikidata":"https://www.wikidata.org/wiki/Q5416694","display_name":"Event (particle physics)","level":2,"score":0.6110211610794067},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.5597408413887024},{"id":"https://openalex.org/C2780586882","wikidata":"https://www.wikidata.org/wiki/Q7520643","display_name":"Simple (philosophy)","level":2,"score":0.5373062491416931},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4779786467552185},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.35289663076400757},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.35073578357696533},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.3227250277996063},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.2635209560394287},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C78458016","wikidata":"https://www.wikidata.org/wiki/Q840400","display_name":"Evolutionary biology","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0}],"mesh":[],"locations_count":6,"locations":[{"id":"doi:10.1109/cig.2018.8490448","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cig.2018.8490448","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 IEEE Conference on Computational Intelligence and Games (CIG)","raw_type":"proceedings-article"},{"id":"pmh:oai:pure.atira.dk:openaire/0eaa5511-f8a3-4b04-88e6-85fb89437c0d","is_oa":true,"landing_page_url":"https://pure.itu.dk/portal/da/publications/0eaa5511-f8a3-4b04-88e6-85fb89437c0d","pdf_url":null,"source":null,"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Justesen, N & Risi, S 2018, Automated Curriculum Learning by Rewarding Temporally Rare Events. in 2018 IEEE Conference on Computational Intelligence and Games. IEEE, pp. 293-300. < https://arxiv.org/pdf/1803.07131.pdf >","raw_type":"info:eu-repo/semantics/publishedVersion"},{"id":"pmh:oai:arXiv.org:1803.07131","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1803.07131","pdf_url":"https://arxiv.org/pdf/1803.07131","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"mag:2791696004","is_oa":true,"landing_page_url":"https://arxiv.org/pdf/1803.07131","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},{"id":"pmh:oai:pure.atira.dk:publications/0eaa5511-f8a3-4b04-88e6-85fb89437c0d","is_oa":true,"landing_page_url":"https://arxiv.org/pdf/1803.07131.pdf","pdf_url":null,"source":{"id":"https://openalex.org/S4377196680","display_name":"IT University Of Copenhagen (IT University of Copenhagen)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I83467386","host_organization_name":"IT University of Copenhagen","host_organization_lineage":["https://openalex.org/I83467386"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Justesen, N & Risi, S 2018, Automated Curriculum Learning by Rewarding Temporally Rare Events. in 2018 IEEE Conference on Computational Intelligence and Games. IEEE, pp. 293-300. < https://arxiv.org/pdf/1803.07131.pdf >","raw_type":"info:eu-repo/semantics/publishedVersion"},{"id":"doi:10.48550/arxiv.1803.07131","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.1803.07131","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:pure.atira.dk:openaire/0eaa5511-f8a3-4b04-88e6-85fb89437c0d","is_oa":true,"landing_page_url":"https://pure.itu.dk/portal/da/publications/0eaa5511-f8a3-4b04-88e6-85fb89437c0d","pdf_url":null,"source":null,"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Justesen, N & Risi, S 2018, Automated Curriculum Learning by Rewarding Temporally Rare Events. in 2018 IEEE Conference on Computational Intelligence and Games. IEEE, pp. 293-300. < https://arxiv.org/pdf/1803.07131.pdf >","raw_type":"info:eu-repo/semantics/publishedVersion"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.5400000214576721,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320319918","display_name":"York University","ror":"https://ror.org/05fq50484"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":75,"referenced_works":["https://openalex.org/W142858861","https://openalex.org/W758372786","https://openalex.org/W1130790960","https://openalex.org/W1560435054","https://openalex.org/W1674110665","https://openalex.org/W1763311249","https://openalex.org/W1966114254","https://openalex.org/W2000514530","https://openalex.org/W2034806191","https://openalex.org/W2077287406","https://openalex.org/W2079246448","https://openalex.org/W2113122939","https://openalex.org/W2116386744","https://openalex.org/W2145339207","https://openalex.org/W2151083897","https://openalex.org/W2160589914","https://openalex.org/W2170899200","https://openalex.org/W2171658832","https://openalex.org/W2296073425","https://openalex.org/W2335959470","https://openalex.org/W2362143032","https://openalex.org/W2417089653","https://openalex.org/W2419612459","https://openalex.org/W2462548332","https://openalex.org/W2522489477","https://openalex.org/W2550182557","https://openalex.org/W2558518165","https://openalex.org/W2596367596","https://openalex.org/W2604268026","https://openalex.org/W2733961795","https://openalex.org/W2735796404","https://openalex.org/W2736601468","https://openalex.org/W2749807327","https://openalex.org/W2749928749","https://openalex.org/W2751516180","https://openalex.org/W2753316839","https://openalex.org/W2778749116","https://openalex.org/W2789073708","https://openalex.org/W2950471160","https://openalex.org/W2951948137","https://openalex.org/W2952578114","https://openalex.org/W2952791429","https://openalex.org/W2963523627","https://openalex.org/W2963871073","https://openalex.org/W2964043796","https://openalex.org/W2964282857","https://openalex.org/W4212793374","https://openalex.org/W4300107936","https://openalex.org/W6605846256","https://openalex.org/W6622219343","https://openalex.org/W6650587873","https://openalex.org/W6682441423","https://openalex.org/W6683436435","https://openalex.org/W6692846177","https://openalex.org/W6696324988","https://openalex.org/W6703271639","https://openalex.org/W6711864727","https://openalex.org/W6716653466","https://openalex.org/W6717230150","https://openalex.org/W6727252785","https://openalex.org/W6729433768","https://openalex.org/W6729788943","https://openalex.org/W6729796140","https://openalex.org/W6731334075","https://openalex.org/W6735641298","https://openalex.org/W6736309856","https://openalex.org/W6736742618","https://openalex.org/W6740801417","https://openalex.org/W6741002519","https://openalex.org/W6743756900","https://openalex.org/W6743802245","https://openalex.org/W6744502524","https://openalex.org/W6746622358","https://openalex.org/W6780324855","https://openalex.org/W7034091645"],"related_works":["https://openalex.org/W2963473082","https://openalex.org/W2998135952","https://openalex.org/W3034558260","https://openalex.org/W3111373512","https://openalex.org/W1753708795","https://openalex.org/W2964654516","https://openalex.org/W2998312465","https://openalex.org/W2166494941","https://openalex.org/W1607218107","https://openalex.org/W2400719195","https://openalex.org/W2949969799","https://openalex.org/W2996110979","https://openalex.org/W1130790960","https://openalex.org/W1453801241","https://openalex.org/W2986106408","https://openalex.org/W2950172727","https://openalex.org/W3034769194","https://openalex.org/W2726187156","https://openalex.org/W3022312285","https://openalex.org/W3152069551"],"abstract_inverted_index":{"Reward":[0],"shaping":[1],"allows":[2],"reinforcement":[3],"learning":[4,9,85],"(RL)":[5],"agents":[6],"to":[7,21,62,90,108,116,137],"accelerate":[8],"by":[10,43,93,159],"receiving":[11],"additional":[12],"reward":[13,39,76,119],"signals.":[14],"However,":[15],"these":[16],"signals":[17],"can":[18],"be":[19,91],"difficult":[20],"design":[22],"manually,":[23],"especially":[24],"for":[25],"complex":[26],"RL":[27,154],"tasks.":[28],"We":[29,96],"propose":[30],"a":[31,80,130,164],"simple":[32],"and":[33],"general":[34],"approach":[35,104],"that":[36,86,98,127,134,156],"determines":[37],"the":[38,60,94,106,117,121,124,141],"of":[40,67,74,82,101,166],"pre-defined":[41],"events":[42,48,68,144],"their":[44,147],"rarity":[45,148],"alone.":[46],"Here":[47],"become":[49],"less":[50],"rewarding":[51],"as":[52,69],"they":[53],"are":[54,157],"experienced":[55],"more":[56,131],"often,":[57],"which":[58],"encourages":[59],"agent":[61,107],"continually":[63],"explore":[64],"new":[65],"types":[66],"it":[70],"learns.":[71],"The":[72],"adaptiveness":[73],"this":[75,99],"function":[77],"results":[78,125],"in":[79,110,140,151],"form":[81],"automated":[83],"curriculum":[84],"does":[87],"not":[88],"have":[89],"specified":[92],"experimenter.":[95],"demonstrate":[97,126],"\\emph{Rarity":[100],"Events}":[102],"(RoE)":[103],"enables":[105],"succeed":[109],"challenging":[111],"VizDoom":[112],"scenarios":[113],"without":[114],"access":[115],"extrinsic":[118,161],"from":[120],"environment.":[122,142],"Furthermore,":[123],"RoE":[128],"learns":[129],"versatile":[132],"policy":[133],"adapts":[135],"well":[136],"critical":[138],"changes":[139],"Rewarding":[143],"based":[145],"on":[146],"could":[149],"help":[150],"many":[152],"unsolved":[153],"environments":[155],"characterized":[158],"sparse":[160],"rewards":[162],"but":[163],"plethora":[165],"known":[167],"event":[168],"types.":[169]},"counts_by_year":[{"year":2021,"cited_by_count":1},{"year":2018,"cited_by_count":1}],"updated_date":"2026-02-09T09:26:11.010843","created_date":"2025-10-10T00:00:00"}
