{"id":"https://openalex.org/W3014466575","doi":"https://doi.org/10.1109/cog47356.2020.9231802","title":"Obstacle Tower Without Human Demonstrations: How Far a Deep Feed-Forward Network Goes with Reinforcement Learning","display_name":"Obstacle Tower Without Human Demonstrations: How Far a Deep Feed-Forward Network Goes with Reinforcement Learning","publication_year":2020,"publication_date":"2020-08-01","ids":{"openalex":"https://openalex.org/W3014466575","doi":"https://doi.org/10.1109/cog47356.2020.9231802","mag":"3014466575"},"language":"en","primary_location":{"id":"doi:10.1109/cog47356.2020.9231802","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cog47356.2020.9231802","pdf_url":null,"source":{"id":"https://openalex.org/S4306498668","display_name":"2020 IEEE Conference on Games (CoG)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 IEEE Conference on Games (CoG)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2004.00567","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5056492267","display_name":"Marco Pleines","orcid":null},"institutions":[{"id":"https://openalex.org/I200332995","display_name":"TU Dortmund University","ror":"https://ror.org/01k97gp34","country_code":"DE","type":"education","lineage":["https://openalex.org/I200332995"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Marco Pleines","raw_affiliation_strings":["Faculty of Computer Science, Technische Universit\u00e4t Dortmund, Dortmund, Germany","Technical University of Dortmund,"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Faculty of Computer Science, Technische Universit\u00e4t Dortmund, Dortmund, Germany","institution_ids":["https://openalex.org/I200332995"]},{"raw_affiliation_string":"Technical University of Dortmund,","institution_ids":["https://openalex.org/I200332995"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085870953","display_name":"Jenia Jitsev","orcid":"https://orcid.org/0000-0002-1221-7851"},"institutions":[{"id":"https://openalex.org/I171892758","display_name":"Forschungszentrum J\u00fclich","ror":"https://ror.org/02nv7yv05","country_code":"DE","type":"facility","lineage":["https://openalex.org/I1305996414","https://openalex.org/I171892758"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Jenia Jitsev","raw_affiliation_strings":["Juelich Supercomputing Center (JSC), Helmholtz Research Center Juelich, Juelich, Germany","Forschungszentrum Julich"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Juelich Supercomputing Center (JSC), Helmholtz Research Center Juelich, Juelich, Germany","institution_ids":["https://openalex.org/I171892758"]},{"raw_affiliation_string":"Forschungszentrum Julich","institution_ids":["https://openalex.org/I171892758"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062774048","display_name":"Mike Preu\u00df","orcid":"https://orcid.org/0000-0003-4681-1346"},"institutions":[{"id":"https://openalex.org/I121797337","display_name":"Leiden University","ror":"https://ror.org/027bh9e22","country_code":"NL","type":"education","lineage":["https://openalex.org/I121797337"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Mike Preuss","raw_affiliation_strings":["LIACS, Universiteit Leiden, Leiden, NL","Leiden University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"LIACS, Universiteit Leiden, Leiden, NL","institution_ids":["https://openalex.org/I121797337"]},{"raw_affiliation_string":"Leiden University","institution_ids":["https://openalex.org/I121797337"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5017449879","display_name":"Fr\u00e4nk Zimmer","orcid":null},"institutions":[{"id":"https://openalex.org/I70865968","display_name":"Rhine-Waal University of Applied Sciences","ror":"https://ror.org/04wdt0z89","country_code":"DE","type":"education","lineage":["https://openalex.org/I70865968"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Frank Zimmer","raw_affiliation_strings":["Faculty of Communication and Environment, Hochschule Rhein-Waal, Kamp-Lintfort, Germany","Hochschule Rhein-Waal,Faculty of Communication and Environment,Kamp-Lintfort,Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Faculty of Communication and Environment, Hochschule Rhein-Waal, Kamp-Lintfort, Germany","institution_ids":["https://openalex.org/I70865968"]},{"raw_affiliation_string":"Hochschule Rhein-Waal,Faculty of Communication and Environment,Kamp-Lintfort,Germany","institution_ids":["https://openalex.org/I70865968"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.1115,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.35853954,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":"80","issue":null,"first_page":"447","last_page":"454"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11574","display_name":"Artificial Intelligence in Games","score":0.9955999851226807,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.9932000041007996,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7590023279190063},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.7114592790603638},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.710374653339386},{"id":"https://openalex.org/keywords/simple","display_name":"Simple (philosophy)","score":0.6587153673171997},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6570187211036682},{"id":"https://openalex.org/keywords/obstacle","display_name":"Obstacle","score":0.6545068621635437},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5681252479553223},{"id":"https://openalex.org/keywords/competition","display_name":"Competition (biology)","score":0.5288428068161011},{"id":"https://openalex.org/keywords/scratch","display_name":"Scratch","score":0.5118783712387085},{"id":"https://openalex.org/keywords/tower","display_name":"Tower","score":0.47444164752960205},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.3828935921192169},{"id":"https://openalex.org/keywords/cognitive-science","display_name":"Cognitive science","score":0.34498414397239685},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.16690361499786377},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.1277061402797699},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.07559573650360107},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.07359415292739868}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7590023279190063},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.7114592790603638},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.710374653339386},{"id":"https://openalex.org/C2780586882","wikidata":"https://www.wikidata.org/wiki/Q7520643","display_name":"Simple (philosophy)","level":2,"score":0.6587153673171997},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6570187211036682},{"id":"https://openalex.org/C2776650193","wikidata":"https://www.wikidata.org/wiki/Q264661","display_name":"Obstacle","level":2,"score":0.6545068621635437},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5681252479553223},{"id":"https://openalex.org/C91306197","wikidata":"https://www.wikidata.org/wiki/Q45767","display_name":"Competition (biology)","level":2,"score":0.5288428068161011},{"id":"https://openalex.org/C2781235140","wikidata":"https://www.wikidata.org/wiki/Q275131","display_name":"Scratch","level":2,"score":0.5118783712387085},{"id":"https://openalex.org/C2777831296","wikidata":"https://www.wikidata.org/wiki/Q12518","display_name":"Tower","level":2,"score":0.47444164752960205},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.3828935921192169},{"id":"https://openalex.org/C188147891","wikidata":"https://www.wikidata.org/wiki/Q147638","display_name":"Cognitive science","level":1,"score":0.34498414397239685},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.16690361499786377},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.1277061402797699},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.07559573650360107},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.07359415292739868},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C18903297","wikidata":"https://www.wikidata.org/wiki/Q7150","display_name":"Ecology","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C147176958","wikidata":"https://www.wikidata.org/wiki/Q77590","display_name":"Civil engineering","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1109/cog47356.2020.9231802","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cog47356.2020.9231802","pdf_url":null,"source":{"id":"https://openalex.org/S4306498668","display_name":"2020 IEEE Conference on Games (CoG)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 IEEE Conference on Games (CoG)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2004.00567","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2004.00567","pdf_url":"https://arxiv.org/pdf/2004.00567","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2004.00567","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2004.00567","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"},{"id":"mag:3014466575","is_oa":false,"landing_page_url":null,"pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":null}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2004.00567","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2004.00567","pdf_url":"https://arxiv.org/pdf/2004.00567","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3014466575.pdf","grobid_xml":"https://content.openalex.org/works/W3014466575.grobid-xml"},"referenced_works_count":45,"referenced_works":["https://openalex.org/W1506806321","https://openalex.org/W2121863487","https://openalex.org/W2145339207","https://openalex.org/W2150468603","https://openalex.org/W2194775991","https://openalex.org/W2534314849","https://openalex.org/W2626778328","https://openalex.org/W2736601468","https://openalex.org/W2810602713","https://openalex.org/W2891790128","https://openalex.org/W2903181768","https://openalex.org/W2914898814","https://openalex.org/W2960384012","https://openalex.org/W2962832483","https://openalex.org/W2963369679","https://openalex.org/W2963390419","https://openalex.org/W2963948533","https://openalex.org/W2966556569","https://openalex.org/W2970214542","https://openalex.org/W2970567787","https://openalex.org/W2973136764","https://openalex.org/W2973525135","https://openalex.org/W2982316857","https://openalex.org/W2994073215","https://openalex.org/W2996037775","https://openalex.org/W2999617596","https://openalex.org/W3103780890","https://openalex.org/W6692846177","https://openalex.org/W6739901393","https://openalex.org/W6741002519","https://openalex.org/W6744991969","https://openalex.org/W6746605513","https://openalex.org/W6748638692","https://openalex.org/W6750629867","https://openalex.org/W6754521519","https://openalex.org/W6756840741","https://openalex.org/W6757358677","https://openalex.org/W6765479255","https://openalex.org/W6767141496","https://openalex.org/W6767810603","https://openalex.org/W6767919266","https://openalex.org/W6769580333","https://openalex.org/W6771740491","https://openalex.org/W6771750343","https://openalex.org/W6772005887"],"related_works":["https://openalex.org/W2952991114","https://openalex.org/W2774719390","https://openalex.org/W3179916441","https://openalex.org/W1541535141","https://openalex.org/W2079037041","https://openalex.org/W2330409864","https://openalex.org/W3008890934","https://openalex.org/W3092361584","https://openalex.org/W2497427749","https://openalex.org/W3207459740","https://openalex.org/W2091618667","https://openalex.org/W2765412282","https://openalex.org/W148370670","https://openalex.org/W2788162021","https://openalex.org/W19223795","https://openalex.org/W3136024375","https://openalex.org/W2591550704","https://openalex.org/W3082535795","https://openalex.org/W2491558291","https://openalex.org/W2721289608"],"abstract_inverted_index":{"The":[0],"Obstacle":[1],"Tower":[2],"Challenge":[3],"is":[4,134,161],"the":[5,22,43,77,81,96,101,156],"task":[6,158],"to":[7,19,37,40,126,128,146],"master":[8],"a":[9,66,113,129,137],"procedurally":[10],"generated":[11],"chain":[12],"of":[13,27,61,80,132],"levels":[14],"that":[15,49,91,107,142],"subsequently":[16],"get":[17],"harder":[18],"complete.":[20],"Whereas":[21],"most":[23],"top":[24],"performing":[25],"entries":[26],"last":[28],"year's":[29],"competition":[30],"used":[31],"human":[32],"demonstrations":[33],"or":[34],"reward":[35],"shaping":[36],"learn":[38],"how":[39],"cope":[41],"with":[42,65,136],"challenge,":[44],"we":[45,124],"present":[46],"an":[47],"approach":[48,83,109],"performed":[50],"competitively":[51],"(placed":[52],"7th)":[53],"but":[54],"starts":[55],"completely":[56],"from":[57],"scratch":[58],"by":[59],"means":[60],"Deep":[62],"Reinforcement":[63],"Learning":[64],"relatively":[67,138],"simple":[68],"feed-forward":[69],"deep":[70],"network":[71],"structure.":[72],"We":[73],"especially":[74],"look":[75],"at":[76],"generalization":[78],"performance":[79],"taken":[82],"concerning":[84],"different":[85],"seeds":[86],"and":[87,98,104],"various":[88],"visual":[89,153],"themes":[90],"have":[92],"become":[93],"available":[94],"after":[95],"competition,":[97],"investigate":[99],"where":[100,155],"agent":[102],"fails":[103],"why.":[105],"Note":[106],"our":[108],"does":[110],"not":[111],"possess":[112],"short-term":[114],"memory":[115],"like":[116],"employing":[117],"recurrent":[118],"hidden":[119],"states.":[120],"With":[121],"this":[122],"work,":[123],"hope":[125],"contribute":[127],"better":[130],"understanding":[131],"what":[133],"possible":[135],"simple,":[139],"flexible":[140],"solution":[141],"can":[143],"be":[144],"applied":[145],"learning":[147],"in":[148],"environments":[149],"featuring":[150],"complex":[151],"3D":[152],"input":[154],"abstract":[157],"structure":[159],"itself":[160],"still":[162],"fairly":[163],"simple.":[164]},"counts_by_year":[{"year":2020,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
