{"id":"https://openalex.org/W1983060704","doi":"https://doi.org/10.1109/itw.2010.5593329","title":"Modular Reinforcement Learning architectures for artificially intelligent agents in complex game environments","display_name":"Modular Reinforcement Learning architectures for artificially intelligent agents in complex game environments","publication_year":2010,"publication_date":"2010-08-01","ids":{"openalex":"https://openalex.org/W1983060704","doi":"https://doi.org/10.1109/itw.2010.5593329","mag":"1983060704"},"language":"en","primary_location":{"id":"doi:10.1109/itw.2010.5593329","is_oa":false,"landing_page_url":"https://doi.org/10.1109/itw.2010.5593329","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2010 IEEE Conference on Computational Intelligence and Games","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5050200143","display_name":"Christopher J. Hanna","orcid":null},"institutions":[{"id":"https://openalex.org/I138801177","display_name":"University of Ulster","ror":"https://ror.org/01yp9g959","country_code":"GB","type":"education","lineage":["https://openalex.org/I138801177"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Christopher J. Hanna","raw_affiliation_strings":["Computing and Information Engineering, University of Ulster, Londonderry, UK","School of Computing and Information engineering, University of Ulster, Coleraine campus, Co. Londonderry, Northern Ireland, BT52 1SA, UK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Computing and Information Engineering, University of Ulster, Londonderry, UK","institution_ids":["https://openalex.org/I138801177"]},{"raw_affiliation_string":"School of Computing and Information engineering, University of Ulster, Coleraine campus, Co. Londonderry, Northern Ireland, BT52 1SA, UK","institution_ids":["https://openalex.org/I138801177"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112832072","display_name":"Raymond J. Hickey","orcid":null},"institutions":[{"id":"https://openalex.org/I138801177","display_name":"University of Ulster","ror":"https://ror.org/01yp9g959","country_code":"GB","type":"education","lineage":["https://openalex.org/I138801177"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Raymond J. Hickey","raw_affiliation_strings":["Computing and Information Engineering, University of Ulster, Londonderry, UK","School of Computing and Information engineering, University of Ulster, Coleraine campus, Co. Londonderry, Northern Ireland, BT52 1SA, UK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Computing and Information Engineering, University of Ulster, Londonderry, UK","institution_ids":["https://openalex.org/I138801177"]},{"raw_affiliation_string":"School of Computing and Information engineering, University of Ulster, Coleraine campus, Co. Londonderry, Northern Ireland, BT52 1SA, UK","institution_ids":["https://openalex.org/I138801177"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053724421","display_name":"Darryl Charles","orcid":"https://orcid.org/0000-0002-8546-6066"},"institutions":[{"id":"https://openalex.org/I138801177","display_name":"University of Ulster","ror":"https://ror.org/01yp9g959","country_code":"GB","type":"education","lineage":["https://openalex.org/I138801177"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Darryl K. Charles","raw_affiliation_strings":["Computing and Information Engineering, University of Ulster, Londonderry, UK","School of Computing and Information engineering, University of Ulster, Coleraine campus, Co. Londonderry, Northern Ireland, BT52 1SA, UK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Computing and Information Engineering, University of Ulster, Londonderry, UK","institution_ids":["https://openalex.org/I138801177"]},{"raw_affiliation_string":"School of Computing and Information engineering, University of Ulster, Coleraine campus, Co. Londonderry, Northern Ireland, BT52 1SA, UK","institution_ids":["https://openalex.org/I138801177"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5077309331","display_name":"Michaela Black","orcid":"https://orcid.org/0000-0002-5140-2566"},"institutions":[{"id":"https://openalex.org/I138801177","display_name":"University of Ulster","ror":"https://ror.org/01yp9g959","country_code":"GB","type":"education","lineage":["https://openalex.org/I138801177"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Michaela M. Black","raw_affiliation_strings":["Computing and Information Engineering, University of Ulster, Londonderry, UK","School of Computing and Information engineering, University of Ulster, Coleraine campus, Co. Londonderry, Northern Ireland, BT52 1SA, UK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Computing and Information Engineering, University of Ulster, Londonderry, UK","institution_ids":["https://openalex.org/I138801177"]},{"raw_affiliation_string":"School of Computing and Information engineering, University of Ulster, Coleraine campus, Co. Londonderry, Northern Ireland, BT52 1SA, UK","institution_ids":["https://openalex.org/I138801177"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.3984,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.84165129,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":"10","issue":null,"first_page":"380","last_page":"387"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11574","display_name":"Artificial Intelligence in Games","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11574","display_name":"Artificial Intelligence in Games","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9936000108718872,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11975","display_name":"Evolutionary Algorithms and Applications","score":0.9926999807357788,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.9155516624450684},{"id":"https://openalex.org/keywords/modular-design","display_name":"Modular design","score":0.8067253232002258},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7457717657089233},{"id":"https://openalex.org/keywords/granularity","display_name":"Granularity","score":0.6947603225708008},{"id":"https://openalex.org/keywords/curse-of-dimensionality","display_name":"Curse of dimensionality","score":0.6292694807052612},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5085071325302124},{"id":"https://openalex.org/keywords/action-selection","display_name":"Action selection","score":0.47787418961524963},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.46215111017227173},{"id":"https://openalex.org/keywords/dimensionality-reduction","display_name":"Dimensionality reduction","score":0.4614506959915161},{"id":"https://openalex.org/keywords/state-space","display_name":"State space","score":0.45927128195762634},{"id":"https://openalex.org/keywords/state","display_name":"State (computer science)","score":0.4279051423072815},{"id":"https://openalex.org/keywords/architecture","display_name":"Architecture","score":0.42399945855140686},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3296704888343811},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.3212258219718933}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.9155516624450684},{"id":"https://openalex.org/C101468663","wikidata":"https://www.wikidata.org/wiki/Q1620158","display_name":"Modular design","level":2,"score":0.8067253232002258},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7457717657089233},{"id":"https://openalex.org/C177774035","wikidata":"https://www.wikidata.org/wiki/Q1246948","display_name":"Granularity","level":2,"score":0.6947603225708008},{"id":"https://openalex.org/C111030470","wikidata":"https://www.wikidata.org/wiki/Q1430460","display_name":"Curse of dimensionality","level":2,"score":0.6292694807052612},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5085071325302124},{"id":"https://openalex.org/C166109690","wikidata":"https://www.wikidata.org/wiki/Q4677422","display_name":"Action selection","level":3,"score":0.47787418961524963},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.46215111017227173},{"id":"https://openalex.org/C70518039","wikidata":"https://www.wikidata.org/wiki/Q16000077","display_name":"Dimensionality reduction","level":2,"score":0.4614506959915161},{"id":"https://openalex.org/C72434380","wikidata":"https://www.wikidata.org/wiki/Q230930","display_name":"State space","level":2,"score":0.45927128195762634},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.4279051423072815},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.42399945855140686},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3296704888343811},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.3212258219718933},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.0},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C153349607","wikidata":"https://www.wikidata.org/wiki/Q36649","display_name":"Visual arts","level":1,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/itw.2010.5593329","is_oa":false,"landing_page_url":"https://doi.org/10.1109/itw.2010.5593329","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2010 IEEE Conference on Computational Intelligence and Games","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.173.6129","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.173.6129","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://game.itu.dk/cig2010/proceedings/papers/cig10_047_094.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":22,"referenced_works":["https://openalex.org/W1480676279","https://openalex.org/W1488730473","https://openalex.org/W1979685636","https://openalex.org/W2003386389","https://openalex.org/W2013815893","https://openalex.org/W2023837733","https://openalex.org/W2100094927","https://openalex.org/W2121863487","https://openalex.org/W2124175081","https://openalex.org/W2135939192","https://openalex.org/W2160371091","https://openalex.org/W2215343611","https://openalex.org/W3011120880","https://openalex.org/W3139377883","https://openalex.org/W4214717370","https://openalex.org/W4230531009","https://openalex.org/W6629152578","https://openalex.org/W6675136414","https://openalex.org/W6678114464","https://openalex.org/W6683821272","https://openalex.org/W6689185299","https://openalex.org/W6775686901"],"related_works":["https://openalex.org/W1995622179","https://openalex.org/W1484111231","https://openalex.org/W1552543208","https://openalex.org/W2074396517","https://openalex.org/W2166963679","https://openalex.org/W2187269125","https://openalex.org/W1641615907","https://openalex.org/W3089231081","https://openalex.org/W2093956241","https://openalex.org/W2354420595"],"abstract_inverted_index":{"Recently":[0],"there":[1],"has":[2,22],"been":[3,23],"much":[4],"research":[5],"focus":[6],"on":[7],"the":[8,35,81,89],"use":[9],"of":[10,30,38,72,80],"Reinforcement":[11],"Learning":[12],"(RL)":[13],"algorithms":[14],"for":[15],"game":[16],"agent":[17,39],"control.":[18],"However,":[19],"although":[20],"it":[21],"shown":[24],"that":[25],"such":[26],"agents":[27],"are":[28],"capable":[29],"learning":[31],"in":[32,83,103],"real":[33],"time,":[34],"high":[36],"dimensionality":[37,82],"sensor":[40],"state":[41,90],"spaces":[42],"still":[43],"prove":[44],"to":[45,50,57,119],"be":[46],"a":[47,64,69,78],"significant":[48],"barrier":[49],"progress.":[51],"This":[52,115],"paper":[53,116],"outlines":[54],"an":[55],"approach":[56,76,100],"dealing":[58],"with":[59,68,107],"this":[60,99],"issue":[61],"by":[62,87],"using":[63],"modular":[65,75],"RL":[66],"architecture":[67],"fine":[70],"granularity":[71],"modules.":[73],"The":[74],"enables":[77],"reduction":[79],"complex":[84],"game-like":[85],"environments":[86],"dividing":[88],"space":[91],"into":[92],"smaller,":[93],"more":[94],"manageable":[95],"sub":[96],"tasks.":[97],"While":[98],"is":[101],"successful":[102],"reducing":[104],"dimensionality,":[105],"challenges":[106],"action":[108],"selection,":[109],"exploration":[110],"and":[111],"reward":[112],"allocation":[113],"arise.":[114],"discusses":[117],"approaches":[118],"overcoming":[120],"these":[121],"issues.":[122]},"counts_by_year":[{"year":2021,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2014,"cited_by_count":1},{"year":2013,"cited_by_count":1},{"year":2012,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
