{"id":"https://openalex.org/W3156543906","doi":"https://doi.org/10.1109/cog52621.2021.9619093","title":"Generalising Discrete Action Spaces with Conditional Action Trees","display_name":"Generalising Discrete Action Spaces with Conditional Action Trees","publication_year":2021,"publication_date":"2021-08-17","ids":{"openalex":"https://openalex.org/W3156543906","doi":"https://doi.org/10.1109/cog52621.2021.9619093","mag":"3156543906"},"language":"en","primary_location":{"id":"doi:10.1109/cog52621.2021.9619093","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cog52621.2021.9619093","pdf_url":null,"source":{"id":"https://openalex.org/S4363608335","display_name":"2021 IEEE Conference on Games (CoG)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE Conference on Games (CoG)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5001097029","display_name":"Christopher Bamford","orcid":null},"institutions":[{"id":"https://openalex.org/I166337079","display_name":"Queen Mary University of London","ror":"https://ror.org/026zzn846","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I166337079"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Christopher Bamford","raw_affiliation_strings":["Game AI Group, Queen Mary University of London, London, UK"],"affiliations":[{"raw_affiliation_string":"Game AI Group, Queen Mary University of London, London, UK","institution_ids":["https://openalex.org/I166337079"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5110927683","display_name":"Alvaro Ovalle","orcid":null},"institutions":[{"id":"https://openalex.org/I166337079","display_name":"Queen Mary University of London","ror":"https://ror.org/026zzn846","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I166337079"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Alvaro Ovalle","raw_affiliation_strings":["Game AI Group, Queen Mary University of London, London, UK"],"affiliations":[{"raw_affiliation_string":"Game AI Group, Queen Mary University of London, London, UK","institution_ids":["https://openalex.org/I166337079"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5001097029"],"corresponding_institution_ids":["https://openalex.org/I166337079"],"apc_list":null,"apc_paid":null,"fwci":0.754,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.73284726,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11574","display_name":"Artificial Intelligence in Games","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11975","display_name":"Evolutionary Algorithms and Applications","score":0.9937999844551086,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.7964501976966858},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6334642767906189},{"id":"https://openalex.org/keywords/space","display_name":"Space (punctuation)","score":0.615104079246521},{"id":"https://openalex.org/keywords/structuring","display_name":"Structuring","score":0.5731866359710693},{"id":"https://openalex.org/keywords/tree","display_name":"Tree (set theory)","score":0.5313157439231873},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4984555244445801},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.4635241627693176},{"id":"https://openalex.org/keywords/scheme","display_name":"Scheme (mathematics)","score":0.46152395009994507},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.40888792276382446},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3319655954837799},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.3265167474746704},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.11050701141357422}],"concepts":[{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.7964501976966858},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6334642767906189},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.615104079246521},{"id":"https://openalex.org/C2775945657","wikidata":"https://www.wikidata.org/wiki/Q381442","display_name":"Structuring","level":2,"score":0.5731866359710693},{"id":"https://openalex.org/C113174947","wikidata":"https://www.wikidata.org/wiki/Q2859736","display_name":"Tree (set theory)","level":2,"score":0.5313157439231873},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4984555244445801},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.4635241627693176},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.46152395009994507},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.40888792276382446},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3319655954837799},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.3265167474746704},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.11050701141357422},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C10138342","wikidata":"https://www.wikidata.org/wiki/Q43015","display_name":"Finance","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cog52621.2021.9619093","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cog52621.2021.9619093","pdf_url":null,"source":{"id":"https://openalex.org/S4363608335","display_name":"2021 IEEE Conference on Games (CoG)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE Conference on Games (CoG)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16","score":0.8100000023841858}],"awards":[],"funders":[{"id":"https://openalex.org/F4320311061","display_name":"Queen Mary University of London","ror":"https://ror.org/026zzn846"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":40,"referenced_works":["https://openalex.org/W2098774185","https://openalex.org/W2150823748","https://openalex.org/W2256420211","https://openalex.org/W2594103415","https://openalex.org/W2749807327","https://openalex.org/W2786036274","https://openalex.org/W2890208098","https://openalex.org/W2896873963","https://openalex.org/W2949561945","https://openalex.org/W2951984055","https://openalex.org/W2963312729","https://openalex.org/W2964043796","https://openalex.org/W2965757358","https://openalex.org/W2966219705","https://openalex.org/W2976771233","https://openalex.org/W2982316857","https://openalex.org/W2987288550","https://openalex.org/W2996037775","https://openalex.org/W2996681978","https://openalex.org/W3000752281","https://openalex.org/W3014728935","https://openalex.org/W3037164854","https://openalex.org/W3088749011","https://openalex.org/W3094236223","https://openalex.org/W3103223352","https://openalex.org/W3130564053","https://openalex.org/W4288594419","https://openalex.org/W4297797010","https://openalex.org/W4312309732","https://openalex.org/W6674884181","https://openalex.org/W6692312642","https://openalex.org/W6692846177","https://openalex.org/W6734517396","https://openalex.org/W6743756900","https://openalex.org/W6748638692","https://openalex.org/W6758846586","https://openalex.org/W6760375386","https://openalex.org/W6769975600","https://openalex.org/W6775892990","https://openalex.org/W6779990354"],"related_works":["https://openalex.org/W4394443292","https://openalex.org/W4251394462","https://openalex.org/W1580673008","https://openalex.org/W1510936208","https://openalex.org/W2486167009","https://openalex.org/W1595575899","https://openalex.org/W756498608","https://openalex.org/W2135201366","https://openalex.org/W4285395220","https://openalex.org/W2493576743"],"abstract_inverted_index":{"There":[0],"are":[1],"relatively":[2],"few":[3],"conventions":[4],"followed":[5],"in":[6,61,119],"reinforcement":[7],"learning":[8],"(RL)":[9],"environments":[10,104],"to":[11,24,36,38,63,72,76,110],"structure":[12],"the":[13,19,79],"action":[14,28,59,67,80,108,115],"spaces.":[15],"As":[16],"a":[17,55,74,89],"consequence":[18],"application":[20],"of":[21,57],"RL":[22,62],"algorithms":[23],"tasks":[25],"with":[26,30,49,105,112],"large":[27,113],"spaces":[29,60,109,116],"multiple":[31,86],"components":[32],"require":[33],"additional":[34],"effort":[35],"adjust":[37],"different":[39],"formats.":[40],"In":[41],"this":[42],"paper":[43],"we":[44],"introduce":[45],"Conditional":[46],"Action":[47],"Trees":[48],"two":[50],"main":[51],"objectives:":[52],"(1)":[53],"as":[54],"method":[56],"structuring":[58],"generalise":[64],"across":[65],"several":[66,96],"space":[68,81],"specifications,":[69],"and":[70],"(2)":[71],"formalise":[73],"process":[75],"significantly":[77],"reduce":[78],"by":[82],"decomposing":[83],"it":[84],"into":[85],"sub-spaces,":[87],"favoring":[88],"multi-staged":[90],"decision":[91],"making":[92],"approach.":[93],"We":[94],"show":[95],"proof-of-concept":[97],"experiments":[98],"validating":[99],"our":[100],"scheme,":[101],"ranging":[102],"from":[103],"basic":[106],"discrete":[107],"those":[111],"combinatorial":[114],"commonly":[117],"found":[118],"Real":[120],"Time":[121],"Strategy":[122],"(RTS)":[123],"style":[124],"games.":[125]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
