{"id":"https://openalex.org/W3190944559","doi":"https://doi.org/10.1109/cog52621.2021.9619004","title":"An Approach to Partial Observability in Games: Learning to Both Act and Observe","display_name":"An Approach to Partial Observability in Games: Learning to Both Act and Observe","publication_year":2021,"publication_date":"2021-08-17","ids":{"openalex":"https://openalex.org/W3190944559","doi":"https://doi.org/10.1109/cog52621.2021.9619004","mag":"3190944559"},"language":"en","primary_location":{"id":"doi:10.1109/cog52621.2021.9619004","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cog52621.2021.9619004","pdf_url":null,"source":{"id":"https://openalex.org/S4363608335","display_name":"2021 IEEE Conference on Games (CoG)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE Conference on Games (CoG)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5110069714","display_name":"Elizabeth Gilmour","orcid":null},"institutions":[{"id":"https://openalex.org/I1288214837","display_name":"United States Naval Research Laboratory","ror":"https://ror.org/04d23a975","country_code":"US","type":"facility","lineage":["https://openalex.org/I1288214837","https://openalex.org/I1330347796","https://openalex.org/I175003984","https://openalex.org/I3130687028"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Elizabeth Gilmour","raw_affiliation_strings":["Naval Center for Applied Research in A.I. U.S. Naval Research Laboratory,Washington D.C.,U.S.A","Naval Center for Applied Research in A.I. U.S. Naval Research Laboratory, Washington D.C., U.S.A"],"affiliations":[{"raw_affiliation_string":"Naval Center for Applied Research in A.I. U.S. Naval Research Laboratory,Washington D.C.,U.S.A","institution_ids":["https://openalex.org/I1288214837"]},{"raw_affiliation_string":"Naval Center for Applied Research in A.I. U.S. Naval Research Laboratory, Washington D.C., U.S.A","institution_ids":["https://openalex.org/I1288214837"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064644874","display_name":"Noah Plotkin","orcid":null},"institutions":[{"id":"https://openalex.org/I70571728","display_name":"Oberlin College","ror":"https://ror.org/05ac26z88","country_code":"US","type":"education","lineage":["https://openalex.org/I70571728"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Noah Plotkin","raw_affiliation_strings":["Oberlin College,Oberlin,OH,U.S.A","Oberlin College, Oberlin, OH, U.S.A"],"affiliations":[{"raw_affiliation_string":"Oberlin College,Oberlin,OH,U.S.A","institution_ids":["https://openalex.org/I70571728"]},{"raw_affiliation_string":"Oberlin College, Oberlin, OH, U.S.A","institution_ids":["https://openalex.org/I70571728"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5102486693","display_name":"Leslie N. Smith","orcid":"https://orcid.org/0000-0002-1930-1650"},"institutions":[{"id":"https://openalex.org/I1288214837","display_name":"United States Naval Research Laboratory","ror":"https://ror.org/04d23a975","country_code":"US","type":"facility","lineage":["https://openalex.org/I1288214837","https://openalex.org/I1330347796","https://openalex.org/I175003984","https://openalex.org/I3130687028"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Leslie N. Smith","raw_affiliation_strings":["Naval Center for Applied Research in A.I. U.S. Naval Research Laboratory,Washington D.C.,U.S.A","Naval Center for Applied Research in A.I. U.S. Naval Research Laboratory, Washington D.C., U.S.A"],"affiliations":[{"raw_affiliation_string":"Naval Center for Applied Research in A.I. U.S. Naval Research Laboratory,Washington D.C.,U.S.A","institution_ids":["https://openalex.org/I1288214837"]},{"raw_affiliation_string":"Naval Center for Applied Research in A.I. U.S. Naval Research Laboratory, Washington D.C., U.S.A","institution_ids":["https://openalex.org/I1288214837"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5110069714"],"corresponding_institution_ids":["https://openalex.org/I1288214837"],"apc_list":null,"apc_paid":null,"fwci":0.2513,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.48485698,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"01","last_page":"05"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11574","display_name":"Artificial Intelligence in Games","score":0.9939000010490417,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.9717000126838684,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8240873217582703},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7533321380615234},{"id":"https://openalex.org/keywords/observability","display_name":"Observability","score":0.6575916409492493},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.4718114137649536},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4427908658981323},{"id":"https://openalex.org/keywords/simple","display_name":"Simple (philosophy)","score":0.43749678134918213},{"id":"https://openalex.org/keywords/order","display_name":"Order (exchange)","score":0.42173975706100464},{"id":"https://openalex.org/keywords/architecture","display_name":"Architecture","score":0.4214051067829132},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.41166555881500244}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8240873217582703},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7533321380615234},{"id":"https://openalex.org/C36299963","wikidata":"https://www.wikidata.org/wiki/Q1369844","display_name":"Observability","level":2,"score":0.6575916409492493},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.4718114137649536},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4427908658981323},{"id":"https://openalex.org/C2780586882","wikidata":"https://www.wikidata.org/wiki/Q7520643","display_name":"Simple (philosophy)","level":2,"score":0.43749678134918213},{"id":"https://openalex.org/C182306322","wikidata":"https://www.wikidata.org/wiki/Q1779371","display_name":"Order (exchange)","level":2,"score":0.42173975706100464},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.4214051067829132},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.41166555881500244},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C10138342","wikidata":"https://www.wikidata.org/wiki/Q43015","display_name":"Finance","level":1,"score":0.0},{"id":"https://openalex.org/C28826006","wikidata":"https://www.wikidata.org/wiki/Q33521","display_name":"Applied mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0},{"id":"https://openalex.org/C153349607","wikidata":"https://www.wikidata.org/wiki/Q36649","display_name":"Visual arts","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cog52621.2021.9619004","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cog52621.2021.9619004","pdf_url":null,"source":{"id":"https://openalex.org/S4363608335","display_name":"2021 IEEE Conference on Games (CoG)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE Conference on Games (CoG)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","score":0.4699999988079071,"display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":40,"referenced_works":["https://openalex.org/W1757796397","https://openalex.org/W2145339207","https://openalex.org/W2147527908","https://openalex.org/W2564920024","https://openalex.org/W2749807327","https://openalex.org/W2769883686","https://openalex.org/W2777032727","https://openalex.org/W2948609886","https://openalex.org/W2951527505","https://openalex.org/W2962832483","https://openalex.org/W2982316857","https://openalex.org/W2996726407","https://openalex.org/W3006702859","https://openalex.org/W3012502279","https://openalex.org/W3012544020","https://openalex.org/W3012550998","https://openalex.org/W3013618273","https://openalex.org/W3034956653","https://openalex.org/W3036185205","https://openalex.org/W3085438811","https://openalex.org/W3101438731","https://openalex.org/W3119997354","https://openalex.org/W3125947392","https://openalex.org/W3132159782","https://openalex.org/W4206706211","https://openalex.org/W4287324772","https://openalex.org/W4295720520","https://openalex.org/W4298857966","https://openalex.org/W6637967152","https://openalex.org/W6682137061","https://openalex.org/W6731192180","https://openalex.org/W6743756900","https://openalex.org/W6763704883","https://openalex.org/W6771787661","https://openalex.org/W6773667692","https://openalex.org/W6775522024","https://openalex.org/W6775683342","https://openalex.org/W6779827379","https://openalex.org/W6788556936","https://openalex.org/W6791217551"],"related_works":["https://openalex.org/W2046459260","https://openalex.org/W2765830098","https://openalex.org/W2967463586","https://openalex.org/W1971989957","https://openalex.org/W2517338020","https://openalex.org/W3157641275","https://openalex.org/W4312300846","https://openalex.org/W4206221578","https://openalex.org/W3029572990","https://openalex.org/W2615757685"],"abstract_inverted_index":{"Reinforcement":[0],"learning":[1,6],"(RL)":[2],"is":[3,14,35],"successful":[4],"at":[5,67],"to":[7,52,56,65,83,105,110,114,118,124,131,147,150,155,169,177],"play":[8,119,178],"games":[9,23,42,104],"where":[10,31,51,82,113,126,149],"the":[11,32,68,78,100,107,120,127,145,158,164,166,173,179],"entire":[12,33],"environment":[13,34,101],"visible.":[15,37],"However,":[16],"RL":[17,108,128,174],"approaches":[18],"are":[19],"challenged":[20],"in":[21,28,63,85,102,122,157],"complex":[22,41],"like":[24],"Starcraft":[25],"II":[26],"and":[27,54,116,141,152],"real-world":[29],"environments":[30],"not":[36],"In":[38,133],"these":[39],"more":[40,44],"with":[43,73,87],"limited":[45,60,89],"visual":[46,61,90],"information,":[47],"agents":[48],"must":[49],"choose":[50,148],"look":[53,84,115,151],"how":[55,117,172],"optimally":[57],"use":[58],"their":[59],"information":[62],"order":[64,123],"succeed":[66],"game.":[69,160,180],"We":[70,92],"verify":[71],"that":[72],"a":[74,88,94,137],"relatively":[75],"simple":[76],"model":[77],"agent":[79,109,129,146,167,175],"can":[80],"learn":[81,111],"scenarios":[86],"bandwidth.":[91],"develop":[93,136],"method":[95,142],"for":[96,143],"masking":[97],"part":[98],"of":[99],"Atari":[103],"force":[106],"both":[112],"game":[121],"study":[125],"learns":[130,168,176],"look.":[132],"addition,":[134],"we":[135,162],"neural":[138],"network":[139],"architecture":[140],"allowing":[144],"what":[153],"action":[154],"take":[156],"Pong":[159],"Further,":[161],"analyze":[163],"strategies":[165],"better":[170],"understand":[171]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
