{"id":"https://openalex.org/W2920937724","doi":"https://doi.org/10.24963/ijcai.2019/50","title":"Compact Representation of Value Function in Partially Observable Stochastic Games","display_name":"Compact Representation of Value Function in Partially Observable Stochastic Games","publication_year":2019,"publication_date":"2019-07-28","ids":{"openalex":"https://openalex.org/W2920937724","doi":"https://doi.org/10.24963/ijcai.2019/50","mag":"2920937724"},"language":"en","primary_location":{"id":"doi:10.24963/ijcai.2019/50","is_oa":true,"landing_page_url":"https://doi.org/10.24963/ijcai.2019/50","pdf_url":"https://www.ijcai.org/proceedings/2019/0050.pdf","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Twenty-Eighth International Joint Conference on Artificial Intelligence","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.ijcai.org/proceedings/2019/0050.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103017905","display_name":"Karel Hor\u00e1k","orcid":"https://orcid.org/0000-0003-0307-6281"},"institutions":[{"id":"https://openalex.org/I44504214","display_name":"Czech Technical University in Prague","ror":"https://ror.org/03kqpb082","country_code":"CZ","type":"education","lineage":["https://openalex.org/I44504214"]}],"countries":["CZ"],"is_corresponding":true,"raw_author_name":"Karel Hor\u00e1k","raw_affiliation_strings":["Czech Technical University in Prague, FEE, Department of Computer Science"],"affiliations":[{"raw_affiliation_string":"Czech Technical University in Prague, FEE, Department of Computer Science","institution_ids":["https://openalex.org/I44504214"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052350897","display_name":"Branislav Bo\u0161ansk\u00fd","orcid":"https://orcid.org/0000-0002-3841-9515"},"institutions":[{"id":"https://openalex.org/I44504214","display_name":"Czech Technical University in Prague","ror":"https://ror.org/03kqpb082","country_code":"CZ","type":"education","lineage":["https://openalex.org/I44504214"]}],"countries":["CZ"],"is_corresponding":false,"raw_author_name":"Branislav Bo\u0161ansk\u00fd","raw_affiliation_strings":["Czech Technical University in Prague, FEE, Department of Computer Science"],"affiliations":[{"raw_affiliation_string":"Czech Technical University in Prague, FEE, Department of Computer Science","institution_ids":["https://openalex.org/I44504214"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020091080","display_name":"Christopher Kiekintveld","orcid":"https://orcid.org/0000-0003-0615-9584"},"institutions":[{"id":"https://openalex.org/I164936912","display_name":"The University of Texas at El Paso","ror":"https://ror.org/04d5vba33","country_code":"US","type":"education","lineage":["https://openalex.org/I164936912"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Christopher Kiekintveld","raw_affiliation_strings":["The University of Texas at El Paso, Computer Science Department"],"affiliations":[{"raw_affiliation_string":"The University of Texas at El Paso, Computer Science Department","institution_ids":["https://openalex.org/I164936912"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5090126029","display_name":"Charles Kamhoua","orcid":"https://orcid.org/0000-0003-2169-5975"},"institutions":[{"id":"https://openalex.org/I166416128","display_name":"DEVCOM Army Research Laboratory","ror":"https://ror.org/011hc8f90","country_code":"US","type":"government","lineage":["https://openalex.org/I1304082316","https://openalex.org/I1330347796","https://openalex.org/I166416128","https://openalex.org/I2802705668","https://openalex.org/I4210154437"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Charles Kamhoua","raw_affiliation_strings":["Army Research Laboratory, Network Security Branch"],"affiliations":[{"raw_affiliation_string":"Army Research Laboratory, Network Security Branch","institution_ids":["https://openalex.org/I166416128"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5103017905"],"corresponding_institution_ids":["https://openalex.org/I44504214"],"apc_list":null,"apc_paid":null,"fwci":0.289,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.64825472,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"350","last_page":"356"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9921000003814697,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9921000003814697,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11303","display_name":"Bayesian Modeling and Causal Inference","score":0.9912999868392944,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11031","display_name":"Game Theory and Applications","score":0.9860000014305115,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/observability","display_name":"Observability","score":0.8864961862564087},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.6842374205589294},{"id":"https://openalex.org/keywords/observable","display_name":"Observable","score":0.6725753545761108},{"id":"https://openalex.org/keywords/curse-of-dimensionality","display_name":"Curse of dimensionality","score":0.6390128135681152},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6166980266571045},{"id":"https://openalex.org/keywords/bellman-equation","display_name":"Bellman equation","score":0.5588765144348145},{"id":"https://openalex.org/keywords/dimension","display_name":"Dimension (graph theory)","score":0.5309640169143677},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.4825672209262848},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.4690096080303192},{"id":"https://openalex.org/keywords/state","display_name":"State (computer science)","score":0.4647974371910095},{"id":"https://openalex.org/keywords/state-space","display_name":"State space","score":0.4360954761505127},{"id":"https://openalex.org/keywords/stochastic-game","display_name":"Stochastic game","score":0.4268966317176819},{"id":"https://openalex.org/keywords/abstraction","display_name":"Abstraction","score":0.41229212284088135},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.3838510513305664},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.37560784816741943},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3155477046966553},{"id":"https://openalex.org/keywords/applied-mathematics","display_name":"Applied mathematics","score":0.3037281632423401},{"id":"https://openalex.org/keywords/mathematical-economics","display_name":"Mathematical economics","score":0.21020177006721497},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.19185248017311096}],"concepts":[{"id":"https://openalex.org/C36299963","wikidata":"https://www.wikidata.org/wiki/Q1369844","display_name":"Observability","level":2,"score":0.8864961862564087},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.6842374205589294},{"id":"https://openalex.org/C32848918","wikidata":"https://www.wikidata.org/wiki/Q845789","display_name":"Observable","level":2,"score":0.6725753545761108},{"id":"https://openalex.org/C111030470","wikidata":"https://www.wikidata.org/wiki/Q1430460","display_name":"Curse of dimensionality","level":2,"score":0.6390128135681152},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6166980266571045},{"id":"https://openalex.org/C14646407","wikidata":"https://www.wikidata.org/wiki/Q1430750","display_name":"Bellman equation","level":2,"score":0.5588765144348145},{"id":"https://openalex.org/C33676613","wikidata":"https://www.wikidata.org/wiki/Q13415176","display_name":"Dimension (graph theory)","level":2,"score":0.5309640169143677},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4825672209262848},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.4690096080303192},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.4647974371910095},{"id":"https://openalex.org/C72434380","wikidata":"https://www.wikidata.org/wiki/Q230930","display_name":"State space","level":2,"score":0.4360954761505127},{"id":"https://openalex.org/C22171661","wikidata":"https://www.wikidata.org/wiki/Q1074380","display_name":"Stochastic game","level":2,"score":0.4268966317176819},{"id":"https://openalex.org/C124304363","wikidata":"https://www.wikidata.org/wiki/Q673661","display_name":"Abstraction","level":2,"score":0.41229212284088135},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.3838510513305664},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.37560784816741943},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3155477046966553},{"id":"https://openalex.org/C28826006","wikidata":"https://www.wikidata.org/wiki/Q33521","display_name":"Applied mathematics","level":1,"score":0.3037281632423401},{"id":"https://openalex.org/C144237770","wikidata":"https://www.wikidata.org/wiki/Q747534","display_name":"Mathematical economics","level":1,"score":0.21020177006721497},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.19185248017311096},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.24963/ijcai.2019/50","is_oa":true,"landing_page_url":"https://doi.org/10.24963/ijcai.2019/50","pdf_url":"https://www.ijcai.org/proceedings/2019/0050.pdf","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Twenty-Eighth International Joint Conference on Artificial Intelligence","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:1903.05511","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1903.05511","pdf_url":"https://arxiv.org/pdf/1903.05511","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"mag:2920937724","is_oa":true,"landing_page_url":"https://arxiv.org/pdf/1903.05511v1","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},{"id":"doi:10.48550/arxiv.1903.05511","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.1903.05511","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.24963/ijcai.2019/50","is_oa":true,"landing_page_url":"https://doi.org/10.24963/ijcai.2019/50","pdf_url":"https://www.ijcai.org/proceedings/2019/0050.pdf","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Twenty-Eighth International Joint Conference on Artificial Intelligence","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2043895709","display_name":null,"funder_award_id":"W911NF-13-2-0045","funder_id":"https://openalex.org/F4320338295","funder_display_name":"Army Research Laboratory"},{"id":"https://openalex.org/G2933859987","display_name":null,"funder_award_id":"19-24384Y","funder_id":"https://openalex.org/F4320321006","funder_display_name":"Grantov\u00e1 Agentura \u010cesk\u00e9 Republiky"},{"id":"https://openalex.org/G3732666562","display_name":null,"funder_award_id":"W911NF-13","funder_id":"https://openalex.org/F4320338295","funder_display_name":"Army Research Laboratory"},{"id":"https://openalex.org/G4307486606","display_name":null,"funder_award_id":"W911NF-13-2-0045 (ARL Cyber Security CRA)","funder_id":"https://openalex.org/F4320338295","funder_display_name":"Army Research Laboratory"},{"id":"https://openalex.org/G5259331294","display_name":null,"funder_award_id":"W911NF","funder_id":"https://openalex.org/F4320338295","funder_display_name":"Army Research Laboratory"},{"id":"https://openalex.org/G8763038417","display_name":null,"funder_award_id":"Cooperative Agreement Number W911NF-13-2-0045","funder_id":"https://openalex.org/F4320338295","funder_display_name":"Army Research Laboratory"}],"funders":[{"id":"https://openalex.org/F4320321006","display_name":"Grantov\u00e1 Agentura \u010cesk\u00e9 Republiky","ror":"https://ror.org/01pv73b02"},{"id":"https://openalex.org/F4320338295","display_name":"Army Research Laboratory","ror":"https://ror.org/011hc8f90"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2920937724.pdf","grobid_xml":"https://content.openalex.org/works/W2920937724.grobid-xml"},"referenced_works_count":19,"referenced_works":["https://openalex.org/W40650588","https://openalex.org/W48497080","https://openalex.org/W167683769","https://openalex.org/W568984285","https://openalex.org/W2115965563","https://openalex.org/W2116753650","https://openalex.org/W2134802714","https://openalex.org/W2156950870","https://openalex.org/W2160558706","https://openalex.org/W2292491317","https://openalex.org/W2295821324","https://openalex.org/W2525047520","https://openalex.org/W2528455759","https://openalex.org/W2570857898","https://openalex.org/W2604925955","https://openalex.org/W2735877174","https://openalex.org/W2764010900","https://openalex.org/W2808345529","https://openalex.org/W2904779604"],"related_works":["https://openalex.org/W3213761785","https://openalex.org/W2134991397","https://openalex.org/W2185777745","https://openalex.org/W2181316235","https://openalex.org/W2909951968","https://openalex.org/W2534118885","https://openalex.org/W2107654715","https://openalex.org/W2115058129","https://openalex.org/W4281796895","https://openalex.org/W3003646794","https://openalex.org/W3121168206","https://openalex.org/W2294226876","https://openalex.org/W2593052414","https://openalex.org/W2152706713","https://openalex.org/W190219697","https://openalex.org/W2146883452","https://openalex.org/W2963536720","https://openalex.org/W2133033455","https://openalex.org/W2809993672","https://openalex.org/W3102760497"],"abstract_inverted_index":{"Value":[0],"methods":[1],"for":[2,105],"solving":[3,106],"stochastic":[4,88,107],"games":[5,89,108],"with":[6,109],"partial":[7,110],"observability":[8],"model":[9],"the":[10,13,23,26,30,60,83,116,120,128,131],"uncertainty":[11,84],"of":[12,25,32,56,66,82,130],"players":[14],"as":[15],"a":[16,78,92],"probability":[17],"distribution":[18],"over":[19],"possible":[20],"states,":[21],"where":[22],"dimension":[24,69],"belief":[27],"space":[28],"is":[29,99],"number":[31],"states.":[33],"For":[34],"many":[35,41],"practical":[36],"problems,":[37],"there":[38],"are":[39,76],"exponentially":[40],"states":[42],"which":[43],"causes":[44],"scalability":[45,125],"problems.":[46],"We":[47],"propose":[48],"an":[49],"abstraction":[50],"technique":[51],"that":[52,98,115],"addresses":[53],"this":[54,96],"curse":[55],"dimensionality":[57],"by":[58],"projecting":[59],"high-dimensional":[61],"beliefs":[62],"onto":[63],"characteristic":[64],"vectors":[65],"significantly":[67],"lower":[68],"(e.g.,":[70],"marginal":[71],"probabilities).":[72],"Our":[73],"main":[74],"contributions":[75],"(1)":[77],"novel":[79,93],"compact":[80,121],"representation":[81,97,122],"in":[85],"partially":[86],"observable":[87],"and":[90],"(2)":[91],"algorithm":[94,118],"using":[95,119],"based":[100],"on":[101],"existing":[102],"state-of-the-art":[103],"algorithms":[104],"observability.":[111],"Experimental":[112],"evaluation":[113],"confirms":[114],"new":[117],"dramatically":[123],"increases":[124],"compared":[126],"to":[127],"state":[129],"art.":[132]},"counts_by_year":[{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":1}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
