{"id":"https://openalex.org/W2052959205","doi":"https://doi.org/10.1145/1160633.1160683","title":"Winning back the CUP for distributed POMDPs","display_name":"Winning back the CUP for distributed POMDPs","publication_year":2006,"publication_date":"2006-05-08","ids":{"openalex":"https://openalex.org/W2052959205","doi":"https://doi.org/10.1145/1160633.1160683","mag":"2052959205"},"language":"en","primary_location":{"id":"doi:10.1145/1160633.1160683","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1160633.1160683","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the fifth international joint conference on Autonomous agents and multiagent systems","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://ink.library.smu.edu.sg/cgi/viewcontent.cgi?article=1939&context=sis_research","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5089113099","display_name":"Pradeep Varakantham","orcid":"https://orcid.org/0000-0001-7342-5745"},"institutions":[{"id":"https://openalex.org/I1174212","display_name":"University of Southern California","ror":"https://ror.org/03taz7m60","country_code":"US","type":"education","lineage":["https://openalex.org/I1174212"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Pradeep Varakantham","raw_affiliation_strings":["University of Southern California, Los Angeles, CA","University of Southern California,,,Los Angeles,CA,"],"affiliations":[{"raw_affiliation_string":"University of Southern California, Los Angeles, CA","institution_ids":["https://openalex.org/I1174212"]},{"raw_affiliation_string":"University of Southern California,,,Los Angeles,CA,","institution_ids":["https://openalex.org/I1174212"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111597996","display_name":"Ranjit Nair","orcid":null},"institutions":[{"id":"https://openalex.org/I1174212","display_name":"University of Southern California","ror":"https://ror.org/03taz7m60","country_code":"US","type":"education","lineage":["https://openalex.org/I1174212"]},{"id":"https://openalex.org/I82514191","display_name":"Honeywell (United States)","ror":"https://ror.org/02t71h845","country_code":"US","type":"company","lineage":["https://openalex.org/I82514191"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ranjit Nair","raw_affiliation_strings":["University of Southern California, Los Angeles, CA and Automation and Control Solutions, Honeywell Laboratories, Minneapolis, MN"],"affiliations":[{"raw_affiliation_string":"University of Southern California, Los Angeles, CA and Automation and Control Solutions, Honeywell Laboratories, Minneapolis, MN","institution_ids":["https://openalex.org/I82514191","https://openalex.org/I1174212"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000327528","display_name":"Milind Tambe","orcid":"https://orcid.org/0000-0003-3296-3672"},"institutions":[{"id":"https://openalex.org/I1174212","display_name":"University of Southern California","ror":"https://ror.org/03taz7m60","country_code":"US","type":"education","lineage":["https://openalex.org/I1174212"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Milind Tambe","raw_affiliation_strings":["University of Southern California, Los Angeles, CA","University of Southern California,,,Los Angeles,CA,"],"affiliations":[{"raw_affiliation_string":"University of Southern California, Los Angeles, CA","institution_ids":["https://openalex.org/I1174212"]},{"raw_affiliation_string":"University of Southern California,,,Los Angeles,CA,","institution_ids":["https://openalex.org/I1174212"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5048575057","display_name":"Makoto Yokoo","orcid":"https://orcid.org/0000-0003-4929-396X"},"institutions":[{"id":"https://openalex.org/I135598925","display_name":"Kyushu University","ror":"https://ror.org/00p4k0j84","country_code":"JP","type":"education","lineage":["https://openalex.org/I135598925"]},{"id":"https://openalex.org/I1174212","display_name":"University of Southern California","ror":"https://ror.org/03taz7m60","country_code":"US","type":"education","lineage":["https://openalex.org/I1174212"]}],"countries":["JP","US"],"is_corresponding":false,"raw_author_name":"Makoto Yokoo","raw_affiliation_strings":["University of Southern California, Los Angeles, CA and Kyushu University, Fukuoka, Japan"],"affiliations":[{"raw_affiliation_string":"University of Southern California, Los Angeles, CA and Kyushu University, Fukuoka, Japan","institution_ids":["https://openalex.org/I1174212","https://openalex.org/I135598925"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5089113099"],"corresponding_institution_ids":["https://openalex.org/I1174212"],"apc_list":null,"apc_paid":null,"fwci":1.8751,"has_fulltext":false,"cited_by_count":8,"citation_normalized_percentile":{"value":0.87338821,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"289","last_page":"296"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12288","display_name":"Optimization and Search Problems","score":0.9937000274658203,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.9901999831199646,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/partially-observable-markov-decision-process","display_name":"Partially observable Markov decision process","score":0.8194047212600708},{"id":"https://openalex.org/keywords/heuristics","display_name":"Heuristics","score":0.8042424917221069},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7378613948822021},{"id":"https://openalex.org/keywords/solver","display_name":"Solver","score":0.6394267082214355},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.6339685320854187},{"id":"https://openalex.org/keywords/markov-decision-process","display_name":"Markov decision process","score":0.5398480296134949},{"id":"https://openalex.org/keywords/heuristic","display_name":"Heuristic","score":0.5164670944213867},{"id":"https://openalex.org/keywords/problem-solver","display_name":"Problem solver","score":0.47963887453079224},{"id":"https://openalex.org/keywords/point","display_name":"Point (geometry)","score":0.4542038142681122},{"id":"https://openalex.org/keywords/observable","display_name":"Observable","score":0.418795108795166},{"id":"https://openalex.org/keywords/markov-process","display_name":"Markov process","score":0.38270318508148193},{"id":"https://openalex.org/keywords/markov-chain","display_name":"Markov chain","score":0.33787423372268677},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.33103275299072266},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.21022570133209229},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.15549242496490479},{"id":"https://openalex.org/keywords/markov-model","display_name":"Markov model","score":0.1501140594482422}],"concepts":[{"id":"https://openalex.org/C17098449","wikidata":"https://www.wikidata.org/wiki/Q176814","display_name":"Partially observable Markov decision process","level":4,"score":0.8194047212600708},{"id":"https://openalex.org/C127705205","wikidata":"https://www.wikidata.org/wiki/Q5748245","display_name":"Heuristics","level":2,"score":0.8042424917221069},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7378613948822021},{"id":"https://openalex.org/C2778770139","wikidata":"https://www.wikidata.org/wiki/Q1966904","display_name":"Solver","level":2,"score":0.6394267082214355},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.6339685320854187},{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.5398480296134949},{"id":"https://openalex.org/C173801870","wikidata":"https://www.wikidata.org/wiki/Q201413","display_name":"Heuristic","level":2,"score":0.5164670944213867},{"id":"https://openalex.org/C3019612716","wikidata":"https://www.wikidata.org/wiki/Q730920","display_name":"Problem solver","level":2,"score":0.47963887453079224},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.4542038142681122},{"id":"https://openalex.org/C32848918","wikidata":"https://www.wikidata.org/wiki/Q845789","display_name":"Observable","level":2,"score":0.418795108795166},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.38270318508148193},{"id":"https://openalex.org/C98763669","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov chain","level":2,"score":0.33787423372268677},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.33103275299072266},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.21022570133209229},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.15549242496490479},{"id":"https://openalex.org/C163836022","wikidata":"https://www.wikidata.org/wiki/Q6771326","display_name":"Markov model","level":3,"score":0.1501140594482422},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/1160633.1160683","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1160633.1160683","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the fifth international joint conference on Autonomous agents and multiagent systems","raw_type":"proceedings-article"},{"id":"pmh:oai:ink.library.smu.edu.sg:sis_research-1939","is_oa":true,"landing_page_url":"https://ink.library.smu.edu.sg/cgi/viewcontent.cgi?article=1939&context=sis_research","pdf_url":null,"source":{"id":"https://openalex.org/S4377196871","display_name":"Institutional Knowledge (InK) - Institutional Knowledge at Singapore Management University (Singapore Management University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I79891267","host_organization_name":"Singapore Management University","host_organization_lineage":["https://openalex.org/I79891267"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://dx.doi.org/10.1145/1160633.1160683","raw_type":"Conference Proceeding Article"}],"best_oa_location":{"id":"pmh:oai:ink.library.smu.edu.sg:sis_research-1939","is_oa":true,"landing_page_url":"https://ink.library.smu.edu.sg/cgi/viewcontent.cgi?article=1939&context=sis_research","pdf_url":null,"source":{"id":"https://openalex.org/S4377196871","display_name":"Institutional Knowledge (InK) - Institutional Knowledge at Singapore Management University (Singapore Management University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I79891267","host_organization_name":"Singapore Management University","host_organization_lineage":["https://openalex.org/I79891267"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://dx.doi.org/10.1145/1160633.1160683","raw_type":"Conference Proceeding Article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions","score":0.75}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":21,"referenced_works":["https://openalex.org/W156814138","https://openalex.org/W1491973539","https://openalex.org/W1536258751","https://openalex.org/W1579579904","https://openalex.org/W1588304026","https://openalex.org/W1590759229","https://openalex.org/W1908253641","https://openalex.org/W1993412827","https://openalex.org/W1993428444","https://openalex.org/W2045460737","https://openalex.org/W2107133386","https://openalex.org/W2110158409","https://openalex.org/W2114245943","https://openalex.org/W2137647991","https://openalex.org/W2139806852","https://openalex.org/W2159142421","https://openalex.org/W2161966858","https://openalex.org/W2168359464","https://openalex.org/W3032770570","https://openalex.org/W6635285615","https://openalex.org/W6680970532"],"related_works":["https://openalex.org/W2999848267","https://openalex.org/W2096013579","https://openalex.org/W52153049","https://openalex.org/W1760611253","https://openalex.org/W1589140671","https://openalex.org/W1515117609","https://openalex.org/W4323315247","https://openalex.org/W131709709","https://openalex.org/W2294884454","https://openalex.org/W3169161914"],"abstract_inverted_index":{"Distributed":[0],"Partially":[1],"Observable":[2],"Markov":[3],"Decision":[4],"Problems":[5],"(Distributed":[6],"POMDPs)":[7],"are":[8,119,157],"evolving":[9],"as":[10],"a":[11,48,82,109,126],"popular":[12],"approach":[13],"for":[14,70,162],"modeling":[15],"multiagent":[16],"systems,":[17],"and":[18,145],"many":[19],"different":[20,127],"algorithms":[21,36],"have":[22,37],"been":[23,39],"proposed":[24],"to":[25,72,85],"obtain":[26],"locally":[27,115],"or":[28,42],"globally":[29],"optimal":[30,116],"policies.":[31,100],"Unfortunately,":[32],"most":[33],"of":[34,47,99,122,129,141,153],"these":[35,156],"either":[38],"explicitly":[40,73,86],"designed":[41],"experimentally":[43],"evaluated":[44],"assuming":[45],"knowledge":[46],"starting":[49],"belief":[50,77,93,131,168],"point,":[51],"an":[52,103],"assumption":[53],"that":[54,136],"often":[55],"does":[56],"not":[57],"hold":[58],"in":[59,64,170],"complex,":[60],"uncertain":[61],"domains.":[62],"Instead,":[63],"such":[65],"domains,":[66],"it":[67],"is":[68],"important":[69],"agents":[71],"plan":[74],"over":[75,91,166],"continuous":[76,92,167],"spaces.":[78],"This":[79],"paper":[80],"provides":[81],"novel":[83],"algorithm":[84,144],"compute":[87],"finite":[88],"horizon":[89],"policies":[90,118,165],"spaces,":[94],"without":[95],"restricting":[96],"the":[97,130,139,142,151,158],"space":[98],"By":[101],"marrying":[102],"efficient":[104],"single-agent":[105],"POMDP":[106,112],"solver":[107],"with":[108],"heuristic":[110],"distributed":[111,171],"policy-generation":[113],"algorithm,":[114],"joint":[117],"obtained,":[120],"each":[121],"which":[123],"dominates":[124],"within":[125],"part":[128],"region.":[132],"We":[133],"provide":[134,146],"heuristics":[135],"significantly":[137],"improve":[138],"efficiency":[140],"resulting":[143],"detailed":[147],"experimental":[148],"results.":[149],"To":[150],"best":[152],"our":[154],"knowledge,":[155],"first":[159],"run-time":[160],"results":[161],"analytically":[163],"generating":[164],"spaces":[169],"POMDPs.":[172]},"counts_by_year":[{"year":2015,"cited_by_count":1},{"year":2013,"cited_by_count":2}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
