{"id":"https://openalex.org/W2144913588","doi":"https://doi.org/10.1613/jair.2567","title":"Online Planning Algorithms for POMDPs","display_name":"Online Planning Algorithms for POMDPs","publication_year":2008,"publication_date":"2008-07-29","ids":{"openalex":"https://openalex.org/W2144913588","doi":"https://doi.org/10.1613/jair.2567","mag":"2144913588","pmid":"https://pubmed.ncbi.nlm.nih.gov/19777080"},"language":"en","primary_location":{"id":"doi:10.1613/jair.2567","is_oa":true,"landing_page_url":"https://doi.org/10.1613/jair.2567","pdf_url":"https://jair.org/index.php/jair/article/download/10559/25275","source":{"id":"https://openalex.org/S139930977","display_name":"Journal of Artificial Intelligence Research","issn_l":"1076-9757","issn":["1076-9757","1943-5037"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310315760","host_organization_name":"AI Access Foundation","host_organization_lineage":["https://openalex.org/P4310315760"],"host_organization_lineage_names":["AI Access Foundation"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Artificial Intelligence Research","raw_type":"journal-article"},"type":"article","indexed_in":["arxiv","crossref","doaj","pubmed"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://jair.org/index.php/jair/article/download/10559/25275","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5057087592","display_name":"St\u00e9phane Ross","orcid":null},"institutions":[{"id":"https://openalex.org/I5023651","display_name":"McGill University","ror":"https://ror.org/01pxwe438","country_code":"CA","type":"education","lineage":["https://openalex.org/I5023651"]}],"countries":["CA"],"is_corresponding":true,"raw_author_name":"S. Ross","raw_affiliation_strings":["School of Computer Science, McGill University Montreal, Canada"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science, McGill University Montreal, Canada","institution_ids":["https://openalex.org/I5023651"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080591144","display_name":"Jo\u00eblle Pineau","orcid":"https://orcid.org/0000-0003-0747-7250"},"institutions":[{"id":"https://openalex.org/I5023651","display_name":"McGill University","ror":"https://ror.org/01pxwe438","country_code":"CA","type":"education","lineage":["https://openalex.org/I5023651"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"J. Pineau","raw_affiliation_strings":["School of Computer Science, McGill University Montreal, Canada"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science, McGill University Montreal, Canada","institution_ids":["https://openalex.org/I5023651"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057997109","display_name":"S. Paquet","orcid":"https://orcid.org/0000-0001-5953-7003"},"institutions":[{"id":"https://openalex.org/I43406934","display_name":"Universit\u00e9 Laval","ror":"https://ror.org/04sjchr03","country_code":"CA","type":"education","lineage":["https://openalex.org/I43406934"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"S. Paquet","raw_affiliation_strings":["Department of Computer Science and Software Engineering, Laval University, Quebec, Canada#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Software Engineering, Laval University, Quebec, Canada#TAB#","institution_ids":["https://openalex.org/I43406934"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5002976111","display_name":"Brahim Chaib-draa","orcid":"https://orcid.org/0000-0001-7615-5154"},"institutions":[{"id":"https://openalex.org/I43406934","display_name":"Universit\u00e9 Laval","ror":"https://ror.org/04sjchr03","country_code":"CA","type":"education","lineage":["https://openalex.org/I43406934"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"B. Chaib-draa","raw_affiliation_strings":["Department of Computer Science and Software Engineering, Laval University, Quebec, Canada#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Software Engineering, Laval University, Quebec, Canada#TAB#","institution_ids":["https://openalex.org/I43406934"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5057087592"],"corresponding_institution_ids":["https://openalex.org/I5023651"],"apc_list":null,"apc_paid":null,"fwci":51.1269,"has_fulltext":true,"cited_by_count":515,"citation_normalized_percentile":{"value":0.99879703,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":"32","issue":"2","first_page":"663","last_page":"704"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11303","display_name":"Bayesian Modeling and Causal Inference","score":0.9941999912261963,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12288","display_name":"Optimization and Search Problems","score":0.9904000163078308,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/partially-observable-markov-decision-process","display_name":"Partially observable Markov decision process","score":0.9499622583389282},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7886300086975098},{"id":"https://openalex.org/keywords/heuristic","display_name":"Heuristic","score":0.6444786190986633},{"id":"https://openalex.org/keywords/markov-decision-process","display_name":"Markov decision process","score":0.6145442128181458},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.5308937430381775},{"id":"https://openalex.org/keywords/upper-and-lower-bounds","display_name":"Upper and lower bounds","score":0.519550621509552},{"id":"https://openalex.org/keywords/reduction","display_name":"Reduction (mathematics)","score":0.4833102226257324},{"id":"https://openalex.org/keywords/observable","display_name":"Observable","score":0.4531848132610321},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.43004170060157776},{"id":"https://openalex.org/keywords/computational-complexity-theory","display_name":"Computational complexity theory","score":0.4279555678367615},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.42777812480926514},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.37828412652015686},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3600562810897827},{"id":"https://openalex.org/keywords/markov-process","display_name":"Markov process","score":0.3118782043457031},{"id":"https://openalex.org/keywords/markov-chain","display_name":"Markov chain","score":0.2799345850944519},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.23402827978134155},{"id":"https://openalex.org/keywords/markov-model","display_name":"Markov model","score":0.22000858187675476},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.13512703776359558}],"concepts":[{"id":"https://openalex.org/C17098449","wikidata":"https://www.wikidata.org/wiki/Q176814","display_name":"Partially observable Markov decision process","level":4,"score":0.9499622583389282},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7886300086975098},{"id":"https://openalex.org/C173801870","wikidata":"https://www.wikidata.org/wiki/Q201413","display_name":"Heuristic","level":2,"score":0.6444786190986633},{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.6145442128181458},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.5308937430381775},{"id":"https://openalex.org/C77553402","wikidata":"https://www.wikidata.org/wiki/Q13222579","display_name":"Upper and lower bounds","level":2,"score":0.519550621509552},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.4833102226257324},{"id":"https://openalex.org/C32848918","wikidata":"https://www.wikidata.org/wiki/Q845789","display_name":"Observable","level":2,"score":0.4531848132610321},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.43004170060157776},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.4279555678367615},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.42777812480926514},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.37828412652015686},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3600562810897827},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.3118782043457031},{"id":"https://openalex.org/C98763669","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov chain","level":2,"score":0.2799345850944519},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.23402827978134155},{"id":"https://openalex.org/C163836022","wikidata":"https://www.wikidata.org/wiki/Q6771326","display_name":"Markov model","level":3,"score":0.22000858187675476},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.13512703776359558},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":7,"locations":[{"id":"doi:10.1613/jair.2567","is_oa":true,"landing_page_url":"https://doi.org/10.1613/jair.2567","pdf_url":"https://jair.org/index.php/jair/article/download/10559/25275","source":{"id":"https://openalex.org/S139930977","display_name":"Journal of Artificial Intelligence Research","issn_l":"1076-9757","issn":["1076-9757","1943-5037"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310315760","host_organization_name":"AI Access Foundation","host_organization_lineage":["https://openalex.org/P4310315760"],"host_organization_lineage_names":["AI Access Foundation"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Artificial Intelligence Research","raw_type":"journal-article"},{"id":"pmid:19777080","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/19777080","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The journal of artificial intelligence research","raw_type":null},{"id":"pmh:oai:arXiv.org:1401.3436","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1401.3436","pdf_url":"https://arxiv.org/pdf/1401.3436","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.156.1558","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.156.1558","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://damas.ift.ulaval.ca/publications/RossOnlinePOMDPJAIR.pdf","raw_type":"text"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.329.7978","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.329.7978","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"https://www.aaai.org/Papers/JAIR/Vol32/JAIR-3217.pdf","raw_type":"text"},{"id":"pmh:oai:pubmedcentral.nih.gov:2748358","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"J Artif Intell Res","raw_type":"Text"},{"id":"pmh:oai:pubmedcentral.nih.gov:2748358","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/2748358","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"J Artif Intell Res","raw_type":"Text"}],"best_oa_location":{"id":"doi:10.1613/jair.2567","is_oa":true,"landing_page_url":"https://doi.org/10.1613/jair.2567","pdf_url":"https://jair.org/index.php/jair/article/download/10559/25275","source":{"id":"https://openalex.org/S139930977","display_name":"Journal of Artificial Intelligence Research","issn_l":"1076-9757","issn":["1076-9757","1943-5037"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310315760","host_organization_name":"AI Access Foundation","host_organization_lineage":["https://openalex.org/P4310315760"],"host_organization_lineage_names":["AI Access Foundation"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Artificial Intelligence Research","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.7900000214576721,"id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320321747","display_name":"Fonds Qu\u00e9b\u00e9cois de la Recherche sur la Nature et les Technologies","ror":"https://ror.org/00b9f9778"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2144913588.pdf","grobid_xml":"https://content.openalex.org/works/W2144913588.grobid-xml"},"referenced_works_count":65,"referenced_works":["https://openalex.org/W9419878","https://openalex.org/W34327539","https://openalex.org/W105074360","https://openalex.org/W158205031","https://openalex.org/W183139520","https://openalex.org/W1484113995","https://openalex.org/W1491973539","https://openalex.org/W1494689917","https://openalex.org/W1498235675","https://openalex.org/W1515891729","https://openalex.org/W1532688806","https://openalex.org/W1539216098","https://openalex.org/W1549519846","https://openalex.org/W1556274146","https://openalex.org/W1563965851","https://openalex.org/W1575388622","https://openalex.org/W1581055761","https://openalex.org/W1636455720","https://openalex.org/W1864896197","https://openalex.org/W2009533501","https://openalex.org/W2011418219","https://openalex.org/W2012664173","https://openalex.org/W2032100464","https://openalex.org/W2034221837","https://openalex.org/W2034713309","https://openalex.org/W2034725503","https://openalex.org/W2044375425","https://openalex.org/W2061226732","https://openalex.org/W2096976789","https://openalex.org/W2101421095","https://openalex.org/W2103614073","https://openalex.org/W2105757562","https://openalex.org/W2110962519","https://openalex.org/W2119567691","https://openalex.org/W2134802714","https://openalex.org/W2144283793","https://openalex.org/W2144913588","https://openalex.org/W2149476049","https://openalex.org/W2152475379","https://openalex.org/W2167353639","https://openalex.org/W2168359464","https://openalex.org/W2169294731","https://openalex.org/W2253611143","https://openalex.org/W2271240761","https://openalex.org/W2341171179","https://openalex.org/W2949905447","https://openalex.org/W2963889160","https://openalex.org/W3016548437","https://openalex.org/W3023151133","https://openalex.org/W3101822862","https://openalex.org/W3150017941","https://openalex.org/W4254588228","https://openalex.org/W6607456006","https://openalex.org/W6629836980","https://openalex.org/W6631000544","https://openalex.org/W6639035346","https://openalex.org/W6653037687","https://openalex.org/W6658445969","https://openalex.org/W6675087251","https://openalex.org/W6679977494","https://openalex.org/W6681633084","https://openalex.org/W6682302528","https://openalex.org/W6684794184","https://openalex.org/W6704298589","https://openalex.org/W7001894244"],"related_works":["https://openalex.org/W2999848267","https://openalex.org/W2096013579","https://openalex.org/W52153049","https://openalex.org/W1760611253","https://openalex.org/W1589140671","https://openalex.org/W1515117609","https://openalex.org/W4323315247","https://openalex.org/W131709709","https://openalex.org/W3169161914","https://openalex.org/W4321379664"],"abstract_inverted_index":{"Partially":[0],"Observable":[1],"Markov":[2],"Decision":[3],"Processes":[4],"(POMDPs)":[5],"provide":[6],"a":[7,20,61],"rich":[8],"framework":[9],"for":[10,26],"sequential":[11],"decision-making":[12],"under":[13,109],"uncertainty":[14],"in":[15,75,106],"stochastic":[16],"domains.":[17],"However,":[18],"solving":[19],"POMDP":[21,88,132],"is":[22],"often":[23],"intractable":[24],"except":[25],"small":[27],"problems":[28],"due":[29],"to":[30,64,69,82,100],"their":[31,91,95],"complexity.":[32],"Here,":[33],"we":[34],"focus":[35],"on":[36],"online":[37,87,104,125],"approaches":[38,105],"that":[39,123],"alleviate":[40],"the":[41,54,66,84],"computational":[42],"complexity":[43],"by":[44],"computing":[45],"good":[46],"local":[47],"policies":[48],"at":[49,71],"each":[50,72],"decision":[51],"step":[52,74],"during":[53],"execution.":[55],"Online":[56],"algorithms":[57],"generally":[58],"consist":[59],"of":[60],"lookahead":[62],"search":[63,127],"find":[65],"best":[67],"action":[68],"execute":[70],"time":[73],"an":[76],"environment.":[77],"Our":[78,119],"objectives":[79],"here":[80],"are":[81],"survey":[83],"various":[85,110],"existing":[86],"methods,":[89],"analyze":[90],"properties":[92],"and":[93,97,99],"discuss":[94],"advantages":[96],"disadvantages;":[98],"thoroughly":[101],"evaluate":[102],"these":[103],"different":[107],"environments":[108],"metrics":[111],"(return,":[112],"error":[113],"bound":[114,117],"reduction,":[115],"lower":[116],"improvement).":[118],"experimental":[120],"results":[121],"indicate":[122],"state-of-the-art":[124],"heuristic":[126],"methods":[128],"can":[129],"handle":[130],"large":[131],"domains":[133],"efficiently.":[134]},"counts_by_year":[{"year":2026,"cited_by_count":4},{"year":2025,"cited_by_count":11},{"year":2024,"cited_by_count":13},{"year":2023,"cited_by_count":23},{"year":2022,"cited_by_count":26},{"year":2021,"cited_by_count":37},{"year":2020,"cited_by_count":45},{"year":2019,"cited_by_count":32},{"year":2018,"cited_by_count":27},{"year":2017,"cited_by_count":28},{"year":2016,"cited_by_count":35},{"year":2015,"cited_by_count":42},{"year":2014,"cited_by_count":32},{"year":2013,"cited_by_count":41},{"year":2012,"cited_by_count":32}],"updated_date":"2026-06-06T09:05:17.133730","created_date":"2025-10-10T00:00:00"}
