{"id":"https://openalex.org/W7128728229","doi":"https://doi.org/10.48550/arxiv.2602.10938","title":"Multi-Environment MDPs with Prior and Universal Semantics","display_name":"Multi-Environment MDPs with Prior and Universal Semantics","publication_year":2026,"publication_date":"2026-02-11","ids":{"openalex":"https://openalex.org/W7128728229","doi":"https://doi.org/10.48550/arxiv.2602.10938"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.10938","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5004833643","display_name":"Benjamin Bordais","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Bordais, Benjamin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5125725171","display_name":"Jean-Fran\u00e7ois Raskin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Raskin, Jean-Fran\u00e7ois","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5004833643"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11303","display_name":"Bayesian Modeling and Causal Inference","score":0.3046000003814697,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11303","display_name":"Bayesian Modeling and Causal Inference","score":0.3046000003814697,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11010","display_name":"Logic, Reasoning, and Knowledge","score":0.3012999892234802,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.1251000016927719,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/unary-operation","display_name":"Unary operation","score":0.7649000287055969},{"id":"https://openalex.org/keywords/decidability","display_name":"Decidability","score":0.6394000053405762},{"id":"https://openalex.org/keywords/markov-decision-process","display_name":"Markov decision process","score":0.5647000074386597},{"id":"https://openalex.org/keywords/undecidable-problem","display_name":"Undecidable problem","score":0.4560999870300293},{"id":"https://openalex.org/keywords/infimum-and-supremum","display_name":"Infimum and supremum","score":0.44209998846054077},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.4397999942302704},{"id":"https://openalex.org/keywords/pspace","display_name":"PSPACE","score":0.3955000042915344},{"id":"https://openalex.org/keywords/decision-problem","display_name":"Decision problem","score":0.37720000743865967},{"id":"https://openalex.org/keywords/partially-observable-markov-decision-process","display_name":"Partially observable Markov decision process","score":0.37709999084472656},{"id":"https://openalex.org/keywords/equivalence","display_name":"Equivalence (formal languages)","score":0.34619998931884766}],"concepts":[{"id":"https://openalex.org/C78023250","wikidata":"https://www.wikidata.org/wiki/Q657596","display_name":"Unary operation","level":2,"score":0.7649000287055969},{"id":"https://openalex.org/C153269930","wikidata":"https://www.wikidata.org/wiki/Q430001","display_name":"Decidability","level":2,"score":0.6394000053405762},{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.5647000074386597},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.5615000128746033},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.5072000026702881},{"id":"https://openalex.org/C118615104","wikidata":"https://www.wikidata.org/wiki/Q121416","display_name":"Discrete mathematics","level":1,"score":0.4569999873638153},{"id":"https://openalex.org/C192034797","wikidata":"https://www.wikidata.org/wiki/Q3502995","display_name":"Undecidable problem","level":3,"score":0.4560999870300293},{"id":"https://openalex.org/C95611797","wikidata":"https://www.wikidata.org/wiki/Q17502105","display_name":"Infimum and supremum","level":2,"score":0.44209998846054077},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.4397999942302704},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.39739999175071716},{"id":"https://openalex.org/C197685441","wikidata":"https://www.wikidata.org/wiki/Q500716","display_name":"PSPACE","level":3,"score":0.3955000042915344},{"id":"https://openalex.org/C115988155","wikidata":"https://www.wikidata.org/wiki/Q3262192","display_name":"Decision problem","level":2,"score":0.37720000743865967},{"id":"https://openalex.org/C17098449","wikidata":"https://www.wikidata.org/wiki/Q176814","display_name":"Partially observable Markov decision process","level":4,"score":0.37709999084472656},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.376800000667572},{"id":"https://openalex.org/C2780069185","wikidata":"https://www.wikidata.org/wiki/Q7977945","display_name":"Equivalence (formal languages)","level":2,"score":0.34619998931884766},{"id":"https://openalex.org/C183778304","wikidata":"https://www.wikidata.org/wiki/Q165474","display_name":"Commutative property","level":2,"score":0.337799996137619},{"id":"https://openalex.org/C168773769","wikidata":"https://www.wikidata.org/wiki/Q1350299","display_name":"Satisfiability","level":2,"score":0.3337000012397766},{"id":"https://openalex.org/C167729594","wikidata":"https://www.wikidata.org/wiki/Q17736","display_name":"Axiom","level":2,"score":0.328900009393692},{"id":"https://openalex.org/C106301342","wikidata":"https://www.wikidata.org/wiki/Q4117933","display_name":"Entropy (arrow of time)","level":2,"score":0.3280999958515167},{"id":"https://openalex.org/C311688","wikidata":"https://www.wikidata.org/wiki/Q2393193","display_name":"Time complexity","level":2,"score":0.3028999865055084},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.30219998955726624},{"id":"https://openalex.org/C2777151079","wikidata":"https://www.wikidata.org/wiki/Q141160","display_name":"Parity (physics)","level":2,"score":0.29750001430511475},{"id":"https://openalex.org/C189950617","wikidata":"https://www.wikidata.org/wiki/Q937228","display_name":"Property (philosophy)","level":2,"score":0.29350000619888306},{"id":"https://openalex.org/C46274116","wikidata":"https://www.wikidata.org/wiki/Q185521","display_name":"Truth value","level":2,"score":0.2840000092983246},{"id":"https://openalex.org/C3309909","wikidata":"https://www.wikidata.org/wiki/Q864155","display_name":"Binary decision diagram","level":2,"score":0.27959999442100525},{"id":"https://openalex.org/C2776291640","wikidata":"https://www.wikidata.org/wiki/Q2912517","display_name":"Value (mathematics)","level":2,"score":0.27320000529289246},{"id":"https://openalex.org/C135315306","wikidata":"https://www.wikidata.org/wiki/Q866364","display_name":"Bisimulation","level":2,"score":0.27090001106262207},{"id":"https://openalex.org/C110251889","wikidata":"https://www.wikidata.org/wiki/Q1569697","display_name":"Model checking","level":2,"score":0.26840001344680786},{"id":"https://openalex.org/C39637292","wikidata":"https://www.wikidata.org/wiki/Q908207","display_name":"Complexity class","level":3,"score":0.2676999866962433},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.2578999996185303},{"id":"https://openalex.org/C72434380","wikidata":"https://www.wikidata.org/wiki/Q230930","display_name":"State space","level":2,"score":0.25699999928474426},{"id":"https://openalex.org/C98763669","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov chain","level":2,"score":0.25459998846054077},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.2540999948978424},{"id":"https://openalex.org/C32848918","wikidata":"https://www.wikidata.org/wiki/Q845789","display_name":"Observable","level":2,"score":0.2508000135421753}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.10938","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.10938","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.10938","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.10938","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions","score":0.6683189272880554}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Multiple-environment":[0],"Markov":[1],"decision":[2],"processes":[3],"(MEMDPs)":[4],"equip":[5],"an":[6,38,104,192],"MDP":[7],"with":[8,92,106,116,166,214],"several":[9],"probabilistic":[10],"transition":[11],"functions":[12],"(one":[13],"per":[14],"possible":[15],"environment)":[16],"so":[17],"that":[18,72,99,143,185,203,211,223],"the":[19,24,34,41,45,49,62,73,87,100,122,144,148,162,167,188,201],"state":[20],"is":[21,26,51,126],"observable":[22],"but":[23],"environment":[25,50],"not.":[27],"Previous":[28],"work":[29],"studies":[30],"two":[31],"semantics:":[32],"(i)":[33],"universal":[35,145,163],"semantics,":[36,47],"where":[37,48],"adversary":[39],"picks":[40],"environment;":[42],"and":[43,80,208,228],"(ii)":[44],"prior":[46,93,101,151,189],"drawn":[52],"once":[53],"before":[54],"execution":[55],"from":[56],"a":[57,83,107,117,158,220,226],"fixed":[58],"distribution.":[59],"We":[60,140],"clarify":[61],"relation":[63],"between":[64],"these":[65],"semantics.":[66,94],"For":[67],"parity":[68,108],"objectives,":[69],"we":[70,81,97,183,209],"show":[71,98],"qualitative":[74],"questions,":[75],"i.e.":[76],"value":[77,89,102,146],"one,":[78],"coincide,":[79],"develop":[82],"new":[84,159],"algorithm":[85,160],"for":[86,161,171],"general":[88],"of":[90,103,150,196,232],"MEMDP":[91,105],"In":[95],"particular,":[96],"objective":[109],"can":[110],"be":[111],"approximated":[112],"to":[113,219],"any":[114,212],"precision":[115],"space":[118],"efficient":[119],"algorithm;":[120],"equivalently,":[121],"associated":[123],"gap":[124,164],"problem":[125,165],"decidable":[127],"in":[128,134,137,175],"PSPACE":[129],"when":[130],"probabilities":[131],"are":[132],"given":[133],"unary":[135,172],"(and":[136],"EXPSPACE":[138,174],"otherwise).":[139],"then":[141],"prove":[142],"equals":[147],"infimum":[149],"values":[152],"over":[153],"all":[154],"beliefs.":[155],"This":[156],"yields":[157],"same":[168],"complexity":[169],"(PSPACE":[170],"probabilities,":[173],"general),":[176],"improving":[177],"on":[178],"earlier":[179],"doubly-exponential-space":[180],"procedures.":[181],"Finally,":[182],"observe":[184],"MEMDPs":[186],"under":[187],"semantics":[190],"form":[191],"important":[193],"tractable":[194],"subclass":[195,231],"POMDPs:":[197],"our":[198],"algorithms":[199],"exploit":[200],"fact":[202],"belief":[204],"entropy":[205],"never":[206],"increases,":[207],"establish":[210],"POMDP":[213],"this":[215],"property":[216],"reduces":[217],"effectively":[218],"prior-MEMDP,":[221],"showing":[222],"prior-MEMDPs":[224],"capture":[225],"broad":[227],"practically":[229],"relevant":[230],"POMDPs.":[233]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-02-13T00:00:00"}
