{"id":"https://openalex.org/W7155533611","doi":"https://doi.org/10.48550/arxiv.2604.21256","title":"Robustness Analysis of POMDP Policies to Observation Perturbations","display_name":"Robustness Analysis of POMDP Policies to Observation Perturbations","publication_year":2026,"publication_date":"2026-04-23","ids":{"openalex":"https://openalex.org/W7155533611","doi":"https://doi.org/10.48550/arxiv.2604.21256"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.21256","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.21256","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.21256","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5061462804","display_name":"Benjamin Kraske","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kraske, Benjamin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134494741","display_name":"Qi Heng Ho","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ho, Qi Heng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134511077","display_name":"Federico Rossi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rossi, Federico","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134488827","display_name":"Morteza Lahijanian","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lahijanian, Morteza","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5134483239","display_name":"Zachary Sunberg","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sunberg, Zachary","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.6481999754905701,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.6481999754905701,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10791","display_name":"Advanced Control Systems Optimization","score":0.0478999987244606,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13553","display_name":"Age of Information Optimization","score":0.04309999942779541,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.8271999955177307},{"id":"https://openalex.org/keywords/partially-observable-markov-decision-process","display_name":"Partially observable Markov decision process","score":0.8090000152587891},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.5692999958992004},{"id":"https://openalex.org/keywords/markov-decision-process","display_name":"Markov decision process","score":0.5098999738693237},{"id":"https://openalex.org/keywords/soundness","display_name":"Soundness","score":0.4643999934196472},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.40119999647140503},{"id":"https://openalex.org/keywords/heuristics","display_name":"Heuristics","score":0.3614000082015991},{"id":"https://openalex.org/keywords/quadratic-equation","display_name":"Quadratic equation","score":0.36039999127388}],"concepts":[{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.8271999955177307},{"id":"https://openalex.org/C17098449","wikidata":"https://www.wikidata.org/wiki/Q176814","display_name":"Partially observable Markov decision process","level":4,"score":0.8090000152587891},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5842999815940857},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.5692999958992004},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.5637999773025513},{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.5098999738693237},{"id":"https://openalex.org/C39920170","wikidata":"https://www.wikidata.org/wiki/Q693083","display_name":"Soundness","level":2,"score":0.4643999934196472},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.40119999647140503},{"id":"https://openalex.org/C127705205","wikidata":"https://www.wikidata.org/wiki/Q5748245","display_name":"Heuristics","level":2,"score":0.3614000082015991},{"id":"https://openalex.org/C129844170","wikidata":"https://www.wikidata.org/wiki/Q41299","display_name":"Quadratic equation","level":2,"score":0.36039999127388},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3230000138282776},{"id":"https://openalex.org/C98763669","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov chain","level":2,"score":0.32170000672340393},{"id":"https://openalex.org/C2778067643","wikidata":"https://www.wikidata.org/wiki/Q166507","display_name":"Interval (graph theory)","level":2,"score":0.3215999901294708},{"id":"https://openalex.org/C72169020","wikidata":"https://www.wikidata.org/wiki/Q194404","display_name":"Monotonic function","level":2,"score":0.31940001249313354},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.30820000171661377},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.29789999127388},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.28450000286102295},{"id":"https://openalex.org/C311688","wikidata":"https://www.wikidata.org/wiki/Q2393193","display_name":"Time complexity","level":2,"score":0.2831000089645386},{"id":"https://openalex.org/C32848918","wikidata":"https://www.wikidata.org/wiki/Q845789","display_name":"Observable","level":2,"score":0.27900001406669617},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.26440000534057617},{"id":"https://openalex.org/C151376022","wikidata":"https://www.wikidata.org/wiki/Q168698","display_name":"Exponential function","level":2,"score":0.25540000200271606},{"id":"https://openalex.org/C137836250","wikidata":"https://www.wikidata.org/wiki/Q984063","display_name":"Optimization problem","level":2,"score":0.2524999976158142},{"id":"https://openalex.org/C31531917","wikidata":"https://www.wikidata.org/wiki/Q915157","display_name":"Robust control","level":3,"score":0.25110000371932983}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.21256","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.21256","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.21256","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.21256","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16","score":0.8050127625465393}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Policies":[0],"for":[1,192],"Partially":[2],"Observable":[3],"Markov":[4],"Decision":[5],"Processes":[6],"(POMDPs)":[7],"are":[8,92,157],"often":[9],"designed":[10],"using":[11,141],"a":[12,69,80,119],"nominal":[13],"system":[14,25],"model.":[15,54],"In":[16],"practice,":[17],"this":[18,201],"model":[19,72],"can":[20,104,115],"deviate":[21],"from":[22,250],"the":[23,51,57,64,75,87,99,110,125,131,134,145,149,174,194,208,218,228,257,261],"true":[24],"during":[26],"deployment":[27],"due":[28],"to":[29,39,62,166,236],"factors":[30],"such":[31],"as":[32,118],"calibration":[33],"drift":[34],"or":[35],"sensor":[36],"degradation,":[37],"leading":[38],"unexpected":[40],"performance":[41],"degradation.":[42],"This":[43,137],"work":[44],"studies":[45,249],"policy":[46],"robustness":[47],"against":[48],"deviations":[49,91],"in":[50,68,123,130,144,173,207,217],"POMDP":[52,237],"observation":[53,71,135],"We":[55,83,107,180,199,221,245],"introduce":[56],"Policy":[58,111],"Observation":[59,112],"Robustness":[60,113],"Problem:":[61],"determine":[63],"maximum":[65],"tolerable":[66],"deviation":[67],"POMDP's":[70],"that":[73,109,154],"guarantees":[74],"policy's":[76],"value":[77],"remains":[78],"above":[79],"specified":[81],"threshold.":[82],"analyze":[84],"two":[85],"variants:":[86],"sticky":[88,195,219],"variant,":[89,101,151],"where":[90,102],"dependent":[93],"on":[94,171],"state":[95],"and":[96,98,189,196,211,226,252,263],"actions,":[97],"non-sticky":[100,150,197,209],"they":[103],"be":[105,116],"history-dependent.":[106],"show":[108,153,200],"Problem":[114],"formulated":[117],"bi-level":[120],"optimization":[121,127],"problem":[122,262],"which":[124,169,255],"inner":[126],"is":[128,164],"monotonic":[129],"size":[132],"of":[133,230,232,241,243,260],"deviation.":[136],"enables":[138],"efficient":[139],"solutions":[140],"root-finding":[142],"algorithms":[143],"outer":[146],"optimization.":[147],"For":[148],"we":[152],"when":[155],"policies":[156],"represented":[158],"with":[159,187,239],"finite-state":[160],"controllers":[161],"(FSCs)":[162],"it":[163],"sufficient":[165],"consider":[167],"observations":[168],"depend":[170],"nodes":[172],"FSC":[175],"rather":[176],"than":[177],"full":[178],"histories.":[179],"present":[181],"Robust":[182,233],"Interval":[183,234],"Search,":[184],"an":[185],"algorithm":[186,202],"soundness":[188],"convergence":[190],"guarantees,":[191],"both":[193],"variants.":[198],"has":[203],"polynomial":[204],"time":[205,215],"complexity":[206,216],"variant":[210],"at":[212],"most":[213],"exponential":[214],"variant.":[220],"provide":[222,247],"experimental":[223],"results":[224],"validating":[225],"demonstrating":[227],"scalability":[229],"implementations":[231],"Search":[235],"problems":[238],"tens":[240],"thousands":[242],"states.":[244],"also":[246],"case":[248],"robotics":[251],"operations":[253],"research":[254],"demonstrate":[256],"practical":[258],"utility":[259],"algorithms.":[264]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-25T00:00:00"}
