{"id":"https://openalex.org/W7156292032","doi":"https://doi.org/10.48550/arxiv.2604.22244","title":"Learning Control Policies to Provably Satisfy Hard Affine Constraints for Black-Box Hybrid Dynamical Systems","display_name":"Learning Control Policies to Provably Satisfy Hard Affine Constraints for Black-Box Hybrid Dynamical Systems","publication_year":2026,"publication_date":"2026-04-24","ids":{"openalex":"https://openalex.org/W7156292032","doi":"https://doi.org/10.48550/arxiv.2604.22244"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.22244","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.22244","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.22244","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5109664305","display_name":"Aayushi Shrivastava","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shrivastava, Aayushi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047760830","display_name":"Kartik Nagpal","orcid":"https://orcid.org/0000-0001-8973-5959"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nagpal, Kartik","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5116671896","display_name":"Sairam Jinkala","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jinkala, Sairam","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069947744","display_name":"J. Bouvier","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bouvier, Jean-Baptiste","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5134705742","display_name":"Negar Mehr","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mehr, Negar","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.4507000148296356,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.4507000148296356,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.13230000436306,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.1168999969959259,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/dynamical-systems-theory","display_name":"Dynamical systems theory","score":0.6162999868392944},{"id":"https://openalex.org/keywords/affine-transformation","display_name":"Affine transformation","score":0.6018000245094299},{"id":"https://openalex.org/keywords/hybrid-system","display_name":"Hybrid system","score":0.5306000113487244},{"id":"https://openalex.org/keywords/reachability","display_name":"Reachability","score":0.513700008392334},{"id":"https://openalex.org/keywords/reset","display_name":"Reset (finance)","score":0.5077999830245972},{"id":"https://openalex.org/keywords/constraint","display_name":"Constraint (computer-aided design)","score":0.4993000030517578},{"id":"https://openalex.org/keywords/nonlinear-system","display_name":"Nonlinear system","score":0.4796999990940094},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.4758000075817108},{"id":"https://openalex.org/keywords/dynamical-system","display_name":"Dynamical system (definition)","score":0.4666000008583069}],"concepts":[{"id":"https://openalex.org/C79379906","wikidata":"https://www.wikidata.org/wiki/Q3174497","display_name":"Dynamical systems theory","level":2,"score":0.6162999868392944},{"id":"https://openalex.org/C92757383","wikidata":"https://www.wikidata.org/wiki/Q382497","display_name":"Affine transformation","level":2,"score":0.6018000245094299},{"id":"https://openalex.org/C50897621","wikidata":"https://www.wikidata.org/wiki/Q2665508","display_name":"Hybrid system","level":2,"score":0.5306000113487244},{"id":"https://openalex.org/C136643341","wikidata":"https://www.wikidata.org/wiki/Q1361526","display_name":"Reachability","level":2,"score":0.513700008392334},{"id":"https://openalex.org/C2779795794","wikidata":"https://www.wikidata.org/wiki/Q7315343","display_name":"Reset (finance)","level":2,"score":0.5077999830245972},{"id":"https://openalex.org/C2776036281","wikidata":"https://www.wikidata.org/wiki/Q48769818","display_name":"Constraint (computer-aided design)","level":2,"score":0.4993000030517578},{"id":"https://openalex.org/C158622935","wikidata":"https://www.wikidata.org/wiki/Q660848","display_name":"Nonlinear system","level":2,"score":0.4796999990940094},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.47600001096725464},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.4758000075817108},{"id":"https://openalex.org/C33962884","wikidata":"https://www.wikidata.org/wiki/Q378637","display_name":"Dynamical system (definition)","level":3,"score":0.4666000008583069},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.4465999901294708},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.3864000141620636},{"id":"https://openalex.org/C110639684","wikidata":"https://www.wikidata.org/wiki/Q20702","display_name":"Pendulum","level":2,"score":0.3734999895095825},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.36649999022483826},{"id":"https://openalex.org/C197115733","wikidata":"https://www.wikidata.org/wiki/Q1003136","display_name":"Forcing (mathematics)","level":2,"score":0.359499990940094},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.33660000562667847},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.3253999948501587},{"id":"https://openalex.org/C91581856","wikidata":"https://www.wikidata.org/wiki/Q2707001","display_name":"Nonlinear control","level":3,"score":0.31189998984336853},{"id":"https://openalex.org/C192921069","wikidata":"https://www.wikidata.org/wiki/Q550134","display_name":"Inverted pendulum","level":3,"score":0.30649998784065247},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.30320000648498535},{"id":"https://openalex.org/C91575142","wikidata":"https://www.wikidata.org/wiki/Q1971426","display_name":"Optimal control","level":2,"score":0.30079999566078186},{"id":"https://openalex.org/C77405623","wikidata":"https://www.wikidata.org/wiki/Q598451","display_name":"System dynamics","level":2,"score":0.295199990272522},{"id":"https://openalex.org/C203479927","wikidata":"https://www.wikidata.org/wiki/Q5165939","display_name":"Controller (irrigation)","level":2,"score":0.2761000096797943},{"id":"https://openalex.org/C17500928","wikidata":"https://www.wikidata.org/wiki/Q959968","display_name":"Control system","level":2,"score":0.2623000144958496}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.22244","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.22244","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.22244","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.22244","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","score":0.748664915561676,"display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Ensuring":[0],"safety":[1,25,58,175,220],"for":[2,23,81,107,128],"black-box":[3,82],"hybrid":[4,83,146,193],"dynamical":[5,84,194],"systems":[6,85,195],"presents":[7],"significant":[8],"challenges":[9],"due":[10,131,138],"to":[11,68,98,132,139],"their":[12],"instantaneous":[13,133],"state":[14,76,134],"jumps":[15,135],"and":[16,33,101,189,200],"unknown":[17,109],"explicit":[18],"nonlinear":[19,110],"dynamics.":[20,42],"Existing":[21],"solutions":[22],"strict":[24],"constraint":[26,105,129],"satisfaction,":[27],"like":[28,196],"control":[29],"barrier":[30],"functions":[31],"(CBFs)":[32],"reachability":[34],"analysis,":[35],"rely":[36,50],"on":[37,51,192],"direct":[38],"knowledge":[39],"of":[40,112],"the":[41,95,104,108,113,118,123,145,156,164,197,219],"Similarly,":[43],"safe":[44],"reinforcement":[45],"learning":[46],"(RL)":[47],"approaches":[48],"often":[49],"known":[52],"system":[53,147],"dynamics":[54,111],"or":[55,141],"merely":[56],"discourage":[57],"violations":[59],"through":[60],"reward":[61,187],"shaping.":[62],"In":[63,204],"this":[64],"work,":[65],"we":[66,207],"want":[67],"learn":[69],"RL":[70,96],"policies":[71,173,215],"which":[72,171],"provably":[73],"satisfy":[74,174],"affine":[75,87,100,153],"constraints":[77,176],"in":[78,144,177],"closed":[79,178],"loop":[80],"with":[86,185],"reset":[88,142,157],"maps.":[89],"Our":[90],"key":[91],"insight":[92],"is":[93],"forcing":[94],"policy":[97],"be":[99],"repulsive":[102,152],"near":[103],"boundaries":[106],"system,":[114],"providing":[115],"guarantees":[116],"that":[117,136,158,209],"trajectories":[119],"will":[120],"not":[121],"violate":[122],"constraint.":[124,165],"We":[125,166,180],"further":[126],"account":[127],"violation":[130],"occur":[137],"impacts":[140],"maps":[143],"by":[148],"introducing":[149],"a":[150],"second":[151],"region":[154],"before":[155],"prevents":[159],"post-reset":[160],"states":[161],"from":[162],"violating":[163],"derive":[167],"sufficient":[168],"conditions":[169],"under":[170],"these":[172],"loop.":[179],"also":[181],"compare":[182],"our":[183,210],"approach":[184],"state-of-the-art":[186],"shaping":[188],"learned-CBF":[190],"methods":[191],"constrained":[198],"pendulum":[199],"paddle":[201],"juggler":[202],"environments.":[203],"both":[205],"scenarios,":[206],"show":[208],"methodology":[211],"learns":[212],"higher":[213],"quality":[214],"while":[216],"always":[217],"satisfying":[218],"constraints.":[221]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-28T00:00:00"}
