{"id":"https://openalex.org/W4363671540","doi":"https://doi.org/10.1145/3575870.3587117","title":"Interval Markov Decision Processes with Continuous Action-Spaces","display_name":"Interval Markov Decision Processes with Continuous Action-Spaces","publication_year":2023,"publication_date":"2023-05-08","ids":{"openalex":"https://openalex.org/W4363671540","doi":"https://doi.org/10.1145/3575870.3587117"},"language":"en","primary_location":{"id":"doi:10.1145/3575870.3587117","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3575870.3587117","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3575870.3587117","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 26th ACM International Conference on Hybrid Systems: Computation and Control","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3575870.3587117","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5013980490","display_name":"Giannis Delimpaltadakis","orcid":"https://orcid.org/0000-0002-2651-0629"},"institutions":[{"id":"https://openalex.org/I83019370","display_name":"Eindhoven University of Technology","ror":"https://ror.org/02c2kyt77","country_code":"NL","type":"education","lineage":["https://openalex.org/I83019370"]}],"countries":["NL"],"is_corresponding":true,"raw_author_name":"Giannis Delimpaltadakis","raw_affiliation_strings":["Control Systems Technology Group, Mechanical Engineering, Eindhoven University of Technology, Netherlands"],"affiliations":[{"raw_affiliation_string":"Control Systems Technology Group, Mechanical Engineering, Eindhoven University of Technology, Netherlands","institution_ids":["https://openalex.org/I83019370"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069564559","display_name":"Morteza Lahijanian","orcid":"https://orcid.org/0000-0001-7549-4365"},"institutions":[{"id":"https://openalex.org/I188538660","display_name":"University of Colorado Boulder","ror":"https://ror.org/02ttsq026","country_code":"US","type":"education","lineage":["https://openalex.org/I188538660"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Morteza Lahijanian","raw_affiliation_strings":["Aerospace Engineering Sciences, University of Colorado Boulder, USA"],"affiliations":[{"raw_affiliation_string":"Aerospace Engineering Sciences, University of Colorado Boulder, USA","institution_ids":["https://openalex.org/I188538660"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019241546","display_name":"Manuel Mazo","orcid":"https://orcid.org/0000-0002-5638-5283"},"institutions":[{"id":"https://openalex.org/I98358874","display_name":"Delft University of Technology","ror":"https://ror.org/02e2c7k09","country_code":"NL","type":"education","lineage":["https://openalex.org/I98358874"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Manuel Mazo Jr.","raw_affiliation_strings":["Delft Center for Systems and Control, Delft University of Technology, Netherlands"],"affiliations":[{"raw_affiliation_string":"Delft Center for Systems and Control, Delft University of Technology, Netherlands","institution_ids":["https://openalex.org/I98358874"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5009660282","display_name":"Luca Laurenti","orcid":"https://orcid.org/0000-0003-1190-6097"},"institutions":[{"id":"https://openalex.org/I98358874","display_name":"Delft University of Technology","ror":"https://ror.org/02e2c7k09","country_code":"NL","type":"education","lineage":["https://openalex.org/I98358874"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Luca Laurenti","raw_affiliation_strings":["Delft Center for Systems and Control, Delft University of Technology, Netherlands"],"affiliations":[{"raw_affiliation_string":"Delft Center for Systems and Control, Delft University of Technology, Netherlands","institution_ids":["https://openalex.org/I98358874"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5013980490"],"corresponding_institution_ids":["https://openalex.org/I83019370"],"apc_list":null,"apc_paid":null,"fwci":1.9662,"has_fulltext":true,"cited_by_count":10,"citation_normalized_percentile":{"value":0.88079119,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"10"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10142","display_name":"Formal Methods in Verification","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10142","display_name":"Formal Methods in Verification","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11125","display_name":"Petri Nets in System Modeling","score":0.9970999956130981,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10933","display_name":"Real-Time Systems Scheduling","score":0.9915000200271606,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/markov-decision-process","display_name":"Markov decision process","score":0.594662070274353},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.5674776434898376},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5591835379600525},{"id":"https://openalex.org/keywords/markov-process","display_name":"Markov process","score":0.5288366079330444},{"id":"https://openalex.org/keywords/interval","display_name":"Interval (graph theory)","score":0.5273657441139221},{"id":"https://openalex.org/keywords/markov-chain","display_name":"Markov chain","score":0.43870651721954346},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.2632777690887451},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.15008464455604553},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.13050946593284607},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.07816421985626221},{"id":"https://openalex.org/keywords/combinatorics","display_name":"Combinatorics","score":0.06783115863800049}],"concepts":[{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.594662070274353},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.5674776434898376},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5591835379600525},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.5288366079330444},{"id":"https://openalex.org/C2778067643","wikidata":"https://www.wikidata.org/wiki/Q166507","display_name":"Interval (graph theory)","level":2,"score":0.5273657441139221},{"id":"https://openalex.org/C98763669","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov chain","level":2,"score":0.43870651721954346},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2632777690887451},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.15008464455604553},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.13050946593284607},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.07816421985626221},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.06783115863800049},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1145/3575870.3587117","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3575870.3587117","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3575870.3587117","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 26th ACM International Conference on Hybrid Systems: Computation and Control","raw_type":"proceedings-article"},{"id":"pmh:oai:pure.tue.nl:openaire_cris_publications/4ecf616d-7322-43bb-9d33-d7f6a422a7c4","is_oa":true,"landing_page_url":"https://research.tue.nl/en/publications/4ecf616d-7322-43bb-9d33-d7f6a422a7c4","pdf_url":"https://pure.tue.nl/ws/files/307259073/3575870.3587117.pdf","source":{"id":"https://openalex.org/S4406922641","display_name":"TU/e Research Portal","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Delimpaltadakis, G, Lahijanian, M, Mazo, M & Laurenti, L 2023, Interval Markov Decision Processes with Continuous Action-Spaces. in HSCC 2023 : Proceedings of the 26th ACM International Conference on Hybrid Systems: Computation and Control., 12, Association for Computing Machinery, Inc., New York, pp. 1-10, 26th ACM International Conference on Hybrid Systems: Computation and Control, HSCC 2023, Part of CPS-IoT Week 2023, San Antonio, United States, 9/05/23. https://doi.org/10.1145/3575870.3587117","raw_type":"info:eu-repo/semantics/publishedVersion"},{"id":"pmh:oai:tudelft.nl:uuid:814b2ec0-11a1-4080-a782-c43d100ab130","is_oa":true,"landing_page_url":"http://resolver.tudelft.nl/uuid:814b2ec0-11a1-4080-a782-c43d100ab130","pdf_url":null,"source":{"id":"https://openalex.org/S4306400906","display_name":"Research Repository (Delft University of Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I98358874","host_organization_name":"Delft University of Technology","host_organization_lineage":["https://openalex.org/I98358874"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"conference paper"}],"best_oa_location":{"id":"doi:10.1145/3575870.3587117","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3575870.3587117","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3575870.3587117","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 26th ACM International Conference on Hybrid Systems: Computation and Control","raw_type":"proceedings-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions","score":0.7099999785423279}],"awards":[{"id":"https://openalex.org/G6755165505","display_name":null,"funder_award_id":"award","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G7650390553","display_name":null,"funder_award_id":"2039062","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G848032724","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G8986516849","display_name":null,"funder_award_id":"755953","funder_id":"https://openalex.org/F4320334678","funder_display_name":"European Research Council"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320334678","display_name":"European Research Council","ror":"https://ror.org/0472cxd90"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4363671540.pdf","grobid_xml":"https://content.openalex.org/works/W4363671540.grobid-xml"},"referenced_works_count":12,"referenced_works":["https://openalex.org/W1598511836","https://openalex.org/W1965878388","https://openalex.org/W1975219867","https://openalex.org/W1988217924","https://openalex.org/W2000865099","https://openalex.org/W2070501901","https://openalex.org/W2166280160","https://openalex.org/W3002811560","https://openalex.org/W3006987257","https://openalex.org/W3125855560","https://openalex.org/W3141421587","https://openalex.org/W4205437843"],"related_works":["https://openalex.org/W1660242800","https://openalex.org/W2077211377","https://openalex.org/W2379651310","https://openalex.org/W2113019827","https://openalex.org/W1541249122","https://openalex.org/W2413828414","https://openalex.org/W2367222340","https://openalex.org/W187740018","https://openalex.org/W2162286586","https://openalex.org/W4255368532"],"abstract_inverted_index":{"Interval":[0],"Markov":[1,8],"Decision":[2],"Processes":[3],"(IMDPs)":[4],"are":[5,78,170],"finite-state":[6],"uncertain":[7],"models,":[9],"where":[10,72,107,129,154,167],"the":[11,39,50,73,81,96,110,115,119,155,168,171],"transition":[12,76],"probabilities":[13,77],"belong":[14],"to":[15,38,100,103],"intervals.":[16],"Recently,":[17],"there":[18],"has":[19],"been":[20],"a":[21,58,160,164,184,190],"surge":[22],"of":[23,30,41,80,112,114,122,173],"research":[24],"on":[25,75,183,193],"employing":[26,194],"IMDPs":[27,46,70],"as":[28,196],"abstractions":[29,197],"stochastic":[31],"systems":[32],"for":[33,43,61,88,177,198],"control":[34,199],"synthesis.":[35,200],"However,":[36],"due":[37],"absence":[40],"algorithms":[42],"synthesis":[44,162],"over":[45,132,163],"with":[47,139],"continuous":[48],"action-spaces,":[49],"action-space":[51],"is":[52,57,109,159,175],"assumed":[53],"discrete":[54],"a-priori,":[55],"which":[56],"restrictive":[59],"assumption":[60],"many":[62],"applications.":[63],"Motivated":[64],"by":[65],"this,":[66],"we":[67,94,126,188],"introduce":[68],"continuous-action":[69],"(caIMDPs),":[71],"bounds":[74],"functions":[79],"action":[82,156],"variables,":[83],"and":[84],"study":[85],"value":[86,101,130],"iteration":[87,102,131],"maximizing":[89],"expected":[90],"cumulative":[91],"rewards.":[92],"Specifically,":[93],"decompose":[95],"max-min":[97],"problem":[98],"associated":[99],"|\ud835\udcac|":[104,108],"max":[105,124],"problems,":[106,125],"number":[111],"states":[113],"caIMDP.":[116],"Then,":[117],"exploiting":[118],"simple":[120],"form":[121],"these":[123],"identify":[127],"cases":[128,153],"caIMDPs":[133,195],"can":[134],"be":[135],"solved":[136],"efficiently":[137],"(e.g.,":[138],"linear":[140],"or":[141],"convex":[142],"programming).":[143],"We":[144,179],"also":[145],"gain":[146],"other":[147],"interesting":[148],"insights:":[149],"e.g.,":[150],"in":[151],"certain":[152],"set":[157],"\ud835\udc9c":[158],"polytope,":[161],"discrete-action":[165],"IMDP,":[166],"actions":[169],"vertices":[172],"\ud835\udc9c,":[174],"sufficient":[176],"optimality.":[178],"demonstrate":[180],"our":[181],"results":[182],"numerical":[185],"example.":[186],"Finally,":[187],"include":[189],"short":[191],"discussion":[192]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":3}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
