{"id":"https://openalex.org/W2895196950","doi":"https://doi.org/10.1007/978-3-030-17462-0_27","title":"Omega-Regular Objectives in Model-Free Reinforcement Learning","display_name":"Omega-Regular Objectives in Model-Free Reinforcement Learning","publication_year":2019,"publication_date":"2019-01-01","ids":{"openalex":"https://openalex.org/W2895196950","doi":"https://doi.org/10.1007/978-3-030-17462-0_27","mag":"2895196950"},"language":"en","primary_location":{"id":"doi:10.1007/978-3-030-17462-0_27","is_oa":true,"landing_page_url":"https://doi.org/10.1007/978-3-030-17462-0_27","pdf_url":"https://link.springer.com/content/pdf/10.1007%2F978-3-030-17462-0_27.pdf","source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007%2F978-3-030-17462-0_27.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5030417706","display_name":"Ernst Moritz Hahn","orcid":"https://orcid.org/0000-0002-9348-7684"},"institutions":[{"id":"https://openalex.org/I126231945","display_name":"Queen's University Belfast","ror":"https://ror.org/00hswnk62","country_code":"GB","type":"education","lineage":["https://openalex.org/I126231945"]},{"id":"https://openalex.org/I4210128818","display_name":"Institute of Software","ror":"https://ror.org/033dfsn42","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210128818"]}],"countries":["CN","GB"],"is_corresponding":false,"raw_author_name":"Ernst Moritz Hahn","raw_affiliation_strings":["School of EEECS, Queen\u2019s University Belfast, Belfast, UK","State Key Laboratory of Computer Science, Institute of Software, CAS, Beijing, People\u2019s Republic of China","School of EEECS, Queen's University Belfast, Belfast, UK"],"affiliations":[{"raw_affiliation_string":"School of EEECS, Queen\u2019s University Belfast, Belfast, UK","institution_ids":["https://openalex.org/I126231945"]},{"raw_affiliation_string":"State Key Laboratory of Computer Science, Institute of Software, CAS, Beijing, People\u2019s Republic of China","institution_ids":["https://openalex.org/I4210128818"]},{"raw_affiliation_string":"School of EEECS, Queen's University Belfast, Belfast, UK","institution_ids":["https://openalex.org/I126231945"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084221298","display_name":"Mateo Perez","orcid":"https://orcid.org/0000-0003-4220-3212"},"institutions":[{"id":"https://openalex.org/I188538660","display_name":"University of Colorado Boulder","ror":"https://ror.org/02ttsq026","country_code":"US","type":"education","lineage":["https://openalex.org/I188538660"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mateo Perez","raw_affiliation_strings":["Department of ECEE, University of Colorado Boulder, Boulder, USA"],"affiliations":[{"raw_affiliation_string":"Department of ECEE, University of Colorado Boulder, Boulder, USA","institution_ids":["https://openalex.org/I188538660"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041836791","display_name":"Sven Schewe","orcid":"https://orcid.org/0000-0002-9093-9518"},"institutions":[{"id":"https://openalex.org/I146655781","display_name":"University of Liverpool","ror":"https://ror.org/04xs57h96","country_code":"GB","type":"education","lineage":["https://openalex.org/I146655781"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Sven Schewe","raw_affiliation_strings":["Department of Computer Science, University of Liverpool, Liverpool, UK"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Liverpool, Liverpool, UK","institution_ids":["https://openalex.org/I146655781"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077549627","display_name":"Fabio Somenzi","orcid":"https://orcid.org/0000-0002-2085-2003"},"institutions":[{"id":"https://openalex.org/I188538660","display_name":"University of Colorado Boulder","ror":"https://ror.org/02ttsq026","country_code":"US","type":"education","lineage":["https://openalex.org/I188538660"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Fabio Somenzi","raw_affiliation_strings":["Department of ECEE, University of Colorado Boulder, Boulder, USA"],"affiliations":[{"raw_affiliation_string":"Department of ECEE, University of Colorado Boulder, Boulder, USA","institution_ids":["https://openalex.org/I188538660"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020302140","display_name":"Ashutosh Trivedi","orcid":"https://orcid.org/0000-0001-9346-0126"},"institutions":[{"id":"https://openalex.org/I188538660","display_name":"University of Colorado Boulder","ror":"https://ror.org/02ttsq026","country_code":"US","type":"education","lineage":["https://openalex.org/I188538660"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Ashutosh Trivedi","raw_affiliation_strings":["Department of Computer Science, University of Colorado Boulder, Boulder, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Colorado Boulder, Boulder, USA","institution_ids":["https://openalex.org/I188538660"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5001234060","display_name":"Dominik Wojtczak","orcid":"https://orcid.org/0000-0001-5560-0546"},"institutions":[{"id":"https://openalex.org/I146655781","display_name":"University of Liverpool","ror":"https://ror.org/04xs57h96","country_code":"GB","type":"education","lineage":["https://openalex.org/I146655781"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Dominik Wojtczak","raw_affiliation_strings":["Department of Computer Science, University of Liverpool, Liverpool, UK"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Liverpool, Liverpool, UK","institution_ids":["https://openalex.org/I146655781"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5020302140"],"corresponding_institution_ids":["https://openalex.org/I188538660"],"apc_list":{"value":5000,"currency":"EUR","value_usd":5392},"apc_paid":{"value":5000,"currency":"EUR","value_usd":5392},"fwci":37.1704,"has_fulltext":true,"cited_by_count":117,"citation_normalized_percentile":{"value":0.99891634,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"395","last_page":"412"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10142","display_name":"Formal Methods in Verification","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10142","display_name":"Formal Methods in Verification","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.9873999953269958,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10743","display_name":"Software Testing and Debugging Techniques","score":0.9846000075340271,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8472685813903809},{"id":"https://openalex.org/keywords/reachability","display_name":"Reachability","score":0.7329091429710388},{"id":"https://openalex.org/keywords/markov-decision-process","display_name":"Markov decision process","score":0.6451877951622009},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6281360983848572},{"id":"https://openalex.org/keywords/omega","display_name":"Omega","score":0.570319414138794},{"id":"https://openalex.org/keywords/constructive","display_name":"Constructive","score":0.5447379946708679},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5399112701416016},{"id":"https://openalex.org/keywords/learning-automata","display_name":"Learning automata","score":0.4324547052383423},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.41167712211608887},{"id":"https://openalex.org/keywords/limit","display_name":"Limit (mathematics)","score":0.4109310209751129},{"id":"https://openalex.org/keywords/automaton","display_name":"Automaton","score":0.40761592984199524},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.3624923825263977},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3410126566886902},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.32608848810195923},{"id":"https://openalex.org/keywords/markov-process","display_name":"Markov process","score":0.322066068649292},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.07347780466079712},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.06440672278404236}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8472685813903809},{"id":"https://openalex.org/C136643341","wikidata":"https://www.wikidata.org/wiki/Q1361526","display_name":"Reachability","level":2,"score":0.7329091429710388},{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.6451877951622009},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6281360983848572},{"id":"https://openalex.org/C2779557605","wikidata":"https://www.wikidata.org/wiki/Q9890","display_name":"Omega","level":2,"score":0.570319414138794},{"id":"https://openalex.org/C2778701210","wikidata":"https://www.wikidata.org/wiki/Q28130034","display_name":"Constructive","level":3,"score":0.5447379946708679},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5399112701416016},{"id":"https://openalex.org/C2776807809","wikidata":"https://www.wikidata.org/wiki/Q6510160","display_name":"Learning automata","level":3,"score":0.4324547052383423},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.41167712211608887},{"id":"https://openalex.org/C151201525","wikidata":"https://www.wikidata.org/wiki/Q177239","display_name":"Limit (mathematics)","level":2,"score":0.4109310209751129},{"id":"https://openalex.org/C112505250","wikidata":"https://www.wikidata.org/wiki/Q787116","display_name":"Automaton","level":2,"score":0.40761592984199524},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3624923825263977},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3410126566886902},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.32608848810195923},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.322066068649292},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.07347780466079712},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.06440672278404236},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1007/978-3-030-17462-0_27","is_oa":true,"landing_page_url":"https://doi.org/10.1007/978-3-030-17462-0_27","pdf_url":"https://link.springer.com/content/pdf/10.1007%2F978-3-030-17462-0_27.pdf","source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"},{"id":"pmh:oai:ris.utwente.nl:openaire/653473f3-e6d1-479c-afe3-0a8217513e4d","is_oa":true,"landing_page_url":"https://research.utwente.nl/en/publications/653473f3-e6d1-479c-afe3-0a8217513e4d","pdf_url":null,"source":{"id":"https://openalex.org/S4406922991","display_name":"University of Twente Research Information","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Hahn, E M, Perez, M, Schewe, S, Somenzi, F, Trivedi, A, Trivedi, A & Wojtczak, D 2019, Omega-Regular Objectives in Model-Free Reinforcement Learning. in T Vojnar & L Zhang (eds), Tools and Algorithms for the Construction and Analysis of Systems : 25th International Conference, TACAS 2019, Held as Part of the European Joint Conferences on Theory and Practice of Software, ETAPS 2019, Prague, Czech Republic, April 6\u201311, 2019, Proceedings. vol. Part I, Lecture Notes in Computer Science, vol. 11427, Springer, Cham, pp. 395-412, 25th International Conference on Tools and Algorithms for the Construction and Analysis of Systems conference series, TACAS 2019 , Prague, Czech Republic, 6/04/19. https://doi.org/10.1007/978-3-030-17462-0_27","raw_type":"info:eu-repo/semantics/publishedVersion"},{"id":"pmh:oai:pure.qub.ac.uk/portal:publications/ca9e42da-37ec-4352-818f-7fbd8f62c5f9","is_oa":true,"landing_page_url":"https://pure.qub.ac.uk/en/publications/ca9e42da-37ec-4352-818f-7fbd8f62c5f9","pdf_url":"https://pureadmin.qub.ac.uk/ws/files/188308185/Hahn2019_Chapter_Omega_RegularObjectivesInModel.pdf","source":{"id":"https://openalex.org/S4306402319","display_name":"Research Portal (Queen's University Belfast)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I126231945","host_organization_name":"Queen's University Belfast","host_organization_lineage":["https://openalex.org/I126231945"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Hahn, E M, Perez, M, Schewe, S, Somenzi, F, Trivedi, A & Liverpool, U 2019, Omega-Regular Objectives in Model-Free Reinforcement Learning. in TACAS: International Conference on Tools and Algorithms for the Construction and Analysis of Systems. vol. 11427, Lecture Notes in Computer Science, vol. 11427, Springer Lecture Notes in Computer Science (LNCS), pp. 395-412. https://doi.org/10.1007/978-3-030-17462-0_27","raw_type":"info:eu-repo/semantics/conferenceObject"},{"id":"pmh:oai:ris.utwente.nl:publications/653473f3-e6d1-479c-afe3-0a8217513e4d","is_oa":false,"landing_page_url":null,"pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":""}],"best_oa_location":{"id":"doi:10.1007/978-3-030-17462-0_27","is_oa":true,"landing_page_url":"https://doi.org/10.1007/978-3-030-17462-0_27","pdf_url":"https://link.springer.com/content/pdf/10.1007%2F978-3-030-17462-0_27.pdf","source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","score":0.800000011920929,"display_name":"Peace, Justice and strong institutions"}],"awards":[{"id":"https://openalex.org/G1119163446","display_name":null,"funder_award_id":"EP/M027287/1 and EP/P020909/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G1361938442","display_name":null,"funder_award_id":"Fellowship","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G3317480652","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3525752471","display_name":null,"funder_award_id":"617611360","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G391238517","display_name":null,"funder_award_id":", and","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4968910455","display_name":"Solving Parity Games in Theory and Practice","funder_award_id":"EP/P020909/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G6898068357","display_name":null,"funder_award_id":"EP/M027287/1 and EP/P020909/1.","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G6979878578","display_name":null,"funder_award_id":"61761136011","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7457441254","display_name":null,"funder_award_id":"61761136","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7468986614","display_name":null,"funder_award_id":"61532019","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G772980944","display_name":"Energy Efficient Control","funder_award_id":"EP/M027287/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G7815803692","display_name":null,"funder_award_id":"EP/P020909/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G8208342437","display_name":null,"funder_award_id":"1 and","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8525945721","display_name":null,"funder_award_id":"EP/M027287/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G8719353587","display_name":null,"funder_award_id":"EP/P0","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320332538","display_name":"University of Colorado Boulder","ror":"https://ror.org/02ttsq026"},{"id":"https://openalex.org/F4320334627","display_name":"Engineering and Physical Sciences Research Council","ror":"https://ror.org/0439y7842"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2895196950.pdf","grobid_xml":"https://content.openalex.org/works/W2895196950.grobid-xml"},"referenced_works_count":42,"referenced_works":["https://openalex.org/W163688550","https://openalex.org/W166862392","https://openalex.org/W986424706","https://openalex.org/W1498432697","https://openalex.org/W1506588809","https://openalex.org/W1541799124","https://openalex.org/W1545803195","https://openalex.org/W1556387789","https://openalex.org/W1563982778","https://openalex.org/W1862398452","https://openalex.org/W1972203711","https://openalex.org/W1989863177","https://openalex.org/W2020293036","https://openalex.org/W2071659383","https://openalex.org/W2093916942","https://openalex.org/W2101786389","https://openalex.org/W2107209406","https://openalex.org/W2119567691","https://openalex.org/W2121863487","https://openalex.org/W2124339220","https://openalex.org/W2129670787","https://openalex.org/W2145339207","https://openalex.org/W2165161585","https://openalex.org/W2248015474","https://openalex.org/W2257979135","https://openalex.org/W2334782222","https://openalex.org/W2395891450","https://openalex.org/W2487186542","https://openalex.org/W2521432080","https://openalex.org/W2567705466","https://openalex.org/W2784931892","https://openalex.org/W2914702425","https://openalex.org/W2953302092","https://openalex.org/W2962806365","https://openalex.org/W2963778636","https://openalex.org/W2963794592","https://openalex.org/W4214717370","https://openalex.org/W4237456806","https://openalex.org/W4307347247","https://openalex.org/W6757795073","https://openalex.org/W6780559895","https://openalex.org/W7057282354"],"related_works":["https://openalex.org/W1554767603","https://openalex.org/W2130664212","https://openalex.org/W2100426849","https://openalex.org/W4367628379","https://openalex.org/W4382045631","https://openalex.org/W2032445854","https://openalex.org/W2489338148","https://openalex.org/W576785828","https://openalex.org/W1545451257","https://openalex.org/W2613833673"],"abstract_inverted_index":{"We":[0,19,60,106],"provide":[1],"the":[2,25,52,56,72,101,104],"first":[3],"solution":[4],"for":[5,14],"model-free":[6],"reinforcement":[7,93],"learning":[8,43,94,116],"of":[9,28,54,71,103,111],"$$\\omega":[10,29,62],"$$":[11,30,63],"-regular":[12,31,64],"objectives":[13,32],"Markov":[15],"decision":[16],"processes":[17],"(MDPs).":[18],"present":[20,107],"a":[21],"constructive":[22],"reduction":[23],"from":[24,100],"almost-sure":[26,35],"satisfaction":[27],"to":[33,42,45,89,96],"an":[34,47,108],"reachability":[36],"problem,":[37],"and":[38],"extend":[39],"this":[40,76],"technique":[41,113],"how":[44],"control":[46],"unknown":[48],"model":[49],"so":[50],"that":[51,80],"chance":[53],"satisfying":[55],"objective":[57],"is":[58],"maximized.":[59],"compile":[61],"properties":[65],"into":[66],"limit-deterministic":[67],"B\u00fcchi":[68],"automata":[69],"instead":[70],"traditional":[73],"Rabin":[74],"automata;":[75],"choice":[77],"sidesteps":[78],"difficulties":[79],"have":[81],"marred":[82],"previous":[83],"proposals.":[84],"Our":[85],"approach":[86],"allows":[87],"us":[88],"apply":[90],"model-free,":[91],"off-the-shelf":[92],"algorithms":[95],"compute":[97],"optimal":[98],"strategies":[99],"observations":[102],"MDP.":[105],"experimental":[109],"evaluation":[110],"our":[112],"on":[114],"benchmark":[115],"problems.":[117]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":12},{"year":2023,"cited_by_count":23},{"year":2022,"cited_by_count":17},{"year":2021,"cited_by_count":31},{"year":2020,"cited_by_count":21},{"year":2019,"cited_by_count":7},{"year":2018,"cited_by_count":1}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
