{"id":"https://openalex.org/W4409979384","doi":"https://doi.org/10.1007/978-3-031-90900-9_7","title":"Symbolic State Partitioning for Reinforcement Learning","display_name":"Symbolic State Partitioning for Reinforcement Learning","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4409979384","doi":"https://doi.org/10.1007/978-3-031-90900-9_7"},"language":"en","primary_location":{"id":"doi:10.1007/978-3-031-90900-9_7","is_oa":true,"landing_page_url":"https://doi.org/10.1007/978-3-031-90900-9_7","pdf_url":"https://link.springer.com/content/pdf/10.1007/978-3-031-90900-9_7.pdf","source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/978-3-031-90900-9_7.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5088284921","display_name":"Mohsen Ghaffari","orcid":"https://orcid.org/0000-0002-1939-9053"},"institutions":[{"id":"https://openalex.org/I83467386","display_name":"IT University of Copenhagen","ror":"https://ror.org/02309jg23","country_code":"DK","type":"education","lineage":["https://openalex.org/I83467386"]}],"countries":["DK"],"is_corresponding":true,"raw_author_name":"Mohsen Ghaffari","raw_affiliation_strings":["ITU, Copenhagen, Denmark"],"raw_orcid":"https://orcid.org/0000-0002-1939-9053","affiliations":[{"raw_affiliation_string":"ITU, Copenhagen, Denmark","institution_ids":["https://openalex.org/I83467386"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036805687","display_name":"Mahsa Varshosaz","orcid":"https://orcid.org/0000-0002-4776-883X"},"institutions":[{"id":"https://openalex.org/I83467386","display_name":"IT University of Copenhagen","ror":"https://ror.org/02309jg23","country_code":"DK","type":"education","lineage":["https://openalex.org/I83467386"]}],"countries":["DK"],"is_corresponding":false,"raw_author_name":"Mahsa Varshosaz","raw_affiliation_strings":["ITU, Copenhagen, Denmark"],"raw_orcid":"https://orcid.org/0000-0002-4776-883X","affiliations":[{"raw_affiliation_string":"ITU, Copenhagen, Denmark","institution_ids":["https://openalex.org/I83467386"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039414480","display_name":"Einar Broch Johnsen","orcid":"https://orcid.org/0000-0001-5382-3949"},"institutions":[{"id":"https://openalex.org/I184942183","display_name":"University of Oslo","ror":"https://ror.org/01xtthb56","country_code":"NO","type":"education","lineage":["https://openalex.org/I184942183"]}],"countries":["NO"],"is_corresponding":false,"raw_author_name":"Einar Broch Johnsen","raw_affiliation_strings":["University of Oslo, Oslo, Norway"],"raw_orcid":"https://orcid.org/0000-0001-5382-3949","affiliations":[{"raw_affiliation_string":"University of Oslo, Oslo, Norway","institution_ids":["https://openalex.org/I184942183"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5056755949","display_name":"Andrzej W\u0105sowski","orcid":"https://orcid.org/0000-0003-0532-2685"},"institutions":[{"id":"https://openalex.org/I83467386","display_name":"IT University of Copenhagen","ror":"https://ror.org/02309jg23","country_code":"DK","type":"education","lineage":["https://openalex.org/I83467386"]}],"countries":["DK"],"is_corresponding":false,"raw_author_name":"Andrzej W\u0105sowski","raw_affiliation_strings":["ITU, Copenhagen, Denmark"],"raw_orcid":"https://orcid.org/0000-0003-0532-2685","affiliations":[{"raw_affiliation_string":"ITU, Copenhagen, Denmark","institution_ids":["https://openalex.org/I83467386"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5088284921"],"corresponding_institution_ids":["https://openalex.org/I83467386"],"apc_list":{"value":5000,"currency":"EUR","value_usd":5392},"apc_paid":{"value":5000,"currency":"EUR","value_usd":5392},"fwci":4.1459,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.9135568,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"122","last_page":"144"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11975","display_name":"Evolutionary Algorithms and Applications","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12784","display_name":"Modular Robots and Swarm Intelligence","score":0.9944999814033508,"subfield":{"id":"https://openalex.org/subfields/2210","display_name":"Mechanical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8583450317382812},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7360036969184875},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4611288607120514},{"id":"https://openalex.org/keywords/state","display_name":"State (computer science)","score":0.45668211579322815},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.40647679567337036},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.32438671588897705}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8583450317382812},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7360036969184875},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4611288607120514},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.45668211579322815},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.40647679567337036},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.32438671588897705}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/978-3-031-90900-9_7","is_oa":true,"landing_page_url":"https://doi.org/10.1007/978-3-031-90900-9_7","pdf_url":"https://link.springer.com/content/pdf/10.1007/978-3-031-90900-9_7.pdf","source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"}],"best_oa_location":{"id":"doi:10.1007/978-3-031-90900-9_7","is_oa":true,"landing_page_url":"https://doi.org/10.1007/978-3-031-90900-9_7","pdf_url":"https://link.springer.com/content/pdf/10.1007/978-3-031-90900-9_7.pdf","source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320313796","display_name":"Innovationsfonden","ror":"https://ror.org/00daj4111"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4409979384.pdf","grobid_xml":"https://content.openalex.org/works/W4409979384.grobid-xml"},"referenced_works_count":44,"referenced_works":["https://openalex.org/W111328409","https://openalex.org/W113028485","https://openalex.org/W1480909796","https://openalex.org/W1977655452","https://openalex.org/W1989407213","https://openalex.org/W1992094515","https://openalex.org/W1995688924","https://openalex.org/W1998768278","https://openalex.org/W2012997183","https://openalex.org/W2047184747","https://openalex.org/W2061686717","https://openalex.org/W2078727257","https://openalex.org/W2078988604","https://openalex.org/W2084838588","https://openalex.org/W2101512909","https://openalex.org/W2142484475","https://openalex.org/W2161290831","https://openalex.org/W2166280160","https://openalex.org/W2565255124","https://openalex.org/W2787908307","https://openalex.org/W2888752104","https://openalex.org/W2899685447","https://openalex.org/W2911169848","https://openalex.org/W2949019968","https://openalex.org/W2980176594","https://openalex.org/W2981739602","https://openalex.org/W2982316166","https://openalex.org/W2998004401","https://openalex.org/W3082925502","https://openalex.org/W3114989226","https://openalex.org/W3132151609","https://openalex.org/W3185816745","https://openalex.org/W3186158026","https://openalex.org/W3216656735","https://openalex.org/W4285022787","https://openalex.org/W4290087551","https://openalex.org/W4313145652","https://openalex.org/W4366967222","https://openalex.org/W4385301039","https://openalex.org/W4386317039","https://openalex.org/W4386746422","https://openalex.org/W6601339314","https://openalex.org/W6629075127","https://openalex.org/W6814003322"],"related_works":["https://openalex.org/W4306904969","https://openalex.org/W2138720691","https://openalex.org/W4362501864","https://openalex.org/W4380318855","https://openalex.org/W3084456289","https://openalex.org/W2024136090","https://openalex.org/W4391331176","https://openalex.org/W2031695474","https://openalex.org/W2586732548","https://openalex.org/W2964765435"],"abstract_inverted_index":{"Abstract":[0],"Tabular":[1],"reinforcement":[2,114],"learning":[3,29,39,115,133],"methods":[4],"cannot":[5],"operate":[6],"directly":[7],"on":[8],"continuous":[9],"state":[10,21,63,81,104,125,137],"spaces.":[11],"One":[12],"solution":[13],"to":[14,18,109,116,130],"this":[15],"problem":[16],"is":[17,53],"partition":[19,67],"the":[20,38,57,76,80,84,92,141],"space.":[22],"A":[23],"good":[24],"partitioning":[25,49,102,127],"enables":[26],"generalization":[27],"during":[28],"and":[30,43,112,136],"more":[31,45],"efficient":[32],"exploitation":[33],"of":[34,59,79],"prior":[35],"experiences.":[36],"Consequently,":[37],"process":[40],"becomes":[41],"faster":[42],"produces":[44],"reliable":[46],"policies.":[47,143],"However,":[48],"introduces":[50],"approximation,":[51],"which":[52],"particularly":[54],"harmful":[55],"in":[56],"presence":[58],"nonlinear":[60],"relations":[61],"between":[62],"components.":[64],"An":[65],"ideal":[66],"should":[68],"be":[69],"as":[70,72],"coarse":[71],"possible,":[73],"while":[74],"capturing":[75],"key":[77],"structure":[78],"space":[82,105,126,138],"for":[83,119,140],"given":[85],"problem.":[86],"This":[87],"work":[88],"extracts":[89],"partitions":[90],"from":[91],"environment":[93],"dynamics":[94],"by":[95],"symbolic":[96,101,124],"execution.":[97],"We":[98,122],"show":[99],"that":[100],"improves":[103],"coverage":[106,139],"with":[107,128],"respect":[108,129],"environmental":[110],"behavior":[111],"allows":[113],"perform":[117],"better":[118],"sparse":[120],"rewards.":[121],"evaluate":[123],"precision,":[131],"scalability,":[132],"agent":[134],"performance":[135],"learned":[142]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
