{"id":"https://openalex.org/W4382319487","doi":"https://doi.org/10.1093/logcom/exad032","title":"Extension of constraint-procedural logic-generated environments for deep Q-learning agent training and benchmarking","display_name":"Extension of constraint-procedural logic-generated environments for deep Q-learning agent training and benchmarking","publication_year":2023,"publication_date":"2023-06-07","ids":{"openalex":"https://openalex.org/W4382319487","doi":"https://doi.org/10.1093/logcom/exad032"},"language":"en","primary_location":{"id":"doi:10.1093/logcom/exad032","is_oa":false,"landing_page_url":"https://doi.org/10.1093/logcom/exad032","pdf_url":null,"source":{"id":"https://openalex.org/S47057106","display_name":"Journal of Logic and Computation","issn_l":"0955-792X","issn":["0955-792X","1465-363X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311648","host_organization_name":"Oxford University Press","host_organization_lineage":["https://openalex.org/P4310311648","https://openalex.org/P4310311647"],"host_organization_lineage_names":["Oxford University Press","University of Oxford"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Logic and Computation","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5023765348","display_name":"Giovanni De Gasperis","orcid":"https://orcid.org/0000-0001-9521-4711"},"institutions":[{"id":"https://openalex.org/I26415053","display_name":"University of L'Aquila","ror":"https://ror.org/01j9p1r26","country_code":"IT","type":"education","lineage":["https://openalex.org/I26415053"]}],"countries":["IT"],"is_corresponding":true,"raw_author_name":"Giovanni De Gasperis","raw_affiliation_strings":["Department of Information Engineering, Computer Science and Mathematics, University of L\u2019Aquila , Via Vetoio, L\u2019Aquila, 67100, Italy"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Information Engineering, Computer Science and Mathematics, University of L\u2019Aquila , Via Vetoio, L\u2019Aquila, 67100, Italy","institution_ids":["https://openalex.org/I26415053"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021862093","display_name":"Stefania Costantini","orcid":"https://orcid.org/0000-0002-5686-6124"},"institutions":[{"id":"https://openalex.org/I26415053","display_name":"University of L'Aquila","ror":"https://ror.org/01j9p1r26","country_code":"IT","type":"education","lineage":["https://openalex.org/I26415053"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Stefania Costantini","raw_affiliation_strings":["Department of Information Engineering, Computer Science and Mathematics, University of L\u2019Aquila , Via Vetoio, L\u2019Aquila, 67100, Italy"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Information Engineering, Computer Science and Mathematics, University of L\u2019Aquila , Via Vetoio, L\u2019Aquila, 67100, Italy","institution_ids":["https://openalex.org/I26415053"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5092123219","display_name":"Andrea Rafanelli","orcid":"https://orcid.org/0000-0001-8626-2121"},"institutions":[{"id":"https://openalex.org/I108290504","display_name":"University of Pisa","ror":"https://ror.org/03ad39j10","country_code":"IT","type":"education","lineage":["https://openalex.org/I108290504"]},{"id":"https://openalex.org/I26415053","display_name":"University of L'Aquila","ror":"https://ror.org/01j9p1r26","country_code":"IT","type":"education","lineage":["https://openalex.org/I26415053"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Andrea Rafanelli","raw_affiliation_strings":["Department of Information Engineering, Computer Science and Mathematics, University of L\u2019Aquila , Via Vetoio, L\u2019Aquila, 67100, Italy, Department of Computer Science, University of Pisa, Largo B. Pontecorvo, Pisa, 57127, Italy"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Information Engineering, Computer Science and Mathematics, University of L\u2019Aquila , Via Vetoio, L\u2019Aquila, 67100, Italy, Department of Computer Science, University of Pisa, Largo B. Pontecorvo, Pisa, 57127, Italy","institution_ids":["https://openalex.org/I26415053","https://openalex.org/I108290504"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058247188","display_name":"Patrizio Migliarini","orcid":"https://orcid.org/0000-0002-7824-529X"},"institutions":[{"id":"https://openalex.org/I26415053","display_name":"University of L'Aquila","ror":"https://ror.org/01j9p1r26","country_code":"IT","type":"education","lineage":["https://openalex.org/I26415053"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Patrizio Migliarini","raw_affiliation_strings":["Department of Information Engineering, Computer Science and Mathematics, University of L\u2019Aquila , Via Vetoio, L\u2019Aquila, 67100, Italy"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Information Engineering, Computer Science and Mathematics, University of L\u2019Aquila , Via Vetoio, L\u2019Aquila, 67100, Italy","institution_ids":["https://openalex.org/I26415053"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014004028","display_name":"Ivan Letteri","orcid":"https://orcid.org/0000-0002-3843-386X"},"institutions":[{"id":"https://openalex.org/I26415053","display_name":"University of L'Aquila","ror":"https://ror.org/01j9p1r26","country_code":"IT","type":"education","lineage":["https://openalex.org/I26415053"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Ivan Letteri","raw_affiliation_strings":["Department of Information Engineering, Computer Science and Mathematics, University of L\u2019Aquila , Via Vetoio, L\u2019Aquila, 67100, Italy"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Information Engineering, Computer Science and Mathematics, University of L\u2019Aquila , Via Vetoio, L\u2019Aquila, 67100, Italy","institution_ids":["https://openalex.org/I26415053"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5012714475","display_name":"Abeer Dyoub","orcid":"https://orcid.org/0000-0003-0329-2419"},"institutions":[{"id":"https://openalex.org/I26415053","display_name":"University of L'Aquila","ror":"https://ror.org/01j9p1r26","country_code":"IT","type":"education","lineage":["https://openalex.org/I26415053"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Abeer Dyoub","raw_affiliation_strings":["Department of Information Engineering, Computer Science and Mathematics, University of L\u2019Aquila , Via Vetoio, L\u2019Aquila, 67100, Italy"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Information Engineering, Computer Science and Mathematics, University of L\u2019Aquila , Via Vetoio, L\u2019Aquila, 67100, Italy","institution_ids":["https://openalex.org/I26415053"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5023765348"],"corresponding_institution_ids":["https://openalex.org/I26415053"],"apc_list":{"value":4151,"currency":"USD","value_usd":4151},"apc_paid":null,"fwci":0.6627,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.74548863,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":"33","issue":"8","first_page":"1712","last_page":"1733"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9933000206947327,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9933000206947327,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9902999997138977,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12808","display_name":"Ferroelectric and Negative Capacitance Devices","score":0.9693999886512756,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7776898741722107},{"id":"https://openalex.org/keywords/python","display_name":"Python (programming language)","score":0.5836416482925415},{"id":"https://openalex.org/keywords/component","display_name":"Component (thermodynamics)","score":0.5723717212677002},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5717292428016663},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.5648173093795776},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.5267089009284973},{"id":"https://openalex.org/keywords/constraint-programming","display_name":"Constraint programming","score":0.45139405131340027},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.430713415145874},{"id":"https://openalex.org/keywords/prolog","display_name":"Prolog","score":0.4138683080673218},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4107740521430969},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.37378454208374023},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.34292152523994446}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7776898741722107},{"id":"https://openalex.org/C519991488","wikidata":"https://www.wikidata.org/wiki/Q28865","display_name":"Python (programming language)","level":2,"score":0.5836416482925415},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.5723717212677002},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5717292428016663},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.5648173093795776},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.5267089009284973},{"id":"https://openalex.org/C173404611","wikidata":"https://www.wikidata.org/wiki/Q528588","display_name":"Constraint programming","level":3,"score":0.45139405131340027},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.430713415145874},{"id":"https://openalex.org/C81721847","wikidata":"https://www.wikidata.org/wiki/Q163468","display_name":"Prolog","level":2,"score":0.4138683080673218},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4107740521430969},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.37378454208374023},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.34292152523994446},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C137631369","wikidata":"https://www.wikidata.org/wiki/Q7617831","display_name":"Stochastic programming","level":2,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C97355855","wikidata":"https://www.wikidata.org/wiki/Q11473","display_name":"Thermodynamics","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1093/logcom/exad032","is_oa":false,"landing_page_url":"https://doi.org/10.1093/logcom/exad032","pdf_url":null,"source":{"id":"https://openalex.org/S47057106","display_name":"Journal of Logic and Computation","issn_l":"0955-792X","issn":["0955-792X","1465-363X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311648","host_organization_name":"Oxford University Press","host_organization_lineage":["https://openalex.org/P4310311648","https://openalex.org/P4310311647"],"host_organization_lineage_names":["Oxford University Press","University of Oxford"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Logic and Computation","raw_type":"journal-article"},{"id":"pmh:oai:arpi.unipi.it:11568/1275172","is_oa":false,"landing_page_url":"https://hdl.handle.net/11568/1275172","pdf_url":null,"source":{"id":"https://openalex.org/S4377196265","display_name":"CINECA IRIS Institutial research information system (University of Pisa)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I108290504","host_organization_name":"University of Pisa","host_organization_lineage":["https://openalex.org/I108290504"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":28,"referenced_works":["https://openalex.org/W32403112","https://openalex.org/W1522301498","https://openalex.org/W1549847324","https://openalex.org/W1595483645","https://openalex.org/W1608309740","https://openalex.org/W2060020482","https://openalex.org/W2060498389","https://openalex.org/W2084202433","https://openalex.org/W2152660354","https://openalex.org/W2397253692","https://openalex.org/W2534314849","https://openalex.org/W2540236031","https://openalex.org/W2746553466","https://openalex.org/W2893641169","https://openalex.org/W2895453875","https://openalex.org/W3111135479","https://openalex.org/W3139145500","https://openalex.org/W4233642774","https://openalex.org/W6600075489","https://openalex.org/W6629756183","https://openalex.org/W6629861747","https://openalex.org/W6631190155","https://openalex.org/W6636725810","https://openalex.org/W6678706456","https://openalex.org/W6696816106","https://openalex.org/W6713101361","https://openalex.org/W6730942930","https://openalex.org/W6754957883"],"related_works":["https://openalex.org/W2341492732","https://openalex.org/W3187193180","https://openalex.org/W106542691","https://openalex.org/W1596719193","https://openalex.org/W2365168741","https://openalex.org/W2510050445","https://openalex.org/W2963869083","https://openalex.org/W1591778271","https://openalex.org/W1591583250","https://openalex.org/W2525470665"],"abstract_inverted_index":{"Abstract":[0],"Autonomous":[1],"robots":[2],"can":[3],"be":[4],"employed":[5],"in":[6,72,79,145,174,197,207,249],"exploring":[7],"unknown":[8],"environments":[9,42],"and":[10,56,83,264,279],"performing":[11],"many":[12],"tasks,":[13],"such":[14],"as,":[15],"e.g.":[16],"detecting":[17],"areas":[18],"of":[19,36,52,81,99,107,110,122,138,163,252,268,286],"interest,":[20],"collecting":[21],"target":[22],"objects,":[23],"etc.":[24],"Deep":[25],"reinforcement":[26],"learning":[27],"(RL)":[28],"is":[29,49,60,71,166,280],"often":[30],"used":[31],"to":[32,62,86,114,157,200,216,222,239,261,263,282],"train":[33],"this":[34,100,148],"kind":[35],"robot.":[37],"However,":[38],"concerning":[39],"the":[40,46,88,92,96,105,108,111,120,126,136,164,170,189,208,211,214,241,244,253,259,269,284,287],"artificial":[41],"aimed":[43],"at":[44],"testing":[45,169],"robot,":[47],"there":[48],"a":[50,57,116,153,184,204,218,225,231,250],"lack":[51],"available":[53],"data":[54,69,117,140,172],"sets":[55,141],"long":[58],"time":[59],"needed":[61,113],"create":[63],"them":[64],"from":[65,188],"scratch.":[66],"A":[67,192,235],"good":[68],"set":[70,173],"fact":[73],"usually":[74],"produced":[75],"with":[76,276],"high":[77],"effort":[78],"terms":[80],"cost":[82],"human":[84],"work":[85],"satisfy":[87],"constraints":[89],"imposed":[90],"by":[91],"expected":[93],"results.":[94],"In":[95,125,147],"first":[97],"part":[98,162,251],"paper,":[101],"we":[102,134],"focus":[103],"on":[104,168],"specification":[106],"properties":[109],"solutions":[112],"build":[115],"set,":[118],"making":[119],"case":[121],"environment":[123,155,221],"exploration.":[124],"proposed":[127],"approach,":[128],"rather":[129],"than":[130],"using":[131,142],"imperative":[132],"programming,":[133],"explore":[135,217,265],"possibility":[137],"generating":[139],"constraint":[143],"programming":[144],"Prolog.":[146],"phase,":[149],"geometric":[150],"predicates":[151],"describe":[152],"virtual":[154,209,220,254],"according":[156],"inter-space":[158],"requirements.":[159],"The":[160],"second":[161],"paper":[165],"focused":[167],"generated":[171,219],"an":[175],"AI":[176],"gym":[177],"via":[178,202],"space":[179],"search":[180,205,242],"techniques.":[181],"We":[182],"developed":[183],"Neuro-Symbolic":[185],"agent":[186,212,260],"built":[187],"following:":[190],"(i)":[191],"deep":[193],"Q-learning":[194,245],"component":[195,237,246],"implemented":[196],"Python,":[198],"able":[199,238],"address":[201],"RL":[203,232],"problem":[206],"space;":[210],"has":[213,273],"goal":[215],"seek":[223],"for":[224],"target,":[226],"improving":[227],"its":[228],"performance":[229],"through":[230],"process.":[233],"(ii)":[234],"symbolic":[236],"re-address":[240],"when":[243],"gets":[247],"stuck":[248],"environment;":[255],"these":[256],"components":[257],"stimulate":[258],"move":[262],"other":[266],"parts":[267],"environment.":[270],"Wide":[271],"experimentation":[272],"been":[274],"performed,":[275],"promising":[277],"results,":[278],"reported,":[281],"demonstrate":[283],"effectiveness":[285],"approach.":[288]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":1}],"updated_date":"2026-05-21T06:26:12.895304","created_date":"2025-10-10T00:00:00"}
