{"id":"https://openalex.org/W2923682622","doi":"https://doi.org/10.1109/access.2021.3119000","title":"Symbolic Regression Methods for Reinforcement Learning","display_name":"Symbolic Regression Methods for Reinforcement Learning","publication_year":2021,"publication_date":"2021-01-01","ids":{"openalex":"https://openalex.org/W2923682622","doi":"https://doi.org/10.1109/access.2021.3119000","mag":"2923682622"},"language":"en","primary_location":{"id":"doi:10.1109/access.2021.3119000","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2021.3119000","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/09565900.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/09565900.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5004892921","display_name":"Ji\u0159\u0131\u0301 Kubal\u0131\u0301k","orcid":"https://orcid.org/0000-0002-6965-6142"},"institutions":[{"id":"https://openalex.org/I44504214","display_name":"Czech Technical University in Prague","ror":"https://ror.org/03kqpb082","country_code":"CZ","type":"education","lineage":["https://openalex.org/I44504214"]}],"countries":["CZ"],"is_corresponding":true,"raw_author_name":"Jiri Kubalik","raw_affiliation_strings":["Czech Institute of Informatics, Robotics, and Cybernetics, Czech Technical University in Prague, Prague, 16000, Czech Republic","Czech Technical Univ. in Prague"],"raw_orcid":"https://orcid.org/0000-0002-6965-6142","affiliations":[{"raw_affiliation_string":"Czech Institute of Informatics, Robotics, and Cybernetics, Czech Technical University in Prague, Prague, 16000, Czech Republic","institution_ids":["https://openalex.org/I44504214"]},{"raw_affiliation_string":"Czech Technical Univ. in Prague","institution_ids":["https://openalex.org/I44504214"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033348430","display_name":"Erik Derner","orcid":"https://orcid.org/0000-0002-7588-7668"},"institutions":[{"id":"https://openalex.org/I44504214","display_name":"Czech Technical University in Prague","ror":"https://ror.org/03kqpb082","country_code":"CZ","type":"education","lineage":["https://openalex.org/I44504214"]}],"countries":["CZ"],"is_corresponding":false,"raw_author_name":"Erik Derner","raw_affiliation_strings":["Czech Institute of Informatics, Robotics, and Cybernetics, Czech Technical University in Prague, Prague, 16000, Czech Republic and Faculty of Electrical Engineering, Czech Technical University in Prague, Prague, 16627, Czech Republic. (e-mail: erik.derner@cvut.cz)"],"raw_orcid":"https://orcid.org/0000-0002-7588-7668","affiliations":[{"raw_affiliation_string":"Czech Institute of Informatics, Robotics, and Cybernetics, Czech Technical University in Prague, Prague, 16000, Czech Republic and Faculty of Electrical Engineering, Czech Technical University in Prague, Prague, 16627, Czech Republic. (e-mail: erik.derner@cvut.cz)","institution_ids":["https://openalex.org/I44504214"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034437054","display_name":"Jan \u017degklitz","orcid":"https://orcid.org/0000-0003-3302-6779"},"institutions":[{"id":"https://openalex.org/I44504214","display_name":"Czech Technical University in Prague","ror":"https://ror.org/03kqpb082","country_code":"CZ","type":"education","lineage":["https://openalex.org/I44504214"]}],"countries":["CZ"],"is_corresponding":false,"raw_author_name":"Jan Zegklitz","raw_affiliation_strings":["Faculty of Electrical Engineering, Czech Technical University in Prague, Prague, 16627, Czech Republic"],"raw_orcid":"https://orcid.org/0000-0003-3302-6779","affiliations":[{"raw_affiliation_string":"Faculty of Electrical Engineering, Czech Technical University in Prague, Prague, 16627, Czech Republic","institution_ids":["https://openalex.org/I44504214"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5084264842","display_name":"Robert Babu\u0161ka","orcid":"https://orcid.org/0000-0001-9578-8598"},"institutions":[{"id":"https://openalex.org/I44504214","display_name":"Czech Technical University in Prague","ror":"https://ror.org/03kqpb082","country_code":"CZ","type":"education","lineage":["https://openalex.org/I44504214"]}],"countries":["CZ"],"is_corresponding":false,"raw_author_name":"Robert Babuska","raw_affiliation_strings":["Czech Institute of Informatics, Robotics, and Cybernetics, Czech Technical University in Prague, Prague, 16000, Czech Republic and Cognitive Robotics, Delft University of Technology, Delft, 2628 CD, The Netherlands"],"raw_orcid":"https://orcid.org/0000-0001-9578-8598","affiliations":[{"raw_affiliation_string":"Czech Institute of Informatics, Robotics, and Cybernetics, Czech Technical University in Prague, Prague, 16000, Czech Republic and Cognitive Robotics, Delft University of Technology, Delft, 2628 CD, The Netherlands","institution_ids":["https://openalex.org/I44504214"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5004892921"],"corresponding_institution_ids":["https://openalex.org/I44504214"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":0.5597,"has_fulltext":true,"cited_by_count":9,"citation_normalized_percentile":{"value":0.71606716,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":"9","issue":null,"first_page":"139697","last_page":"139711"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11206","display_name":"Model Reduction and Neural Networks","score":0.9941999912261963,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11975","display_name":"Evolutionary Algorithms and Applications","score":0.9926999807357788,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8485968112945557},{"id":"https://openalex.org/keywords/bellman-equation","display_name":"Bellman equation","score":0.6822443008422852},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6388574838638306},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5659070014953613},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.47991976141929626},{"id":"https://openalex.org/keywords/value","display_name":"Value (mathematics)","score":0.45861175656318665},{"id":"https://openalex.org/keywords/function-approximation","display_name":"Function approximation","score":0.4454859495162964},{"id":"https://openalex.org/keywords/state-variable","display_name":"State variable","score":0.4343588948249817},{"id":"https://openalex.org/keywords/pendulum","display_name":"Pendulum","score":0.43262138962745667},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4015757441520691},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.37875235080718994},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.29538074135780334},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.2585332989692688}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8485968112945557},{"id":"https://openalex.org/C14646407","wikidata":"https://www.wikidata.org/wiki/Q1430750","display_name":"Bellman equation","level":2,"score":0.6822443008422852},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6388574838638306},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5659070014953613},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.47991976141929626},{"id":"https://openalex.org/C2776291640","wikidata":"https://www.wikidata.org/wiki/Q2912517","display_name":"Value (mathematics)","level":2,"score":0.45861175656318665},{"id":"https://openalex.org/C91873725","wikidata":"https://www.wikidata.org/wiki/Q3445816","display_name":"Function approximation","level":3,"score":0.4454859495162964},{"id":"https://openalex.org/C129537906","wikidata":"https://www.wikidata.org/wiki/Q7603913","display_name":"State variable","level":2,"score":0.4343588948249817},{"id":"https://openalex.org/C110639684","wikidata":"https://www.wikidata.org/wiki/Q20702","display_name":"Pendulum","level":2,"score":0.43262138962745667},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4015757441520691},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.37875235080718994},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.29538074135780334},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2585332989692688},{"id":"https://openalex.org/C97355855","wikidata":"https://www.wikidata.org/wiki/Q11473","display_name":"Thermodynamics","level":1,"score":0.0},{"id":"https://openalex.org/C78458016","wikidata":"https://www.wikidata.org/wiki/Q840400","display_name":"Evolutionary biology","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":6,"locations":[{"id":"doi:10.1109/access.2021.3119000","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2021.3119000","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/09565900.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:1903.09688","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1903.09688","pdf_url":"https://arxiv.org/pdf/1903.09688","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"mag:2923682622","is_oa":true,"landing_page_url":"https://arxiv.org/pdf/1903.09688v1","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},{"id":"pmh:oai:doaj.org/article:b4e237f7c70c40dfbea05c12d51a6c67","is_oa":true,"landing_page_url":"https://doaj.org/article/b4e237f7c70c40dfbea05c12d51a6c67","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 9, Pp 139697-139711 (2021)","raw_type":"article"},{"id":"pmh:oai:tudelft.nl:uuid:02411602-2f70-4deb-8ede-29f98ff8f91b","is_oa":false,"landing_page_url":"http://resolver.tudelft.nl/uuid:02411602-2f70-4deb-8ede-29f98ff8f91b","pdf_url":null,"source":{"id":"https://openalex.org/S4306400906","display_name":"Research Repository (Delft University of Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I98358874","host_organization_name":"Delft University of Technology","host_organization_lineage":["https://openalex.org/I98358874"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"journal article"},{"id":"doi:10.48550/arxiv.1903.09688","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.1903.09688","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article-journal"}],"best_oa_location":{"id":"doi:10.1109/access.2021.3119000","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2021.3119000","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/09565900.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions","score":0.8299999833106995}],"awards":[{"id":"https://openalex.org/G12500569","display_name":null,"funder_award_id":"CZ.02.1.01/0.0","funder_id":"https://openalex.org/F4320321006","funder_display_name":"Grantov\u00e1 Agentura \u010cesk\u00e9 Republiky"},{"id":"https://openalex.org/G176604203","display_name":null,"funder_award_id":"02.1.01/0.0/0.0","funder_id":"https://openalex.org/F4320335322","funder_display_name":"European Regional Development Fund"},{"id":"https://openalex.org/G291036901","display_name":null,"funder_award_id":"CZ.02","funder_id":"https://openalex.org/F4320335322","funder_display_name":"European Regional Development Fund"},{"id":"https://openalex.org/G3490171961","display_name":null,"funder_award_id":"CZ.02.1.01","funder_id":"https://openalex.org/F4320335322","funder_display_name":"European Regional Development Fund"},{"id":"https://openalex.org/G3593829383","display_name":null,"funder_award_id":"SGS19/174/OHK3/3T/13","funder_id":"https://openalex.org/F4320309972","funder_display_name":"\u010cesk\u00e9 Vysok\u00e9 U\u010den\u00ed Technick\u00e9 v Praze"},{"id":"https://openalex.org/G4131035492","display_name":null,"funder_award_id":"CZ.02.1.01","funder_id":"https://openalex.org/F4320321006","funder_display_name":"Grantov\u00e1 Agentura \u010cesk\u00e9 Republiky"},{"id":"https://openalex.org/G5916014575","display_name":null,"funder_award_id":"CZ.02.1.01/0.0/0.0","funder_id":"https://openalex.org/F4320335322","funder_display_name":"European Regional Development Fund"},{"id":"https://openalex.org/G6594491356","display_name":null,"funder_award_id":"CZ.02.1.01/0.0/0.0/","funder_id":"https://openalex.org/F4320335322","funder_display_name":"European Regional Development Fund"},{"id":"https://openalex.org/G7466461085","display_name":null,"funder_award_id":"15-22731S","funder_id":"https://openalex.org/F4320321006","funder_display_name":"Grantov\u00e1 Agentura \u010cesk\u00e9 Republiky"},{"id":"https://openalex.org/G8087443690","display_name":null,"funder_award_id":"CZ.02.1.01/0.0/0.0/15_003/0000470","funder_id":"https://openalex.org/F4320335322","funder_display_name":"European Regional Development Fund"}],"funders":[{"id":"https://openalex.org/F4320309972","display_name":"\u010cesk\u00e9 Vysok\u00e9 U\u010den\u00ed Technick\u00e9 v Praze","ror":"https://ror.org/03kqpb082"},{"id":"https://openalex.org/F4320321006","display_name":"Grantov\u00e1 Agentura \u010cesk\u00e9 Republiky","ror":"https://ror.org/01pv73b02"},{"id":"https://openalex.org/F4320335322","display_name":"European Regional Development Fund","ror":"https://ror.org/00k4n6c32"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2923682622.pdf","grobid_xml":"https://content.openalex.org/works/W2923682622.grobid-xml"},"referenced_works_count":46,"referenced_works":["https://openalex.org/W102487131","https://openalex.org/W197747737","https://openalex.org/W1542000206","https://openalex.org/W1552830313","https://openalex.org/W1626155273","https://openalex.org/W1689445748","https://openalex.org/W1757796397","https://openalex.org/W1966086707","https://openalex.org/W1968962398","https://openalex.org/W1979769287","https://openalex.org/W1991542861","https://openalex.org/W2014337138","https://openalex.org/W2059396387","https://openalex.org/W2064364553","https://openalex.org/W2068823081","https://openalex.org/W2108051346","https://openalex.org/W2110608082","https://openalex.org/W2120346334","https://openalex.org/W2121863487","https://openalex.org/W2136495462","https://openalex.org/W2145339207","https://openalex.org/W2173248099","https://openalex.org/W2483158547","https://openalex.org/W2509705549","https://openalex.org/W2570076534","https://openalex.org/W2729625880","https://openalex.org/W2735901402","https://openalex.org/W2769736739","https://openalex.org/W2783396564","https://openalex.org/W2783456932","https://openalex.org/W2892979040","https://openalex.org/W2954765142","https://openalex.org/W2963672746","https://openalex.org/W2963773324","https://openalex.org/W3010868305","https://openalex.org/W3016401366","https://openalex.org/W3017946098","https://openalex.org/W3038264455","https://openalex.org/W3106411828","https://openalex.org/W3156202422","https://openalex.org/W6637967152","https://openalex.org/W6656412206","https://openalex.org/W6677737365","https://openalex.org/W6684921986","https://openalex.org/W6763291914","https://openalex.org/W6775039030"],"related_works":["https://openalex.org/W3206768895","https://openalex.org/W2294727673","https://openalex.org/W3172704282","https://openalex.org/W2110422826","https://openalex.org/W2924194835","https://openalex.org/W2189252197","https://openalex.org/W2187753657","https://openalex.org/W2145756561","https://openalex.org/W3012520197","https://openalex.org/W2310813700","https://openalex.org/W3196070124","https://openalex.org/W3173370172","https://openalex.org/W2804606950","https://openalex.org/W2078246718","https://openalex.org/W2798418464","https://openalex.org/W2319967243","https://openalex.org/W2107880645","https://openalex.org/W1509570633","https://openalex.org/W606274623","https://openalex.org/W3036320002"],"abstract_inverted_index":{"Reinforcement":[0],"learning":[1,21],"algorithms":[2,22],"can":[3],"be":[4],"used":[5,37],"to":[6,28,82,168],"optimally":[7],"solve":[8],"dynamic":[9],"decision-making":[10],"and":[11,17,33,63,68,119,141,145,166],"control":[12,134,137],"problems.":[13],"With":[14],"continuous-valued":[15],"state":[16,110],"input":[18],"variables,":[19],"reinforcement":[20],"must":[23],"rely":[24],"on":[25,108,131],"function":[26,32,46],"approximators":[27],"represent":[29],"the":[30,60,88,124,152,182,199],"value":[31,85,105,114,153],"policy":[34,117],"mappings.":[35],"Commonly":[36],"numerical":[38],"approximators,":[39],"such":[40],"as":[41],"neural":[42,192,200],"networks":[43,193],"or":[44],"basis":[45],"expansions,":[47],"have":[48],"two":[49],"main":[50],"drawbacks:":[51],"they":[52,64],"are":[53,129,162],"black-box":[54],"models":[55],"offering":[56],"no":[57],"insight":[58],"in":[59,87],"mappings":[61],"learned,":[62],"require":[65],"significant":[66],"trial":[67],"error":[69],"tuning":[70],"of":[71,90,95,123,181],"their":[72],"meta-parameters.":[73],"In":[74],"this":[75],"paper,":[76],"we":[77],"propose":[78],"a":[79,109,120],"new":[80],"approach":[81,190],"constructing":[83],"smooth":[84],"functions":[86,106,154],"form":[89],"analytic":[91],"expressions":[92],"by":[93],"means":[94],"symbolic":[96,113,116],"regression.":[97],"We":[98],"introduce":[99],"three":[100],"off-line":[101],"methods":[102,128],"for":[103,178],"finding":[104],"based":[107],"transition":[111],"model:":[112],"iteration,":[115,118],"direct":[121],"solution":[122],"Bellman":[125],"equation.":[126],"The":[127,148],"illustrated":[130],"four":[132],"nonlinear":[133],"problems:":[135],"velocity":[136],"under":[138],"friction,":[139],"one-link":[140],"two-link":[142],"pendulum":[143],"swing-up,":[144],"magnetic":[146],"manipulation.":[147],"results":[149],"show":[150],"that":[151,195],"not":[155],"only":[156],"yield":[157],"well-performing":[158],"policies,":[159],"but":[160],"also":[161],"compact,":[163],"mathematically":[164],"tractable":[165],"easy":[167],"plug":[169],"into":[170],"other":[171],"algorithms.":[172],"This":[173],"makes":[174],"them":[175],"potentially":[176],"suitable":[177],"further":[179],"analysis":[180],"closed-loop":[183],"system.":[184],"A":[185],"comparison":[186],"with":[187],"an":[188],"alternative":[189],"using":[191],"shows":[194],"our":[196],"method":[197],"outperforms":[198],"network-based":[201],"one.":[202]},"counts_by_year":[{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":2}],"updated_date":"2026-05-06T08:25:59.206177","created_date":"2019-04-01T00:00:00"}
