{"id":"https://openalex.org/W3081659697","doi":"https://doi.org/10.1109/ijcnn48605.2020.9206758","title":"A Structure of Restricted Boltzmann Machine for Modeling System Dynamics","display_name":"A Structure of Restricted Boltzmann Machine for Modeling System Dynamics","publication_year":2020,"publication_date":"2020-07-01","ids":{"openalex":"https://openalex.org/W3081659697","doi":"https://doi.org/10.1109/ijcnn48605.2020.9206758","mag":"3081659697"},"language":"en","primary_location":{"id":"doi:10.1109/ijcnn48605.2020.9206758","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn48605.2020.9206758","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://inria.hal.science/hal-02925519","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5027148445","display_name":"Guillaume Padiolleau","orcid":null},"institutions":[{"id":"https://openalex.org/I129235615","display_name":"CEA CESTA","ror":"https://ror.org/026ma2c10","country_code":"FR","type":"government","lineage":["https://openalex.org/I129235615","https://openalex.org/I4210101455"]},{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590"]},{"id":"https://openalex.org/I1326498283","display_name":"Institut national de recherche en sciences et technologies du num\u00e9rique","ror":"https://ror.org/02kvxyf05","country_code":"FR","type":"government","lineage":["https://openalex.org/I1326498283"]},{"id":"https://openalex.org/I15057530","display_name":"Universit\u00e9 de Bordeaux","ror":"https://ror.org/057qpr032","country_code":"FR","type":"education","lineage":["https://openalex.org/I15057530"]},{"id":"https://openalex.org/I2738703131","display_name":"Commissariat \u00e0 l'\u00c9nergie Atomique et aux \u00c9nergies Alternatives","ror":"https://ror.org/00jjx8s55","country_code":"FR","type":"government","lineage":["https://openalex.org/I2738703131"]},{"id":"https://openalex.org/I4210087077","display_name":"Institut des Maladies Neurod\u00e9g\u00e9n\u00e9ratives","ror":"https://ror.org/001695n52","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I15057530","https://openalex.org/I4210087077","https://openalex.org/I4210096427"]},{"id":"https://openalex.org/I4210131512","display_name":"Centre Inria de l'universit\u00e9 de Bordeaux","ror":"https://ror.org/03tjcj052","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1326498283","https://openalex.org/I4210131512"]},{"id":"https://openalex.org/I4210142254","display_name":"Laboratoire Bordelais de Recherche en Informatique","ror":"https://ror.org/03adqg323","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I15057530","https://openalex.org/I4210142254","https://openalex.org/I4210159245","https://openalex.org/I4210160189"]},{"id":"https://openalex.org/I4210160189","display_name":"Institut Polytechnique de Bordeaux","ror":"https://ror.org/054qv7y42","country_code":"FR","type":"education","lineage":["https://openalex.org/I4210160189"]}],"countries":["FR"],"is_corresponding":true,"raw_author_name":"Guillaume Padiolleau","raw_affiliation_strings":["CEA-CESTA, Le Barp, France","IMN, Universit\u00e9 de Bordeaux, CNRS, Bordeaux, France","INRIA Bordeaux Sud-Ouest, Talence, France","LaBRI, Universit\u00e9 de Bordeaux, Bordeaux INP, CNRS, Talence, France"],"affiliations":[{"raw_affiliation_string":"CEA-CESTA, Le Barp, France","institution_ids":["https://openalex.org/I129235615","https://openalex.org/I2738703131"]},{"raw_affiliation_string":"IMN, Universit\u00e9 de Bordeaux, CNRS, Bordeaux, France","institution_ids":["https://openalex.org/I4210087077","https://openalex.org/I1294671590","https://openalex.org/I15057530"]},{"raw_affiliation_string":"INRIA Bordeaux Sud-Ouest, Talence, France","institution_ids":["https://openalex.org/I4210131512","https://openalex.org/I1326498283"]},{"raw_affiliation_string":"LaBRI, Universit\u00e9 de Bordeaux, Bordeaux INP, CNRS, Talence, France","institution_ids":["https://openalex.org/I4210142254","https://openalex.org/I4210160189","https://openalex.org/I15057530","https://openalex.org/I1294671590"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064474867","display_name":"Olivier Bach","orcid":null},"institutions":[{"id":"https://openalex.org/I129235615","display_name":"CEA CESTA","ror":"https://ror.org/026ma2c10","country_code":"FR","type":"government","lineage":["https://openalex.org/I129235615","https://openalex.org/I4210101455"]},{"id":"https://openalex.org/I2738703131","display_name":"Commissariat \u00e0 l'\u00c9nergie Atomique et aux \u00c9nergies Alternatives","ror":"https://ror.org/00jjx8s55","country_code":"FR","type":"government","lineage":["https://openalex.org/I2738703131"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Olivier Bach","raw_affiliation_strings":["CEA-CESTA, Le Barp, France"],"affiliations":[{"raw_affiliation_string":"CEA-CESTA, Le Barp, France","institution_ids":["https://openalex.org/I129235615","https://openalex.org/I2738703131"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047630010","display_name":"Alain Hugget","orcid":null},"institutions":[{"id":"https://openalex.org/I129235615","display_name":"CEA CESTA","ror":"https://ror.org/026ma2c10","country_code":"FR","type":"government","lineage":["https://openalex.org/I129235615","https://openalex.org/I4210101455"]},{"id":"https://openalex.org/I2738703131","display_name":"Commissariat \u00e0 l'\u00c9nergie Atomique et aux \u00c9nergies Alternatives","ror":"https://ror.org/00jjx8s55","country_code":"FR","type":"government","lineage":["https://openalex.org/I2738703131"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Alain Hugget","raw_affiliation_strings":["CEA-CESTA, Le Barp, France"],"affiliations":[{"raw_affiliation_string":"CEA-CESTA, Le Barp, France","institution_ids":["https://openalex.org/I129235615","https://openalex.org/I2738703131"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071329791","display_name":"D. Penninckx","orcid":"https://orcid.org/0009-0007-3407-0823"},"institutions":[{"id":"https://openalex.org/I129235615","display_name":"CEA CESTA","ror":"https://ror.org/026ma2c10","country_code":"FR","type":"government","lineage":["https://openalex.org/I129235615","https://openalex.org/I4210101455"]},{"id":"https://openalex.org/I2738703131","display_name":"Commissariat \u00e0 l'\u00c9nergie Atomique et aux \u00c9nergies Alternatives","ror":"https://ror.org/00jjx8s55","country_code":"FR","type":"government","lineage":["https://openalex.org/I2738703131"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Denis Penninckx","raw_affiliation_strings":["CEA-CESTA, Le Barp, France"],"affiliations":[{"raw_affiliation_string":"CEA-CESTA, Le Barp, France","institution_ids":["https://openalex.org/I129235615","https://openalex.org/I2738703131"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5073820572","display_name":"Fr\u00e9d\u00e9ric Alexandre","orcid":"https://orcid.org/0000-0002-6113-1878"},"institutions":[{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590"]},{"id":"https://openalex.org/I1326498283","display_name":"Institut national de recherche en sciences et technologies du num\u00e9rique","ror":"https://ror.org/02kvxyf05","country_code":"FR","type":"government","lineage":["https://openalex.org/I1326498283"]},{"id":"https://openalex.org/I15057530","display_name":"Universit\u00e9 de Bordeaux","ror":"https://ror.org/057qpr032","country_code":"FR","type":"education","lineage":["https://openalex.org/I15057530"]},{"id":"https://openalex.org/I4210087077","display_name":"Institut des Maladies Neurod\u00e9g\u00e9n\u00e9ratives","ror":"https://ror.org/001695n52","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I15057530","https://openalex.org/I4210087077","https://openalex.org/I4210096427"]},{"id":"https://openalex.org/I4210131512","display_name":"Centre Inria de l'universit\u00e9 de Bordeaux","ror":"https://ror.org/03tjcj052","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1326498283","https://openalex.org/I4210131512"]},{"id":"https://openalex.org/I4210142254","display_name":"Laboratoire Bordelais de Recherche en Informatique","ror":"https://ror.org/03adqg323","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I15057530","https://openalex.org/I4210142254","https://openalex.org/I4210159245","https://openalex.org/I4210160189"]},{"id":"https://openalex.org/I4210160189","display_name":"Institut Polytechnique de Bordeaux","ror":"https://ror.org/054qv7y42","country_code":"FR","type":"education","lineage":["https://openalex.org/I4210160189"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Frederic Alexandre","raw_affiliation_strings":["IMN, Universit\u00e9 de Bordeaux, CNRS, Bordeaux, France","INRIA Bordeaux Sud-Ouest, Talence, France","LaBRI, Universit\u00e9 de Bordeaux, Bordeaux INP, CNRS, Talence, France"],"affiliations":[{"raw_affiliation_string":"IMN, Universit\u00e9 de Bordeaux, CNRS, Bordeaux, France","institution_ids":["https://openalex.org/I4210087077","https://openalex.org/I1294671590","https://openalex.org/I15057530"]},{"raw_affiliation_string":"INRIA Bordeaux Sud-Ouest, Talence, France","institution_ids":["https://openalex.org/I4210131512","https://openalex.org/I1326498283"]},{"raw_affiliation_string":"LaBRI, Universit\u00e9 de Bordeaux, Bordeaux INP, CNRS, Talence, France","institution_ids":["https://openalex.org/I4210142254","https://openalex.org/I4210160189","https://openalex.org/I15057530","https://openalex.org/I1294671590"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5027148445"],"corresponding_institution_ids":["https://openalex.org/I129235615","https://openalex.org/I1294671590","https://openalex.org/I1326498283","https://openalex.org/I15057530","https://openalex.org/I2738703131","https://openalex.org/I4210087077","https://openalex.org/I4210131512","https://openalex.org/I4210142254","https://openalex.org/I4210160189"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.10487335,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"15","issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11206","display_name":"Model Reduction and Neural Networks","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11206","display_name":"Model Reduction and Neural Networks","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12814","display_name":"Gaussian Processes and Bayesian Inference","score":0.9950000047683716,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6608361601829529},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6544820666313171},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.6143054366111755},{"id":"https://openalex.org/keywords/restricted-boltzmann-machine","display_name":"Restricted Boltzmann machine","score":0.5871272683143616},{"id":"https://openalex.org/keywords/boltzmann-machine","display_name":"Boltzmann machine","score":0.5781934857368469},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5748754143714905},{"id":"https://openalex.org/keywords/unsupervised-learning","display_name":"Unsupervised learning","score":0.5195253491401672},{"id":"https://openalex.org/keywords/observable","display_name":"Observable","score":0.46539342403411865},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4578610062599182},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.45297685265541077},{"id":"https://openalex.org/keywords/feature-learning","display_name":"Feature learning","score":0.4434671998023987},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.3979763388633728},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.3436626195907593},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.10711014270782471}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6608361601829529},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6544820666313171},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.6143054366111755},{"id":"https://openalex.org/C199354608","wikidata":"https://www.wikidata.org/wiki/Q7316287","display_name":"Restricted Boltzmann machine","level":3,"score":0.5871272683143616},{"id":"https://openalex.org/C192576344","wikidata":"https://www.wikidata.org/wiki/Q194706","display_name":"Boltzmann machine","level":3,"score":0.5781934857368469},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5748754143714905},{"id":"https://openalex.org/C8038995","wikidata":"https://www.wikidata.org/wiki/Q1152135","display_name":"Unsupervised learning","level":2,"score":0.5195253491401672},{"id":"https://openalex.org/C32848918","wikidata":"https://www.wikidata.org/wiki/Q845789","display_name":"Observable","level":2,"score":0.46539342403411865},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4578610062599182},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.45297685265541077},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.4434671998023987},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.3979763388633728},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3436626195907593},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.10711014270782471},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/ijcnn48605.2020.9206758","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn48605.2020.9206758","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"},{"id":"pmh:oai:HAL:hal-02925519v1","is_oa":true,"landing_page_url":"https://inria.hal.science/hal-02925519","pdf_url":null,"source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IJCNN 2020 - International Joint Conference on Neural Networks, IEEE, Jul 2020, Glasgow, United Kingdom. pp.8","raw_type":"Conference papers"}],"best_oa_location":{"id":"pmh:oai:HAL:hal-02925519v1","is_oa":true,"landing_page_url":"https://inria.hal.science/hal-02925519","pdf_url":null,"source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IJCNN 2020 - International Joint Conference on Neural Networks, IEEE, Jul 2020, Glasgow, United Kingdom. pp.8","raw_type":"Conference papers"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":32,"referenced_works":["https://openalex.org/W44815768","https://openalex.org/W142185896","https://openalex.org/W1495672967","https://openalex.org/W1511867968","https://openalex.org/W1697053819","https://openalex.org/W2021202584","https://openalex.org/W2048586760","https://openalex.org/W2101524054","https://openalex.org/W2115096495","https://openalex.org/W2116064496","https://openalex.org/W2116825644","https://openalex.org/W2120190345","https://openalex.org/W2136163184","https://openalex.org/W2150529939","https://openalex.org/W2158164339","https://openalex.org/W2160115902","https://openalex.org/W2165225968","https://openalex.org/W2567455162","https://openalex.org/W2787666871","https://openalex.org/W2799245749","https://openalex.org/W2962977065","https://openalex.org/W2963375351","https://openalex.org/W2963523627","https://openalex.org/W6605753235","https://openalex.org/W6629584833","https://openalex.org/W6630657659","https://openalex.org/W6637189935","https://openalex.org/W6683128514","https://openalex.org/W6684349851","https://openalex.org/W6750253780","https://openalex.org/W6750453880","https://openalex.org/W6780559895"],"related_works":["https://openalex.org/W4283272532","https://openalex.org/W2952018105","https://openalex.org/W2119341610","https://openalex.org/W2916681395","https://openalex.org/W2556473569","https://openalex.org/W2193475944","https://openalex.org/W4302433642","https://openalex.org/W2529583158","https://openalex.org/W3104798141","https://openalex.org/W2523796918"],"abstract_inverted_index":{"This":[0],"paper":[1,192],"presents":[2],"a":[3,39,101],"new":[4],"approach":[5],"for":[6,15,64,113,135,160],"learning":[7,13,114,153,161,196],"transition":[8,31,46,79,133,216],"function":[9,217],"in":[10,151,176,190,221],"state":[11,30],"representation":[12,69],"(SRL)":[14],"control.":[16],"While":[17],"state-of-the-art":[18],"methods":[19],"use":[20,100],"different":[21,157],"deterministic":[22],"neural":[23],"networks":[24],"to":[25,43,66,76,168,173,184,213],"learn":[26,44,77,214],"forward":[27],"and":[28,90,117,149,218],"inverse":[29],"functions":[32,80],"independently":[33],"with":[34,110,119],"auto-supervised":[35],"learning,":[36],"we":[37,193],"introduce":[38],"bidirectional":[40,132,215],"stochastic":[41],"model":[42,56,75,134,163],"both":[45,78],"functions.":[47],"We":[48,99,155,205],"aim":[49],"at":[50],"using":[51,72],"the":[52,55,68,73,83,93,97,128,131,162,199,208],"uncertainty":[53],"of":[54,96,130,187],"on":[57,126,195],"its":[58],"predictions":[59],"as":[60],"an":[61],"intrinsic":[62],"motivation":[63],"exploration":[65],"enhance":[67],"learning.":[70,137],"More,":[71],"same":[74],"allows":[81],"sharing":[82],"parameters,":[84],"which":[85],"can":[86],"reduce":[87],"their":[88],"number":[89],"should":[91],"increase":[92],"embedding":[94],"quality":[95],"representation.":[98],"factored":[102],"restricted":[103,183],"Boltzmann":[104],"machine":[105],"(fRBM)":[106],"based":[107],"model,":[108],"enhanced":[109],"dedicated":[111],"structure":[112,129,140,180,210],"system":[115],"dynamics":[116,197],"transitions":[118],"shared":[120],"parameters.":[121],"The":[122],"presented":[123],"work":[124],"focuses":[125],"building":[127],"unsupervised":[136],"Our":[138,179],"fRBM":[139],"is":[141,181,211],"directly":[142],"inspired":[143],"from":[144,198],"physics":[145],"interactions":[146],"between":[147],"inputs":[148],"outputs":[150],"reinforcement":[152],"framework.":[154,178],"compare":[156],"training":[158],"algorithms":[159],"that":[164,207],"must":[165],"be":[166,174],"able":[167,212],"predict":[169],"observable":[170],"random":[171],"variables":[172],"used":[175],"SRL":[177],"not":[182],"any":[185],"type":[186],"observable,":[188],"nevertheless":[189],"this":[191],"focus":[194],"OpenAI":[200],"Gym":[201],"environment":[202],"Swinging":[203],"Pendulum.":[204],"show":[206],"proposed":[209],"performs":[219],"well":[220],"prediction":[222],"task.":[223]},"counts_by_year":[],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
