{"id":"https://openalex.org/W3215482237","doi":"https://doi.org/10.1109/icra46639.2022.9811993","title":"Value learning from trajectory optimization and Sobolev descent: A step toward reinforcement learning with superlinear convergence properties","display_name":"Value learning from trajectory optimization and Sobolev descent: A step toward reinforcement learning with superlinear convergence properties","publication_year":2022,"publication_date":"2022-05-23","ids":{"openalex":"https://openalex.org/W3215482237","doi":"https://doi.org/10.1109/icra46639.2022.9811993","mag":"3215482237"},"language":"en","primary_location":{"id":"doi:10.1109/icra46639.2022.9811993","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra46639.2022.9811993","pdf_url":null,"source":{"id":"https://openalex.org/S4363607759","display_name":"2022 International Conference on Robotics and Automation (ICRA)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5008531364","display_name":"Amit Parag","orcid":null},"institutions":[{"id":"https://openalex.org/I84500057","display_name":"Institut de Math\u00e9matiques de Toulouse","ror":"https://ror.org/014vp6c30","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I134560555","https://openalex.org/I196454796","https://openalex.org/I4210141950","https://openalex.org/I4210152422","https://openalex.org/I4405258862","https://openalex.org/I4405258862","https://openalex.org/I4405258862","https://openalex.org/I4405258862","https://openalex.org/I4405259414","https://openalex.org/I84500057"]},{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590"]},{"id":"https://openalex.org/I17866349","display_name":"Universit\u00e9 F\u00e9d\u00e9rale de Toulouse Midi-Pyr\u00e9n\u00e9es","ror":"https://ror.org/004raaa70","country_code":"FR","type":"education","lineage":["https://openalex.org/I17866349"]},{"id":"https://openalex.org/I190497903","display_name":"Laboratoire d'Analyse et d'Architecture des Syst\u00e8mes","ror":"https://ror.org/03vcm6439","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I134560555","https://openalex.org/I190497903","https://openalex.org/I196454796","https://openalex.org/I205747304","https://openalex.org/I205747304","https://openalex.org/I4210095849","https://openalex.org/I4210159245","https://openalex.org/I4387153255","https://openalex.org/I4405258862","https://openalex.org/I4405258862","https://openalex.org/I4405258862","https://openalex.org/I4405258862"]},{"id":"https://openalex.org/I4210098964","display_name":"Toulouse Mathematics Institute","ror":null,"country_code":"FR","type":null,"lineage":["https://openalex.org/I4210098964"]}],"countries":["FR"],"is_corresponding":true,"raw_author_name":"Amit Parag","raw_affiliation_strings":["Artificial and Natural Intelligence Toulouse Institute,France","LAAS-CNRS, Universite de Toulouse, CNRS, Toulouse, France","Artificial and Natural Intelligence Toulouse Institute, France"],"affiliations":[{"raw_affiliation_string":"Artificial and Natural Intelligence Toulouse Institute,France","institution_ids":["https://openalex.org/I4210098964"]},{"raw_affiliation_string":"LAAS-CNRS, Universite de Toulouse, CNRS, Toulouse, France","institution_ids":["https://openalex.org/I17866349","https://openalex.org/I1294671590","https://openalex.org/I190497903"]},{"raw_affiliation_string":"Artificial and Natural Intelligence Toulouse Institute, France","institution_ids":["https://openalex.org/I84500057"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059986525","display_name":"S\u00e9bastien Kleff","orcid":"https://orcid.org/0000-0002-9025-6143"},"institutions":[{"id":"https://openalex.org/I4210098964","display_name":"Toulouse Mathematics Institute","ror":null,"country_code":"FR","type":null,"lineage":["https://openalex.org/I4210098964"]},{"id":"https://openalex.org/I84500057","display_name":"Institut de Math\u00e9matiques de Toulouse","ror":"https://ror.org/014vp6c30","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I134560555","https://openalex.org/I196454796","https://openalex.org/I4210141950","https://openalex.org/I4210152422","https://openalex.org/I4405258862","https://openalex.org/I4405258862","https://openalex.org/I4405258862","https://openalex.org/I4405258862","https://openalex.org/I4405259414","https://openalex.org/I84500057"]},{"id":"https://openalex.org/I57206974","display_name":"New York University","ror":"https://ror.org/0190ak572","country_code":"US","type":"education","lineage":["https://openalex.org/I57206974"]}],"countries":["FR","US"],"is_corresponding":false,"raw_author_name":"Sebastien Kleff","raw_affiliation_strings":["Artificial and Natural Intelligence Toulouse Institute,France","Artificial and Natural Intelligence Toulouse Institute, France","New York University, USA"],"affiliations":[{"raw_affiliation_string":"Artificial and Natural Intelligence Toulouse Institute,France","institution_ids":["https://openalex.org/I4210098964"]},{"raw_affiliation_string":"Artificial and Natural Intelligence Toulouse Institute, France","institution_ids":["https://openalex.org/I84500057"]},{"raw_affiliation_string":"New York University, USA","institution_ids":["https://openalex.org/I57206974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042182440","display_name":"L\u00e9o Saci","orcid":"https://orcid.org/0000-0002-6957-7823"},"institutions":[{"id":"https://openalex.org/I4210098964","display_name":"Toulouse Mathematics Institute","ror":null,"country_code":"FR","type":null,"lineage":["https://openalex.org/I4210098964"]},{"id":"https://openalex.org/I84500057","display_name":"Institut de Math\u00e9matiques de Toulouse","ror":"https://ror.org/014vp6c30","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I134560555","https://openalex.org/I196454796","https://openalex.org/I4210141950","https://openalex.org/I4210152422","https://openalex.org/I4405258862","https://openalex.org/I4405258862","https://openalex.org/I4405258862","https://openalex.org/I4405258862","https://openalex.org/I4405259414","https://openalex.org/I84500057"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Leo Saci","raw_affiliation_strings":["Artificial and Natural Intelligence Toulouse Institute,France","Artificial and Natural Intelligence Toulouse Institute, France"],"affiliations":[{"raw_affiliation_string":"Artificial and Natural Intelligence Toulouse Institute,France","institution_ids":["https://openalex.org/I4210098964"]},{"raw_affiliation_string":"Artificial and Natural Intelligence Toulouse Institute, France","institution_ids":["https://openalex.org/I84500057"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046876471","display_name":"Nicolas Mansard","orcid":"https://orcid.org/0000-0002-8090-0601"},"institutions":[{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590"]},{"id":"https://openalex.org/I84500057","display_name":"Institut de Math\u00e9matiques de Toulouse","ror":"https://ror.org/014vp6c30","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I134560555","https://openalex.org/I196454796","https://openalex.org/I4210141950","https://openalex.org/I4210152422","https://openalex.org/I4405258862","https://openalex.org/I4405258862","https://openalex.org/I4405258862","https://openalex.org/I4405258862","https://openalex.org/I4405259414","https://openalex.org/I84500057"]},{"id":"https://openalex.org/I190497903","display_name":"Laboratoire d'Analyse et d'Architecture des Syst\u00e8mes","ror":"https://ror.org/03vcm6439","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I134560555","https://openalex.org/I190497903","https://openalex.org/I196454796","https://openalex.org/I205747304","https://openalex.org/I205747304","https://openalex.org/I4210095849","https://openalex.org/I4210159245","https://openalex.org/I4387153255","https://openalex.org/I4405258862","https://openalex.org/I4405258862","https://openalex.org/I4405258862","https://openalex.org/I4405258862"]},{"id":"https://openalex.org/I17866349","display_name":"Universit\u00e9 F\u00e9d\u00e9rale de Toulouse Midi-Pyr\u00e9n\u00e9es","ror":"https://ror.org/004raaa70","country_code":"FR","type":"education","lineage":["https://openalex.org/I17866349"]},{"id":"https://openalex.org/I4210098964","display_name":"Toulouse Mathematics Institute","ror":null,"country_code":"FR","type":null,"lineage":["https://openalex.org/I4210098964"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Nicolas Mansard","raw_affiliation_strings":["Artificial and Natural Intelligence Toulouse Institute,France","LAAS-CNRS, Universite de Toulouse, CNRS, Toulouse, France","Artificial and Natural Intelligence Toulouse Institute, France"],"affiliations":[{"raw_affiliation_string":"Artificial and Natural Intelligence Toulouse Institute,France","institution_ids":["https://openalex.org/I4210098964"]},{"raw_affiliation_string":"LAAS-CNRS, Universite de Toulouse, CNRS, Toulouse, France","institution_ids":["https://openalex.org/I17866349","https://openalex.org/I1294671590","https://openalex.org/I190497903"]},{"raw_affiliation_string":"Artificial and Natural Intelligence Toulouse Institute, France","institution_ids":["https://openalex.org/I84500057"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5071048560","display_name":"Olivier Stasse","orcid":"https://orcid.org/0000-0001-8569-6155"},"institutions":[{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590"]},{"id":"https://openalex.org/I84500057","display_name":"Institut de Math\u00e9matiques de Toulouse","ror":"https://ror.org/014vp6c30","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I134560555","https://openalex.org/I196454796","https://openalex.org/I4210141950","https://openalex.org/I4210152422","https://openalex.org/I4405258862","https://openalex.org/I4405258862","https://openalex.org/I4405258862","https://openalex.org/I4405258862","https://openalex.org/I4405259414","https://openalex.org/I84500057"]},{"id":"https://openalex.org/I17866349","display_name":"Universit\u00e9 F\u00e9d\u00e9rale de Toulouse Midi-Pyr\u00e9n\u00e9es","ror":"https://ror.org/004raaa70","country_code":"FR","type":"education","lineage":["https://openalex.org/I17866349"]},{"id":"https://openalex.org/I4210098964","display_name":"Toulouse Mathematics Institute","ror":null,"country_code":"FR","type":null,"lineage":["https://openalex.org/I4210098964"]},{"id":"https://openalex.org/I190497903","display_name":"Laboratoire d'Analyse et d'Architecture des Syst\u00e8mes","ror":"https://ror.org/03vcm6439","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I134560555","https://openalex.org/I190497903","https://openalex.org/I196454796","https://openalex.org/I205747304","https://openalex.org/I205747304","https://openalex.org/I4210095849","https://openalex.org/I4210159245","https://openalex.org/I4387153255","https://openalex.org/I4405258862","https://openalex.org/I4405258862","https://openalex.org/I4405258862","https://openalex.org/I4405258862"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Olivier Stasse","raw_affiliation_strings":["Artificial and Natural Intelligence Toulouse Institute,France","LAAS-CNRS, Universite de Toulouse, CNRS, Toulouse, France","Artificial and Natural Intelligence Toulouse Institute, France"],"affiliations":[{"raw_affiliation_string":"Artificial and Natural Intelligence Toulouse Institute,France","institution_ids":["https://openalex.org/I4210098964"]},{"raw_affiliation_string":"LAAS-CNRS, Universite de Toulouse, CNRS, Toulouse, France","institution_ids":["https://openalex.org/I17866349","https://openalex.org/I1294671590","https://openalex.org/I190497903"]},{"raw_affiliation_string":"Artificial and Natural Intelligence Toulouse Institute, France","institution_ids":["https://openalex.org/I84500057"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5008531364"],"corresponding_institution_ids":["https://openalex.org/I1294671590","https://openalex.org/I17866349","https://openalex.org/I190497903","https://openalex.org/I4210098964","https://openalex.org/I84500057"],"apc_list":null,"apc_paid":null,"fwci":0.6236,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.65540832,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"01","last_page":"07"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.9904000163078308,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12810","display_name":"Real-time simulation and control systems","score":0.9876000285148621,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.887782096862793},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6725446581840515},{"id":"https://openalex.org/keywords/bellman-equation","display_name":"Bellman equation","score":0.6713897585868835},{"id":"https://openalex.org/keywords/convergence","display_name":"Convergence (economics)","score":0.6324989795684814},{"id":"https://openalex.org/keywords/trajectory","display_name":"Trajectory","score":0.5727832317352295},{"id":"https://openalex.org/keywords/function-approximation","display_name":"Function approximation","score":0.5144636631011963},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.4840947389602661},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.46483373641967773},{"id":"https://openalex.org/keywords/sobolev-space","display_name":"Sobolev space","score":0.4554634988307953},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.43531981110572815},{"id":"https://openalex.org/keywords/gradient-descent","display_name":"Gradient descent","score":0.42268383502960205},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.22189146280288696},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.21237173676490784}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.887782096862793},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6725446581840515},{"id":"https://openalex.org/C14646407","wikidata":"https://www.wikidata.org/wiki/Q1430750","display_name":"Bellman equation","level":2,"score":0.6713897585868835},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.6324989795684814},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.5727832317352295},{"id":"https://openalex.org/C91873725","wikidata":"https://www.wikidata.org/wiki/Q3445816","display_name":"Function approximation","level":3,"score":0.5144636631011963},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.4840947389602661},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.46483373641967773},{"id":"https://openalex.org/C99730327","wikidata":"https://www.wikidata.org/wiki/Q1501536","display_name":"Sobolev space","level":2,"score":0.4554634988307953},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.43531981110572815},{"id":"https://openalex.org/C153258448","wikidata":"https://www.wikidata.org/wiki/Q1199743","display_name":"Gradient descent","level":3,"score":0.42268383502960205},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.22189146280288696},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.21237173676490784},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C1276947","wikidata":"https://www.wikidata.org/wiki/Q333","display_name":"Astronomy","level":1,"score":0.0},{"id":"https://openalex.org/C50522688","wikidata":"https://www.wikidata.org/wiki/Q189833","display_name":"Economic growth","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C78458016","wikidata":"https://www.wikidata.org/wiki/Q840400","display_name":"Evolutionary biology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icra46639.2022.9811993","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra46639.2022.9811993","pdf_url":null,"source":{"id":"https://openalex.org/S4363607759","display_name":"2022 International Conference on Robotics and Automation (ICRA)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":45,"referenced_works":["https://openalex.org/W1533713200","https://openalex.org/W1771410628","https://openalex.org/W1967821692","https://openalex.org/W2092196700","https://openalex.org/W2104920576","https://openalex.org/W2140256637","https://openalex.org/W2145339207","https://openalex.org/W2155007355","https://openalex.org/W2158782408","https://openalex.org/W2163577891","https://openalex.org/W2167856595","https://openalex.org/W2281096776","https://openalex.org/W2295431040","https://openalex.org/W2416477367","https://openalex.org/W2626089772","https://openalex.org/W2764255492","https://openalex.org/W2779458783","https://openalex.org/W2906487027","https://openalex.org/W2907537824","https://openalex.org/W2963165111","https://openalex.org/W2963864421","https://openalex.org/W2964043796","https://openalex.org/W2975504670","https://openalex.org/W2980297602","https://openalex.org/W2981344907","https://openalex.org/W3029641972","https://openalex.org/W3081791272","https://openalex.org/W3177004920","https://openalex.org/W4237591687","https://openalex.org/W4289303873","https://openalex.org/W4293775970","https://openalex.org/W4300309110","https://openalex.org/W6638018090","https://openalex.org/W6675999342","https://openalex.org/W6680666887","https://openalex.org/W6682849425","https://openalex.org/W6684921986","https://openalex.org/W6692846177","https://openalex.org/W6739475399","https://openalex.org/W6769596995","https://openalex.org/W6771730547","https://openalex.org/W6778083458","https://openalex.org/W6778428183","https://openalex.org/W6798090497","https://openalex.org/W6981121735"],"related_works":["https://openalex.org/W2386410636","https://openalex.org/W3038962357","https://openalex.org/W2025663273","https://openalex.org/W3099153698","https://openalex.org/W1501190258","https://openalex.org/W3021988786","https://openalex.org/W4256087190","https://openalex.org/W3099311996","https://openalex.org/W2963971282","https://openalex.org/W4240668504"],"abstract_inverted_index":{"The":[0,150],"recent":[1],"successes":[2],"in":[3,18,30,156],"deep":[4],"reinforcement":[5,40,178],"learning":[6,41,179],"largely":[7],"rely":[8],"on":[9],"the":[10,21,37,59,76,79,84,87,113,124,127,136,147,164],"capabilities":[11],"of":[12,15,23,39,45,78,86,112,126,146],"generating":[13],"masses":[14],"data,":[16],"which":[17],"turn":[19],"implies":[20],"use":[22,75,121],"a":[24,65,140,160,173],"simulator.":[25],"In":[26,68],"particular,":[27],"current":[28],"progress":[29],"multi":[31],"body":[32],"dynamic":[33],"simulators":[34,49],"are":[35,50,72],"under-pinning":[36],"implementation":[38],"for":[42,162,187],"end-to-end":[43,188],"control":[44],"robotic":[46],"systems.":[47],"Yet":[48],"mostly":[51],"considered":[52],"as":[53,159],"black":[54],"boxes":[55],"while":[56],"we":[57,71,91,120,185],"have":[58],"knowledge":[60],"to":[61,74,81,96,122,139],"make":[62],"them":[63],"produce":[64,97],"richer":[66],"information.":[67],"this":[69],"paper,":[70],"proposing":[73],"derivatives":[77],"simulator":[80],"help":[82],"with":[83],"convergence":[85,125],"learning.":[88,131],"For":[89],"that,":[90],"combine":[92],"model-based":[93],"trajectory":[94],"optimization":[95],"informative":[98],"trials":[99],"using":[100,129,181],"1st-":[101],"and":[102,116,142],"2nd-order":[103],"simulation":[104,182],"derivatives.":[105],"These":[106],"locally-optimal":[107],"runs":[108],"give":[109],"fair":[110],"estimates":[111],"value":[114,148,152],"function":[115],"its":[117],"derivatives,":[118,183],"that":[119,135,169,184],"accelerate":[123],"critics":[128],"Sobolev":[130],"We":[132,167],"empirically":[133],"demonstrate":[134],"algorithm":[137,180],"leads":[138],"faster":[141],"more":[143],"accurate":[144],"estimation":[145],"function.":[149],"resulting":[151],"estimate":[153],"is":[154,171],"used":[155],"model-predictive":[157],"controller":[158],"proxy":[161],"shortening":[163],"preview":[165],"horizon.":[166],"believe":[168],"it":[170],"also":[172],"first":[174],"step":[175],"toward":[176],"superlinear":[177],"need":[186],"legged":[189],"locomotion.":[190]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
