{"id":"https://openalex.org/W4405778675","doi":"https://doi.org/10.1109/iros58592.2024.10802334","title":"CaT: Constraints as Terminations for Legged Locomotion Reinforcement Learning","display_name":"CaT: Constraints as Terminations for Legged Locomotion Reinforcement Learning","publication_year":2024,"publication_date":"2024-10-14","ids":{"openalex":"https://openalex.org/W4405778675","doi":"https://doi.org/10.1109/iros58592.2024.10802334"},"language":"en","primary_location":{"id":"doi:10.1109/iros58592.2024.10802334","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros58592.2024.10802334","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://laas.hal.science/hal-04523167/document","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5072932583","display_name":"Elliot Chane-Sane","orcid":null},"institutions":[{"id":"https://openalex.org/I190497903","display_name":"Laboratoire d'Analyse et d'Architecture des Syst\u00e8mes","ror":"https://ror.org/03vcm6439","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I134560555","https://openalex.org/I190497903","https://openalex.org/I196454796","https://openalex.org/I205747304","https://openalex.org/I205747304","https://openalex.org/I4210095849","https://openalex.org/I4210159245","https://openalex.org/I4387153255","https://openalex.org/I4405258862","https://openalex.org/I4405258862","https://openalex.org/I4405258862","https://openalex.org/I4405258862"]},{"id":"https://openalex.org/I17866349","display_name":"Universit\u00e9 F\u00e9d\u00e9rale de Toulouse Midi-Pyr\u00e9n\u00e9es","ror":"https://ror.org/004raaa70","country_code":"FR","type":"education","lineage":["https://openalex.org/I17866349"]},{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590"]}],"countries":["FR"],"is_corresponding":true,"raw_author_name":"Elliot Chane-Sane","raw_affiliation_strings":["Universit&#x00E9; de Toulouse,LAAS-CNRS,Toulouse,France,31400"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Universit&#x00E9; de Toulouse,LAAS-CNRS,Toulouse,France,31400","institution_ids":["https://openalex.org/I17866349","https://openalex.org/I1294671590","https://openalex.org/I190497903"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021493522","display_name":"Pierre\u2010Alexandre L\u00e9ziart","orcid":"https://orcid.org/0000-0002-5653-4613"},"institutions":[{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590"]},{"id":"https://openalex.org/I17866349","display_name":"Universit\u00e9 F\u00e9d\u00e9rale de Toulouse Midi-Pyr\u00e9n\u00e9es","ror":"https://ror.org/004raaa70","country_code":"FR","type":"education","lineage":["https://openalex.org/I17866349"]},{"id":"https://openalex.org/I190497903","display_name":"Laboratoire d'Analyse et d'Architecture des Syst\u00e8mes","ror":"https://ror.org/03vcm6439","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I134560555","https://openalex.org/I190497903","https://openalex.org/I196454796","https://openalex.org/I205747304","https://openalex.org/I205747304","https://openalex.org/I4210095849","https://openalex.org/I4210159245","https://openalex.org/I4387153255","https://openalex.org/I4405258862","https://openalex.org/I4405258862","https://openalex.org/I4405258862","https://openalex.org/I4405258862"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Pierre-Alexandre Leziart","raw_affiliation_strings":["Universit&#x00E9; de Toulouse,LAAS-CNRS,Toulouse,France,31400"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Universit&#x00E9; de Toulouse,LAAS-CNRS,Toulouse,France,31400","institution_ids":["https://openalex.org/I17866349","https://openalex.org/I1294671590","https://openalex.org/I190497903"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053901723","display_name":"Thomas Flayols","orcid":"https://orcid.org/0000-0001-8078-2206"},"institutions":[{"id":"https://openalex.org/I17866349","display_name":"Universit\u00e9 F\u00e9d\u00e9rale de Toulouse Midi-Pyr\u00e9n\u00e9es","ror":"https://ror.org/004raaa70","country_code":"FR","type":"education","lineage":["https://openalex.org/I17866349"]},{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590"]},{"id":"https://openalex.org/I190497903","display_name":"Laboratoire d'Analyse et d'Architecture des Syst\u00e8mes","ror":"https://ror.org/03vcm6439","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I134560555","https://openalex.org/I190497903","https://openalex.org/I196454796","https://openalex.org/I205747304","https://openalex.org/I205747304","https://openalex.org/I4210095849","https://openalex.org/I4210159245","https://openalex.org/I4387153255","https://openalex.org/I4405258862","https://openalex.org/I4405258862","https://openalex.org/I4405258862","https://openalex.org/I4405258862"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Thomas Flayols","raw_affiliation_strings":["Universit&#x00E9; de Toulouse,LAAS-CNRS,Toulouse,France,31400"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Universit&#x00E9; de Toulouse,LAAS-CNRS,Toulouse,France,31400","institution_ids":["https://openalex.org/I17866349","https://openalex.org/I1294671590","https://openalex.org/I190497903"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071048560","display_name":"Olivier Stasse","orcid":"https://orcid.org/0000-0001-8569-6155"},"institutions":[{"id":"https://openalex.org/I17866349","display_name":"Universit\u00e9 F\u00e9d\u00e9rale de Toulouse Midi-Pyr\u00e9n\u00e9es","ror":"https://ror.org/004raaa70","country_code":"FR","type":"education","lineage":["https://openalex.org/I17866349"]},{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590"]},{"id":"https://openalex.org/I190497903","display_name":"Laboratoire d'Analyse et d'Architecture des Syst\u00e8mes","ror":"https://ror.org/03vcm6439","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I134560555","https://openalex.org/I190497903","https://openalex.org/I196454796","https://openalex.org/I205747304","https://openalex.org/I205747304","https://openalex.org/I4210095849","https://openalex.org/I4210159245","https://openalex.org/I4387153255","https://openalex.org/I4405258862","https://openalex.org/I4405258862","https://openalex.org/I4405258862","https://openalex.org/I4405258862"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Olivier Stasse","raw_affiliation_strings":["Universit&#x00E9; de Toulouse,LAAS-CNRS,Toulouse,France,31400"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Universit&#x00E9; de Toulouse,LAAS-CNRS,Toulouse,France,31400","institution_ids":["https://openalex.org/I17866349","https://openalex.org/I1294671590","https://openalex.org/I190497903"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014128188","display_name":"Philippe Sou\u00e8res","orcid":"https://orcid.org/0000-0001-9064-4405"},"institutions":[{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590"]},{"id":"https://openalex.org/I17866349","display_name":"Universit\u00e9 F\u00e9d\u00e9rale de Toulouse Midi-Pyr\u00e9n\u00e9es","ror":"https://ror.org/004raaa70","country_code":"FR","type":"education","lineage":["https://openalex.org/I17866349"]},{"id":"https://openalex.org/I190497903","display_name":"Laboratoire d'Analyse et d'Architecture des Syst\u00e8mes","ror":"https://ror.org/03vcm6439","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I134560555","https://openalex.org/I190497903","https://openalex.org/I196454796","https://openalex.org/I205747304","https://openalex.org/I205747304","https://openalex.org/I4210095849","https://openalex.org/I4210159245","https://openalex.org/I4387153255","https://openalex.org/I4405258862","https://openalex.org/I4405258862","https://openalex.org/I4405258862","https://openalex.org/I4405258862"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Philippe Sou\u00e8res","raw_affiliation_strings":["Universit&#x00E9; de Toulouse,LAAS-CNRS,Toulouse,France,31400"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Universit&#x00E9; de Toulouse,LAAS-CNRS,Toulouse,France,31400","institution_ids":["https://openalex.org/I17866349","https://openalex.org/I1294671590","https://openalex.org/I190497903"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5046876471","display_name":"Nicolas Mansard","orcid":"https://orcid.org/0000-0002-8090-0601"},"institutions":[{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590"]},{"id":"https://openalex.org/I190497903","display_name":"Laboratoire d'Analyse et d'Architecture des Syst\u00e8mes","ror":"https://ror.org/03vcm6439","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I134560555","https://openalex.org/I190497903","https://openalex.org/I196454796","https://openalex.org/I205747304","https://openalex.org/I205747304","https://openalex.org/I4210095849","https://openalex.org/I4210159245","https://openalex.org/I4387153255","https://openalex.org/I4405258862","https://openalex.org/I4405258862","https://openalex.org/I4405258862","https://openalex.org/I4405258862"]},{"id":"https://openalex.org/I17866349","display_name":"Universit\u00e9 F\u00e9d\u00e9rale de Toulouse Midi-Pyr\u00e9n\u00e9es","ror":"https://ror.org/004raaa70","country_code":"FR","type":"education","lineage":["https://openalex.org/I17866349"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Nicolas Mansard","raw_affiliation_strings":["Universit&#x00E9; de Toulouse,LAAS-CNRS,Toulouse,France,31400"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Universit&#x00E9; de Toulouse,LAAS-CNRS,Toulouse,France,31400","institution_ids":["https://openalex.org/I17866349","https://openalex.org/I1294671590","https://openalex.org/I190497903"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5072932583"],"corresponding_institution_ids":["https://openalex.org/I1294671590","https://openalex.org/I17866349","https://openalex.org/I190497903"],"apc_list":null,"apc_paid":null,"fwci":3.1156,"has_fulltext":true,"cited_by_count":18,"citation_normalized_percentile":{"value":0.92264347,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"13303","last_page":"13310"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12784","display_name":"Modular Robots and Swarm Intelligence","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/2210","display_name":"Mechanical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8176651000976562},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6160929799079895},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.5280250906944275},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.39789363741874695},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.20537325739860535},{"id":"https://openalex.org/keywords/structural-engineering","display_name":"Structural engineering","score":0.13761043548583984}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8176651000976562},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6160929799079895},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.5280250906944275},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.39789363741874695},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.20537325739860535},{"id":"https://openalex.org/C66938386","wikidata":"https://www.wikidata.org/wiki/Q633538","display_name":"Structural engineering","level":1,"score":0.13761043548583984}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/iros58592.2024.10802334","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros58592.2024.10802334","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},{"id":"pmh:oai:HAL:hal-04523167v1","is_oa":true,"landing_page_url":"https://laas.hal.science/hal-04523167","pdf_url":"https://laas.hal.science/hal-04523167/document","source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"2024 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS), IEEE, Oct 2024, Abu Dhabi, Emirats Arabes Unis, United Arab Emirates. pp.13303-13310, &#x27E8;10.1109/IROS58592.2024.10802334&#x27E9;","raw_type":"Conference papers"},{"id":"pmh:oai:zenodo.org:15175521","is_oa":true,"landing_page_url":"https://doi.org/10.1109/IROS58592.2024.10802334","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IROS, IEEE/RSJ International Conference on Intelligent Robots and Systems, Abudhabi","raw_type":"info:eu-repo/semantics/other"}],"best_oa_location":{"id":"pmh:oai:HAL:hal-04523167v1","is_oa":true,"landing_page_url":"https://laas.hal.science/hal-04523167","pdf_url":"https://laas.hal.science/hal-04523167/document","source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"2024 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS), IEEE, Oct 2024, Abu Dhabi, Emirats Arabes Unis, United Arab Emirates. pp.13303-13310, &#x27E8;10.1109/IROS58592.2024.10802334&#x27E9;","raw_type":"Conference papers"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1938070154","display_name":null,"funder_award_id":"ANR-19-P3IA-0004","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"},{"id":"https://openalex.org/G3023330841","display_name":"Robot motion with physical interactions and social adaptation","funder_award_id":"ANR-22-EXOD-0006","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"},{"id":"https://openalex.org/G3441976835","display_name":null,"funder_award_id":"10-EQPX-44-01","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"},{"id":"https://openalex.org/G3896488107","display_name":null,"funder_award_id":"ANR-21-ESRE-0015","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"},{"id":"https://openalex.org/G4668411266","display_name":"Dynamograde - The force in walking","funder_award_id":"ANR-21-LCV3-0002","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"},{"id":"https://openalex.org/G5183769820","display_name":null,"funder_award_id":"ANR-10-EQPX-44-01","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"},{"id":"https://openalex.org/G693040958","display_name":null,"funder_award_id":"ANR-10-EQPX-44","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"},{"id":"https://openalex.org/G7240651115","display_name":null,"funder_award_id":"ANR-10","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"},{"id":"https://openalex.org/G8318455765","display_name":null,"funder_award_id":"ANR-19","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"},{"id":"https://openalex.org/G8510727784","display_name":null,"funder_award_id":"ANR-10-EQPX","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"}],"funders":[{"id":"https://openalex.org/F4320320883","display_name":"Agence Nationale de la Recherche","ror":"https://ror.org/00rbzpz17"},{"id":"https://openalex.org/F4320326256","display_name":"Grand \u00c9quipement National De Calcul Intensif","ror":"https://ror.org/0010d1q40"},{"id":"https://openalex.org/F4320328356","display_name":"R\u00e9gion Occitanie Pyr\u00e9n\u00e9es-M\u00e9diterran\u00e9e","ror":null}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4405778675.pdf"},"referenced_works_count":66,"referenced_works":["https://openalex.org/W2049606892","https://openalex.org/W2099506495","https://openalex.org/W2133859362","https://openalex.org/W2158782408","https://openalex.org/W2296073425","https://openalex.org/W2529220408","https://openalex.org/W2736601468","https://openalex.org/W2767050701","https://openalex.org/W2769646558","https://openalex.org/W2804791273","https://openalex.org/W2963184939","https://openalex.org/W2963575966","https://openalex.org/W2977389550","https://openalex.org/W2998619042","https://openalex.org/W3007035358","https://openalex.org/W3039737909","https://openalex.org/W3089750699","https://openalex.org/W3101442004","https://openalex.org/W3101798601","https://openalex.org/W3105372678","https://openalex.org/W3123742938","https://openalex.org/W3125490529","https://openalex.org/W3134580056","https://openalex.org/W3162902207","https://openalex.org/W3175254947","https://openalex.org/W3204973825","https://openalex.org/W3209211683","https://openalex.org/W3213974477","https://openalex.org/W4226250682","https://openalex.org/W4252189904","https://openalex.org/W4283787029","https://openalex.org/W4285600796","https://openalex.org/W4286373058","https://openalex.org/W4286423847","https://openalex.org/W4287113927","https://openalex.org/W4293566197","https://openalex.org/W4309323738","https://openalex.org/W4312900898","https://openalex.org/W4313196885","https://openalex.org/W4385430550","https://openalex.org/W4385475819","https://openalex.org/W4386721362","https://openalex.org/W4387158111","https://openalex.org/W4389627470","https://openalex.org/W4389667415","https://openalex.org/W4390481291","https://openalex.org/W4390730760","https://openalex.org/W4392763392","https://openalex.org/W4396910086","https://openalex.org/W4401415792","https://openalex.org/W4401416668","https://openalex.org/W4402354142","https://openalex.org/W6687063787","https://openalex.org/W6737893269","https://openalex.org/W6741002519","https://openalex.org/W6747473740","https://openalex.org/W6751725685","https://openalex.org/W6797154179","https://openalex.org/W6800004206","https://openalex.org/W6801964084","https://openalex.org/W6802654813","https://openalex.org/W6846664724","https://openalex.org/W6857202355","https://openalex.org/W6857483907","https://openalex.org/W6857635845","https://openalex.org/W6859300450"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W4310083477","https://openalex.org/W2328553770","https://openalex.org/W2920061524","https://openalex.org/W1977959518","https://openalex.org/W2038908348","https://openalex.org/W2107890255","https://openalex.org/W2106552856"],"abstract_inverted_index":{"Deep":[0],"Reinforcement":[1],"Learning":[2],"(RL)":[3],"has":[4],"demonstrated":[5],"impressive":[6],"results":[7],"in":[8,99],"solving":[9],"complex":[10],"robotic":[11],"tasks":[12],"such":[13],"as":[14,42,103],"quadruped":[15,133],"locomotion.":[16],"Yet,":[17],"current":[18],"solvers":[19],"fail":[20],"to":[21,88,110,124],"produce":[22],"efficient":[23],"policies":[24],"respecting":[25],"hard":[26],"constraints.":[27],"In":[28],"this":[29,89],"work,":[30],"we":[31,56,139],"advocate":[32],"for":[33,147],"integrating":[34],"constraints":[35,58,149],"into":[36,150],"robot":[37,100,134],"learning":[38,101],"and":[39,118,154],"present":[40],"Constraints":[41],"Terminations":[43],"(CaT),":[44],"a":[45,68,71,144],"novel":[46],"constrained":[47,53],"RL":[48,54,79,97,151],"algorithm.":[49],"Departing":[50],"from":[51],"classical":[52],"formulations,":[55],"reformulate":[57],"through":[59],"stochastic":[60],"terminations":[61],"during":[62],"policy":[63],"learning:":[64],"any":[65],"violation":[66],"of":[67,73],"constraint":[69,112],"triggers":[70],"probability":[72],"terminating":[74],"potential":[75],"future":[76],"rewards":[77],"the":[78,131],"agent":[80],"could":[81],"attain.":[82],"We":[83],"propose":[84],"an":[85],"algorithmic":[86],"approach":[87,108],"formulation,":[90],"by":[91],"minimally":[92],"modifying":[93],"widely":[94],"used":[95],"off-the-shelf":[96],"algorithms":[98],"(such":[102],"Proximal":[104],"Policy":[105],"Optimization).":[106],"Our":[107],"leads":[109],"excellent":[111],"adherence":[113],"without":[114],"introducing":[115],"undue":[116],"complexity":[117],"computational":[119],"overhead,":[120],"thus":[121],"mitigating":[122],"barriers":[123],"broader":[125],"adoption.":[126],"Through":[127],"empirical":[128],"evaluation":[129],"on":[130],"real":[132],"Solo":[135],"crossing":[136],"challenging":[137],"obstacles,":[138],"demonstrate":[140],"that":[141],"CaT":[142],"provides":[143],"compelling":[145],"solution":[146],"incorporating":[148],"frameworks.":[152],"Videos":[153],"code":[155],"are":[156],"available":[157],"at":[158],"constraints-as-terminations.github.io.":[159]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":15}],"updated_date":"2026-05-07T13:39:58.223016","created_date":"2025-10-10T00:00:00"}
