{"id":"https://openalex.org/W4416750229","doi":"https://doi.org/10.1109/iros60139.2025.11245856","title":"RecoveryChaining: Learning Local Recovery Policies for Robust Manipulation","display_name":"RecoveryChaining: Learning Local Recovery Policies for Robust Manipulation","publication_year":2025,"publication_date":"2025-10-19","ids":{"openalex":"https://openalex.org/W4416750229","doi":"https://doi.org/10.1109/iros60139.2025.11245856"},"language":null,"primary_location":{"id":"doi:10.1109/iros60139.2025.11245856","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros60139.2025.11245856","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5072029596","display_name":"Shivam Vats","orcid":null},"institutions":[{"id":"https://openalex.org/I175594653","display_name":"John Brown University","ror":"https://ror.org/02ct41q97","country_code":"US","type":"education","lineage":["https://openalex.org/I175594653"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Shivam Vats","raw_affiliation_strings":["Brown University"],"affiliations":[{"raw_affiliation_string":"Brown University","institution_ids":["https://openalex.org/I175594653"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010530960","display_name":"Devesh K. Jha","orcid":"https://orcid.org/0000-0002-7843-9545"},"institutions":[{"id":"https://openalex.org/I4210133125","display_name":"Mitsubishi Electric (Japan)","ror":"https://ror.org/033y26782","country_code":"JP","type":"company","lineage":["https://openalex.org/I1306287861","https://openalex.org/I4210133125"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Devesh K. Jha","raw_affiliation_strings":["Mitsubishi Electric Research Labs"],"affiliations":[{"raw_affiliation_string":"Mitsubishi Electric Research Labs","institution_ids":["https://openalex.org/I4210133125"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103257510","display_name":"Maxim Likhachev","orcid":"https://orcid.org/0000-0002-9539-2398"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Maxim Likhachev","raw_affiliation_strings":["Carnegie Mellon University,Robotics Institute"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University,Robotics Institute","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005091065","display_name":"Oliver Kroemer","orcid":"https://orcid.org/0000-0003-2007-3867"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Oliver Kroemer","raw_affiliation_strings":["Carnegie Mellon University,Robotics Institute"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University,Robotics Institute","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5114494310","display_name":"Diego Romeres","orcid":null},"institutions":[{"id":"https://openalex.org/I4210133125","display_name":"Mitsubishi Electric (Japan)","ror":"https://ror.org/033y26782","country_code":"JP","type":"company","lineage":["https://openalex.org/I1306287861","https://openalex.org/I4210133125"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Diego Romeres","raw_affiliation_strings":["Mitsubishi Electric Research Labs"],"affiliations":[{"raw_affiliation_string":"Mitsubishi Electric Research Labs","institution_ids":["https://openalex.org/I4210133125"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5072029596"],"corresponding_institution_ids":["https://openalex.org/I175594653"],"apc_list":null,"apc_paid":null,"fwci":1.3682,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.86517712,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"9776","last_page":"9783"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.6567999720573425,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.6567999720573425,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.26010000705718994,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.0333000011742115,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/observability","display_name":"Observability","score":0.7710999846458435},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.5993000268936157},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.558899998664856},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.5478000044822693},{"id":"https://openalex.org/keywords/imperfect","display_name":"Imperfect","score":0.5080000162124634},{"id":"https://openalex.org/keywords/controller","display_name":"Controller (irrigation)","score":0.5067999958992004},{"id":"https://openalex.org/keywords/state","display_name":"State (computer science)","score":0.44760000705718994},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.38850000500679016}],"concepts":[{"id":"https://openalex.org/C36299963","wikidata":"https://www.wikidata.org/wiki/Q1369844","display_name":"Observability","level":2,"score":0.7710999846458435},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6556000113487244},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.5993000268936157},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.558899998664856},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.5478000044822693},{"id":"https://openalex.org/C2780310539","wikidata":"https://www.wikidata.org/wiki/Q12547192","display_name":"Imperfect","level":2,"score":0.5080000162124634},{"id":"https://openalex.org/C203479927","wikidata":"https://www.wikidata.org/wiki/Q5165939","display_name":"Controller (irrigation)","level":2,"score":0.5067999958992004},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.44760000705718994},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.42340001463890076},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.38850000500679016},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.3513000011444092},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.34929999709129333},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.33559998869895935},{"id":"https://openalex.org/C112972136","wikidata":"https://www.wikidata.org/wiki/Q7595718","display_name":"Stability (learning theory)","level":2,"score":0.3257000148296356},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.32010000944137573},{"id":"https://openalex.org/C31531917","wikidata":"https://www.wikidata.org/wiki/Q915157","display_name":"Robust control","level":3,"score":0.30329999327659607},{"id":"https://openalex.org/C150415221","wikidata":"https://www.wikidata.org/wiki/Q40687","display_name":"Robotic arm","level":2,"score":0.2912999987602234},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.28349998593330383},{"id":"https://openalex.org/C28761237","wikidata":"https://www.wikidata.org/wiki/Q7805321","display_name":"Time horizon","level":2,"score":0.2671999931335449},{"id":"https://openalex.org/C17500928","wikidata":"https://www.wikidata.org/wiki/Q959968","display_name":"Control system","level":2,"score":0.26030001044273376}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iros60139.2025.11245856","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros60139.2025.11245856","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":19,"referenced_works":["https://openalex.org/W1762028192","https://openalex.org/W2053910308","https://openalex.org/W2069361969","https://openalex.org/W2109910161","https://openalex.org/W2295598076","https://openalex.org/W2951360122","https://openalex.org/W2968556640","https://openalex.org/W2973229164","https://openalex.org/W3129364384","https://openalex.org/W3150718622","https://openalex.org/W3168892396","https://openalex.org/W3174282793","https://openalex.org/W3190864623","https://openalex.org/W3204657926","https://openalex.org/W4252527162","https://openalex.org/W4313010279","https://openalex.org/W4383108657","https://openalex.org/W4385403811","https://openalex.org/W4394674699"],"related_works":[],"abstract_inverted_index":{"Model-based":[0],"planners":[1],"and":[2,19,37,75,132],"controllers":[3,108],"are":[4,109],"commonly":[5],"used":[6],"to":[7,21,32,44,51,56,77,81,120,123,126,128,135,137,175,179],"solve":[8],"complex":[9],"manipulation":[10,149],"problems":[11],"as":[12,111],"they":[13,26],"can":[14,87],"efficiently":[15],"optimize":[16],"diverse":[17],"objectives":[18],"generalize":[20],"long":[22],"horizon":[23],"tasks.":[24],"However,":[25],"often":[27],"fail":[28],"during":[29],"deployment":[30],"due":[31],"noisy":[33],"actuation,":[34],"partial":[35],"observability":[36],"imperfect":[38],"models.":[39],"To":[40],"enable":[41],"a":[42,58,67,82,101,129,176],"robot":[43,80,178],"recover":[45],"from":[46,84],"such":[47],"failures,":[48],"we":[49],"propose":[50],"use":[52],"hierarchical":[53],"reinforcement":[54],"learning":[55],"learn":[57],"recovery":[59,62,118,160,170],"policy.":[60],"The":[61],"policy":[63,119],"is":[64,69],"triggered":[65],"when":[66,125],"failure":[68],"detected":[70],"based":[71],"on":[72],"sensory":[73],"observations":[74],"seeks":[76],"take":[78],"the":[79,89,92,106,117,181],"state":[83],"which":[85,115,133],"it":[86,155],"complete":[88],"task":[90],"using":[91],"nominal":[93,113,130],"model-based":[94,107],"controllers.":[95],"Our":[96],"approach,":[97],"called":[98],"RecoveryChaining,":[99],"uses":[100],"hybrid":[102],"action":[103],"space,":[104],"where":[105,154],"provided":[110],"additional":[112],"options":[114],"allows":[116],"decide":[121],"how":[122],"recover,":[124],"switch":[127,136],"controller":[131,134],"even":[138],"with":[139,151,186],"sparse":[140,152],"rewards.":[141],"We":[142,167],"evaluate":[143],"our":[144,187],"approach":[145],"in":[146,173],"three":[147],"multi-step":[148],"tasks":[150],"rewards,":[153],"learns":[156],"significantly":[157],"more":[158],"robust":[159],"policies":[161,171],"than":[162],"those":[163],"learned":[164,172],"by":[165],"baselines.":[166],"successfully":[168],"transfer":[169,185],"simulation":[174],"physical":[177],"demonstrate":[180],"feasibility":[182],"of":[183],"sim-to-real":[184],"method.":[188]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-11-28T00:00:00"}
