{"id":"https://openalex.org/W4415178994","doi":"https://doi.org/10.1109/tase.2025.3620908","title":"Residual Policy Optimization With Trust Region Constraints: A Learning Framework for Stable and Agile Wheel-Legged Locomotion","display_name":"Residual Policy Optimization With Trust Region Constraints: A Learning Framework for Stable and Agile Wheel-Legged Locomotion","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4415178994","doi":"https://doi.org/10.1109/tase.2025.3620908"},"language":"en","primary_location":{"id":"doi:10.1109/tase.2025.3620908","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tase.2025.3620908","pdf_url":null,"source":{"id":"https://openalex.org/S34881539","display_name":"IEEE Transactions on Automation Science and Engineering","issn_l":"1545-5955","issn":["1545-5955","1558-3783"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Automation Science and Engineering","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5018631736","display_name":"Naifeng He","orcid":"https://orcid.org/0000-0003-3646-1899"},"institutions":[{"id":"https://openalex.org/I9842412","display_name":"Nanjing University of Aeronautics and Astronautics","ror":"https://ror.org/01scyh794","country_code":"CN","type":"education","lineage":["https://openalex.org/I9842412"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Naifeng He","raw_affiliation_strings":["College of Automation, Nanjing University of Aeronautics and Astronautics, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"College of Automation, Nanjing University of Aeronautics and Astronautics, Nanjing, China","institution_ids":["https://openalex.org/I9842412"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Zhong Yang","orcid":null},"institutions":[{"id":"https://openalex.org/I9842412","display_name":"Nanjing University of Aeronautics and Astronautics","ror":"https://ror.org/01scyh794","country_code":"CN","type":"education","lineage":["https://openalex.org/I9842412"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhong Yang","raw_affiliation_strings":["College of Automation, Nanjing University of Aeronautics and Astronautics, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"College of Automation, Nanjing University of Aeronautics and Astronautics, Nanjing, China","institution_ids":["https://openalex.org/I9842412"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5073192646","display_name":"Xiaoliang Fan","orcid":null},"institutions":[{"id":"https://openalex.org/I142078773","display_name":"Shenyang Institute of Automation","ror":"https://ror.org/00ft6nj33","country_code":"CN","type":"facility","lineage":["https://openalex.org/I142078773","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaoliang Fan","raw_affiliation_strings":["State Key Laboratory of Robotics and Intelligent Systems, Shenyang Institute of Automation, Chinese Academy of Sciences, Shenyang, China","Shenyang Institute of Automation, State Key Laboratory of Robotics and Intelligent Systems, Chinese Academy of Sciences, Shenyang, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Robotics and Intelligent Systems, Shenyang Institute of Automation, Chinese Academy of Sciences, Shenyang, China","institution_ids":["https://openalex.org/I142078773"]},{"raw_affiliation_string":"Shenyang Institute of Automation, State Key Laboratory of Robotics and Intelligent Systems, Chinese Academy of Sciences, Shenyang, China","institution_ids":["https://openalex.org/I142078773"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111537301","display_name":"W. Que","orcid":null},"institutions":[{"id":"https://openalex.org/I9842412","display_name":"Nanjing University of Aeronautics and Astronautics","ror":"https://ror.org/01scyh794","country_code":"CN","type":"education","lineage":["https://openalex.org/I9842412"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenqiang Que","raw_affiliation_strings":["College of Automation, Nanjing University of Aeronautics and Astronautics, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"College of Automation, Nanjing University of Aeronautics and Astronautics, Nanjing, China","institution_ids":["https://openalex.org/I9842412"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016140257","display_name":"Siyang Liu","orcid":"https://orcid.org/0000-0002-4050-5113"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Siyang Liu","raw_affiliation_strings":["Hong Kong University of Science and Technology (Guangzhou), Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"Hong Kong University of Science and Technology (Guangzhou), Guangzhou, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102655171","display_name":"Hongyu Xu","orcid":null},"institutions":[{"id":"https://openalex.org/I9842412","display_name":"Nanjing University of Aeronautics and Astronautics","ror":"https://ror.org/01scyh794","country_code":"CN","type":"education","lineage":["https://openalex.org/I9842412"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hongyu Xu","raw_affiliation_strings":["College of Automation, Nanjing University of Aeronautics and Astronautics, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"College of Automation, Nanjing University of Aeronautics and Astronautics, Nanjing, China","institution_ids":["https://openalex.org/I9842412"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113680366","display_name":"Chunguang Bu","orcid":"https://orcid.org/0000-0002-3880-1175"},"institutions":[{"id":"https://openalex.org/I142078773","display_name":"Shenyang Institute of Automation","ror":"https://ror.org/00ft6nj33","country_code":"CN","type":"facility","lineage":["https://openalex.org/I142078773","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chunguang Bu","raw_affiliation_strings":["State Key Laboratory of Robotics and Intelligent Systems, Shenyang Institute of Automation, Chinese Academy of Sciences, Shenyang, China","Shenyang Institute of Automation, State Key Laboratory of Robotics and Intelligent Systems, Chinese Academy of Sciences, Shenyang, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Robotics and Intelligent Systems, Shenyang Institute of Automation, Chinese Academy of Sciences, Shenyang, China","institution_ids":["https://openalex.org/I142078773"]},{"raw_affiliation_string":"Shenyang Institute of Automation, State Key Laboratory of Robotics and Intelligent Systems, Chinese Academy of Sciences, Shenyang, China","institution_ids":["https://openalex.org/I142078773"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101898281","display_name":"Bi Zhang","orcid":"https://orcid.org/0000-0001-8001-002X"},"institutions":[{"id":"https://openalex.org/I142078773","display_name":"Shenyang Institute of Automation","ror":"https://ror.org/00ft6nj33","country_code":"CN","type":"facility","lineage":["https://openalex.org/I142078773","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bi Zhang","raw_affiliation_strings":["State Key Laboratory of Robotics and Intelligent Systems, Shenyang Institute of Automation, Chinese Academy of Sciences, Shenyang, China","Shenyang Institute of Automation, State Key Laboratory of Robotics and Intelligent Systems, Chinese Academy of Sciences, Shenyang, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Robotics and Intelligent Systems, Shenyang Institute of Automation, Chinese Academy of Sciences, Shenyang, China","institution_ids":["https://openalex.org/I142078773"]},{"raw_affiliation_string":"Shenyang Institute of Automation, State Key Laboratory of Robotics and Intelligent Systems, Chinese Academy of Sciences, Shenyang, China","institution_ids":["https://openalex.org/I142078773"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5018631736"],"corresponding_institution_ids":["https://openalex.org/I9842412"],"apc_list":null,"apc_paid":null,"fwci":1.2077,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.82765895,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":"22","issue":null,"first_page":"23352","last_page":"23365"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13295","display_name":"Safety Systems Engineering in Autonomy","score":0.8736000061035156,"subfield":{"id":"https://openalex.org/subfields/2213","display_name":"Safety, Risk, Reliability and Quality"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13295","display_name":"Safety Systems Engineering in Autonomy","score":0.8736000061035156,"subfield":{"id":"https://openalex.org/subfields/2213","display_name":"Safety, Risk, Reliability and Quality"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12000","display_name":"Systems Engineering Methodologies and Applications","score":0.8730999827384949,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11450","display_name":"Model-Driven Software Engineering Techniques","score":0.8652999997138977,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/terrain","display_name":"Terrain","score":0.6496999859809875},{"id":"https://openalex.org/keywords/residual","display_name":"Residual","score":0.6395000219345093},{"id":"https://openalex.org/keywords/adaptability","display_name":"Adaptability","score":0.6050999760627747},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6028000116348267},{"id":"https://openalex.org/keywords/tree-traversal","display_name":"Tree traversal","score":0.5590999722480774},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.5489000082015991},{"id":"https://openalex.org/keywords/agile-software-development","display_name":"Agile software development","score":0.5462999939918518},{"id":"https://openalex.org/keywords/compensation","display_name":"Compensation (psychology)","score":0.5159000158309937},{"id":"https://openalex.org/keywords/tracking-error","display_name":"Tracking error","score":0.5127000212669373}],"concepts":[{"id":"https://openalex.org/C161840515","wikidata":"https://www.wikidata.org/wiki/Q186131","display_name":"Terrain","level":2,"score":0.6496999859809875},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6434999704360962},{"id":"https://openalex.org/C155512373","wikidata":"https://www.wikidata.org/wiki/Q287450","display_name":"Residual","level":2,"score":0.6395000219345093},{"id":"https://openalex.org/C177606310","wikidata":"https://www.wikidata.org/wiki/Q5674297","display_name":"Adaptability","level":2,"score":0.6050999760627747},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6028000116348267},{"id":"https://openalex.org/C140745168","wikidata":"https://www.wikidata.org/wiki/Q1210082","display_name":"Tree traversal","level":2,"score":0.5590999722480774},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.5489000082015991},{"id":"https://openalex.org/C14185376","wikidata":"https://www.wikidata.org/wiki/Q30232","display_name":"Agile software development","level":2,"score":0.5462999939918518},{"id":"https://openalex.org/C2780023022","wikidata":"https://www.wikidata.org/wiki/Q1338171","display_name":"Compensation (psychology)","level":2,"score":0.5159000158309937},{"id":"https://openalex.org/C183356978","wikidata":"https://www.wikidata.org/wiki/Q1779213","display_name":"Tracking error","level":3,"score":0.5127000212669373},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.5088000297546387},{"id":"https://openalex.org/C112972136","wikidata":"https://www.wikidata.org/wiki/Q7595718","display_name":"Stability (learning theory)","level":2,"score":0.4478999972343445},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.3815000057220459},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3781000077724457},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.3700999915599823},{"id":"https://openalex.org/C158622935","wikidata":"https://www.wikidata.org/wiki/Q660848","display_name":"Nonlinear system","level":2,"score":0.3517000079154968},{"id":"https://openalex.org/C2775936607","wikidata":"https://www.wikidata.org/wiki/Q466845","display_name":"Tracking (education)","level":2,"score":0.3476000130176544},{"id":"https://openalex.org/C172707124","wikidata":"https://www.wikidata.org/wiki/Q423488","display_name":"Actuator","level":2,"score":0.31850001215934753},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.3158999979496002},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.3070000112056732},{"id":"https://openalex.org/C81074085","wikidata":"https://www.wikidata.org/wiki/Q366872","display_name":"Motion planning","level":3,"score":0.2994999885559082},{"id":"https://openalex.org/C203479927","wikidata":"https://www.wikidata.org/wiki/Q5165939","display_name":"Controller (irrigation)","level":2,"score":0.29820001125335693},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.2904999852180481},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.26499998569488525},{"id":"https://openalex.org/C2780799671","wikidata":"https://www.wikidata.org/wiki/Q17087362","display_name":"Transient (computer programming)","level":2,"score":0.26080000400543213},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.2596000134944916},{"id":"https://openalex.org/C2779908020","wikidata":"https://www.wikidata.org/wiki/Q1424704","display_name":"Legged robot","level":3,"score":0.25940001010894775}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tase.2025.3620908","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tase.2025.3620908","pdf_url":null,"source":{"id":"https://openalex.org/S34881539","display_name":"IEEE Transactions on Automation Science and Engineering","issn_l":"1545-5955","issn":["1545-5955","1558-3783"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Automation Science and Engineering","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G273163530","display_name":null,"funder_award_id":"2025JH6/101000028","funder_id":"https://openalex.org/F4320323086","funder_display_name":"Natural Science Foundation of Liaoning Province"},{"id":"https://openalex.org/G490398268","display_name":null,"funder_award_id":"GXKJXM20230169","funder_id":"https://openalex.org/F4320330373","funder_display_name":"Research and Innovation in Science and Technology Project"},{"id":"https://openalex.org/G4998699962","display_name":null,"funder_award_id":"Grant 2025JH6/101000028","funder_id":"https://openalex.org/F4320323086","funder_display_name":"Natural Science Foundation of Liaoning Province"}],"funders":[{"id":"https://openalex.org/F4320323086","display_name":"Natural Science Foundation of Liaoning Province","ror":null},{"id":"https://openalex.org/F4320330373","display_name":"Research and Innovation in Science and Technology Project","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":45,"referenced_works":["https://openalex.org/W2035757418","https://openalex.org/W2605102758","https://openalex.org/W2767050701","https://openalex.org/W3093922502","https://openalex.org/W3127561923","https://openalex.org/W3152673644","https://openalex.org/W3161546367","https://openalex.org/W4205430897","https://openalex.org/W4206497039","https://openalex.org/W4283786226","https://openalex.org/W4283793632","https://openalex.org/W4285600796","https://openalex.org/W4292852788","https://openalex.org/W4293160779","https://openalex.org/W4312423130","https://openalex.org/W4313196885","https://openalex.org/W4378696928","https://openalex.org/W4383108274","https://openalex.org/W4383109371","https://openalex.org/W4387831910","https://openalex.org/W4390357468","https://openalex.org/W4390938336","https://openalex.org/W4392763392","https://openalex.org/W4393159608","https://openalex.org/W4394674699","https://openalex.org/W4395116617","https://openalex.org/W4396910086","https://openalex.org/W4399727781","https://openalex.org/W4401415577","https://openalex.org/W4401415792","https://openalex.org/W4401415879","https://openalex.org/W4402216758","https://openalex.org/W4402300083","https://openalex.org/W4402354103","https://openalex.org/W4402354142","https://openalex.org/W4403318432","https://openalex.org/W4404576594","https://openalex.org/W4404688052","https://openalex.org/W4405778675","https://openalex.org/W4405778837","https://openalex.org/W4405785337","https://openalex.org/W4405786631","https://openalex.org/W4405787394","https://openalex.org/W4410614007","https://openalex.org/W4413925046"],"related_works":[],"abstract_inverted_index":{"Wheel-legged":[0],"robots":[1],"integrate":[2],"the":[3,9,78,139,168],"adaptability":[4,120],"of":[5,11,73,198],"legged":[6],"locomotion":[7,40],"with":[8,58,204],"efficiency":[10],"wheeled":[12],"movement,":[13],"enabling":[14,70],"agile":[15],"traversal":[16,175],"across":[17],"diverse":[18,161],"terrains.":[19],"However,":[20],"abrupt":[21],"terrain":[22,162,174],"transitions":[23,100],"introduce":[24,90],"substantial":[25],"state":[26,49,75],"variations,":[27],"including":[28],"velocity":[29,180,195],"fluctuations,":[30],"posture":[31],"shifts,":[32],"and":[33,154,178,188,201,206,213],"slippage,":[34],"which":[35,96],"pose":[36],"significant":[37],"challenges":[38],"to":[39,84,121,149,210],"stability.":[41],"To":[42,125],"address":[43],"these":[44],"issues,":[45],"we":[46,89],"propose":[47],"a":[48,55,59,91,114,172,193],"error":[50,106,197],"compensation":[51,82],"framework":[52,110,170],"that":[53,167],"integrates":[54],"residual":[56,63,152],"network":[57,64],"trust-region":[60,79],"mechanism.":[61],"The":[62,108],"implicitly":[65],"captures":[66],"nonlinear":[67],"contact":[68],"dynamics,":[69],"real-time":[71],"correction":[72],"slippage-induced":[74],"deviations,":[76],"while":[77],"mechanism":[80],"regulates":[81],"amplitude":[83],"maintain":[85],"stable":[86,202],"locomotion.":[87],"Furthermore,":[88],"dual-source":[92],"contrastive":[93],"learning":[94,117],"strategy,":[95],"explicitly":[97],"differentiates":[98],"terrain-induced":[99],"from":[101],"external":[102],"perturbations,":[103],"facilitating":[104],"context-aware":[105],"recovery.":[107],"proposed":[109,169],"is":[111,133],"integrated":[112],"into":[113],"model-free":[115],"reinforcement":[116],"pipeline,":[118],"ensuring":[119],"previously":[122],"unseen":[123],"environments.":[124],"further":[126],"enhance":[127],"robustness,":[128],"an":[129],"uncertainty-aware":[130],"calibration":[131],"module":[132,136],"introduced.":[134],"This":[135],"dynamically":[137],"adjusts":[138],"trust":[140],"region":[141],"boundary":[142],"in":[143],"real":[144],"time,":[145],"leveraging":[146],"sensory":[147],"feedback":[148],"adaptively":[150],"constrain":[151],"corrections":[153],"prevent":[155],"over-adjustment,":[156],"thereby":[157],"maintaining":[158],"stability":[159],"during":[160],"transitions.":[163],"Experimental":[164],"results":[165],"demonstrate":[166],"achieves":[171],"96.7%":[173],"success":[176],"rate":[177],"92%":[179],"tracking":[181,196],"accuracy":[182],"under":[183],"dynamic":[184],"disturbances.":[185],"On":[186],"unstructured":[187],"mixed":[189],"terrains,":[190],"it":[191],"maintains":[192],"mean":[194],"0.15":[199],"m/s":[200],"posture,":[203],"pitch":[205],"roll":[207],"angles":[208],"constrained":[209],"\u00b10.04":[211],"rad":[212],"\u00b10.02":[214],"rad,":[215],"respectively.":[216]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-04-16T08:26:57.006410","created_date":"2025-10-15T00:00:00"}
