{"id":"https://openalex.org/W4414322693","doi":"https://doi.org/10.1109/ecmr65884.2025.11163057","title":"End-to-End Multi-Task Policy Learning from NMPC for Quadruped Locomotion","display_name":"End-to-End Multi-Task Policy Learning from NMPC for Quadruped Locomotion","publication_year":2025,"publication_date":"2025-09-02","ids":{"openalex":"https://openalex.org/W4414322693","doi":"https://doi.org/10.1109/ecmr65884.2025.11163057"},"language":"en","primary_location":{"id":"doi:10.1109/ecmr65884.2025.11163057","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ecmr65884.2025.11163057","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 European Conference on Mobile Robots (ECMR)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://pub.h-brs.de/frontdoor/index/index/docId/9015","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5119665450","display_name":"Anudeep Sajja","orcid":null},"institutions":[{"id":"https://openalex.org/I155417937","display_name":"Hochschule Bonn-Rhein-Sieg","ror":"https://ror.org/04m2anh63","country_code":"DE","type":"education","lineage":["https://openalex.org/I155417937"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Anudeep Sajja","raw_affiliation_strings":["Bonn-Rhein-Sieg University of Applied Sciences,Institute for Artificial Intelligence and Autonomous Systems (A2S),Sankt Augustin,Germany"],"affiliations":[{"raw_affiliation_string":"Bonn-Rhein-Sieg University of Applied Sciences,Institute for Artificial Intelligence and Autonomous Systems (A2S),Sankt Augustin,Germany","institution_ids":["https://openalex.org/I155417937"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046601607","display_name":"Shahram Khorshidi","orcid":null},"institutions":[{"id":"https://openalex.org/I135140700","display_name":"University of Bonn","ror":"https://ror.org/041nas322","country_code":"DE","type":"education","lineage":["https://openalex.org/I135140700"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Shahram Khorshidi","raw_affiliation_strings":["University of Bonn,Humanoid Robots Lab,Germany"],"affiliations":[{"raw_affiliation_string":"University of Bonn,Humanoid Robots Lab,Germany","institution_ids":["https://openalex.org/I135140700"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020225503","display_name":"Sebastian Houben","orcid":"https://orcid.org/0000-0002-2036-419X"},"institutions":[{"id":"https://openalex.org/I155417937","display_name":"Hochschule Bonn-Rhein-Sieg","ror":"https://ror.org/04m2anh63","country_code":"DE","type":"education","lineage":["https://openalex.org/I155417937"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Sebastian Houben","raw_affiliation_strings":["Bonn-Rhein-Sieg University of Applied Sciences,Institute for Artificial Intelligence and Autonomous Systems (A2S),Sankt Augustin,Germany"],"affiliations":[{"raw_affiliation_string":"Bonn-Rhein-Sieg University of Applied Sciences,Institute for Artificial Intelligence and Autonomous Systems (A2S),Sankt Augustin,Germany","institution_ids":["https://openalex.org/I155417937"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5103231515","display_name":"Maren Bennewitz","orcid":"https://orcid.org/0000-0003-4343-3028"},"institutions":[{"id":"https://openalex.org/I135140700","display_name":"University of Bonn","ror":"https://ror.org/041nas322","country_code":"DE","type":"education","lineage":["https://openalex.org/I135140700"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Maren Bennewitz","raw_affiliation_strings":["University of Bonn,Humanoid Robots Lab,Germany"],"affiliations":[{"raw_affiliation_string":"University of Bonn,Humanoid Robots Lab,Germany","institution_ids":["https://openalex.org/I135140700"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5119665450"],"corresponding_institution_ids":["https://openalex.org/I155417937"],"apc_list":null,"apc_paid":null,"fwci":1.1617,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.82694635,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13382","display_name":"Robotics and Automated Systems","score":0.9498999714851379,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13382","display_name":"Robotics and Automated Systems","score":0.9498999714851379,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.942300021648407,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9355000257492065,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.6086999773979187},{"id":"https://openalex.org/keywords/model-predictive-control","display_name":"Model predictive control","score":0.5792999863624573},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.505299985408783},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5029000043869019},{"id":"https://openalex.org/keywords/software-deployment","display_name":"Software deployment","score":0.4830999970436096},{"id":"https://openalex.org/keywords/traverse","display_name":"Traverse","score":0.4675000011920929},{"id":"https://openalex.org/keywords/nonlinear-system","display_name":"Nonlinear system","score":0.42239999771118164},{"id":"https://openalex.org/keywords/gait","display_name":"Gait","score":0.41110000014305115},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.3921000063419342}],"concepts":[{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.6086999773979187},{"id":"https://openalex.org/C172205157","wikidata":"https://www.wikidata.org/wiki/Q1782962","display_name":"Model predictive control","level":3,"score":0.5792999863624573},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5698999762535095},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.505299985408783},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5029000043869019},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.4830999970436096},{"id":"https://openalex.org/C176809094","wikidata":"https://www.wikidata.org/wiki/Q15401496","display_name":"Traverse","level":2,"score":0.4675000011920929},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4666000008583069},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.45170000195503235},{"id":"https://openalex.org/C158622935","wikidata":"https://www.wikidata.org/wiki/Q660848","display_name":"Nonlinear system","level":2,"score":0.42239999771118164},{"id":"https://openalex.org/C151800584","wikidata":"https://www.wikidata.org/wiki/Q2370000","display_name":"Gait","level":2,"score":0.41110000014305115},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.3921000063419342},{"id":"https://openalex.org/C2984755018","wikidata":"https://www.wikidata.org/wiki/Q17118374","display_name":"Nonlinear model","level":3,"score":0.3806999921798706},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.37619999051094055},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.3734999895095825},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.33640000224113464},{"id":"https://openalex.org/C65401140","wikidata":"https://www.wikidata.org/wiki/Q7353385","display_name":"Robot control","level":4,"score":0.3246000111103058},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.3221000134944916},{"id":"https://openalex.org/C6683253","wikidata":"https://www.wikidata.org/wiki/Q7075535","display_name":"Obstacle avoidance","level":4,"score":0.3133000135421753},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.31209999322891235},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.30000001192092896},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2973000109195709},{"id":"https://openalex.org/C2776650193","wikidata":"https://www.wikidata.org/wiki/Q264661","display_name":"Obstacle","level":2,"score":0.27900001406669617},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.27730000019073486},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.27570000290870667},{"id":"https://openalex.org/C6101204","wikidata":"https://www.wikidata.org/wiki/Q7353391","display_name":"Robot locomotion","level":5,"score":0.2678000032901764},{"id":"https://openalex.org/C81074085","wikidata":"https://www.wikidata.org/wiki/Q366872","display_name":"Motion planning","level":3,"score":0.2639999985694885},{"id":"https://openalex.org/C79487989","wikidata":"https://www.wikidata.org/wiki/Q934680","display_name":"Vehicle dynamics","level":2,"score":0.2623000144958496},{"id":"https://openalex.org/C147168706","wikidata":"https://www.wikidata.org/wiki/Q1457734","display_name":"Recurrent neural network","level":3,"score":0.260699987411499}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1109/ecmr65884.2025.11163057","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ecmr65884.2025.11163057","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 European Conference on Mobile Robots (ECMR)","raw_type":"proceedings-article"},{"id":"pmh:oai:pub.h-brs.de:9015","is_oa":true,"landing_page_url":"https://pub.h-brs.de/frontdoor/index/index/docId/9015","pdf_url":null,"source":{"id":"https://openalex.org/S4306400385","display_name":"Publication Server of Bonn-Rhein-Sieg University of Applied Sciences (Bonn-Rhein-Sieg University of Applied Sciences)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I135140700","host_organization_name":"University of Bonn","host_organization_lineage":["https://openalex.org/I135140700"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"ISSN 2331-8422","raw_type":"doc-type:preprint"},{"id":"pmh:oai:pub.h-brs.de:9241","is_oa":false,"landing_page_url":"https://pub.h-brs.de/frontdoor/index/index/docId/9241","pdf_url":null,"source":{"id":"https://openalex.org/S4306400385","display_name":"Publication Server of Bonn-Rhein-Sieg University of Applied Sciences (Bonn-Rhein-Sieg University of Applied Sciences)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I135140700","host_organization_name":"University of Bonn","host_organization_lineage":["https://openalex.org/I135140700"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"2025 European Conference on Mobile Robots (ECMR), 02-05 September 2025, Padova, Italy","raw_type":"doc-type:conferenceobject"},{"id":"pmh:oai:publica.fraunhofer.de:publica/497564","is_oa":false,"landing_page_url":"https://publica.fraunhofer.de/handle/publica/497564","pdf_url":null,"source":{"id":"https://openalex.org/S4306400318","display_name":"Fraunhofer-Publica (Fraunhofer-Gesellschaft)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4923324","host_organization_name":"Fraunhofer-Gesellschaft","host_organization_lineage":["https://openalex.org/I4923324"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"conference paper"}],"best_oa_location":{"id":"pmh:oai:pub.h-brs.de:9015","is_oa":true,"landing_page_url":"https://pub.h-brs.de/frontdoor/index/index/docId/9015","pdf_url":null,"source":{"id":"https://openalex.org/S4306400385","display_name":"Publication Server of Bonn-Rhein-Sieg University of Applied Sciences (Bonn-Rhein-Sieg University of Applied Sciences)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I135140700","host_organization_name":"University of Bonn","host_organization_lineage":["https://openalex.org/I135140700"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"ISSN 2331-8422","raw_type":"doc-type:preprint"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321408","display_name":"Ministry of Education","ror":"https://ror.org/01p262204"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":19,"referenced_works":["https://openalex.org/W2029517350","https://openalex.org/W2149606028","https://openalex.org/W2571115941","https://openalex.org/W2911087563","https://openalex.org/W3093922502","https://openalex.org/W3141797743","https://openalex.org/W3142410314","https://openalex.org/W3201541172","https://openalex.org/W4226143977","https://openalex.org/W4289522461","https://openalex.org/W4300892751","https://openalex.org/W4313639240","https://openalex.org/W4378696928","https://openalex.org/W4383108391","https://openalex.org/W4387682164","https://openalex.org/W4389665904","https://openalex.org/W4405785263","https://openalex.org/W4406779533","https://openalex.org/W4413917243"],"related_works":[],"abstract_inverted_index":{"Quadruped":[0],"robots":[1,10],"excel":[2],"in":[3,64,78,115],"traversing":[4],"complex,":[5],"unstructured":[6],"environments":[7],"where":[8],"wheeled":[9],"often":[11],"fail.":[12],"However,":[13],"enabling":[14],"efficient":[15],"and":[16,31,58,117,132],"adaptable":[17],"locomotion":[18,96],"remains":[19],"challenging":[20],"due":[21],"to":[22,85,91],"the":[23,32,110,134],"quadrupeds'":[24],"nonlinear":[25],"dynamics,":[26],"high":[27,59,152],"degrees":[28],"of":[29,35,164],"freedom,":[30],"computational":[33,60],"demands":[34],"real-time":[36,138],"control.":[37],"Optimization-based":[38],"controllers,":[39],"such":[40],"as":[41],"Nonlinear":[42],"Model":[43],"Predictive":[44],"Control":[45],"(NMPC),":[46],"have":[47],"shown":[48],"strong":[49],"performance,":[50],"but":[51],"their":[52],"reliance":[53],"on":[54,109,118],"accurate":[55],"state":[56],"estimation":[57],"overhead":[61],"makes":[62],"deployment":[63],"real-world":[65],"settings":[66],"challenging.":[67],"In":[68],"this":[69,165],"work,":[70],"we":[71],"present":[72],"a":[73,87,148],"Multi-Task":[74],"Learning":[75],"(MTL)":[76],"framework":[77],"which":[79],"expert":[80,126],"NMPC":[81],"demonstrations":[82],"are":[83],"used":[84],"train":[86],"single":[88],"neural":[89],"network":[90],"predict":[92],"actions":[93],"for":[94,137,155],"multiple":[95],"behaviors":[97],"directly":[98],"from":[99],"raw":[100],"proprioceptive":[101],"sensor":[102],"inputs.":[103],"We":[104],"evaluate":[105],"our":[106],"approach":[107],"extensively":[108],"quadruped":[111],"robot":[112],"Go1,":[113],"both":[114],"simulation":[116],"real":[119],"hardware,":[120],"demonstrating":[121],"that":[122],"it":[123],"accurately":[124],"reproduces":[125],"behavior,":[127],"allows":[128],"smooth":[129],"gait":[130],"switching,":[131],"simplifies":[133],"control":[135],"pipeline":[136],"deployment.":[139],"Our":[140],"MTL":[141],"architecture":[142],"enables":[143],"learning":[144],"diverse":[145],"gaits":[146],"within":[147],"unified":[149],"policy,":[150],"achieving":[151],"R<sup>2</sup>":[153],"scores":[154],"predicted":[156],"joint":[157],"targets":[158],"across":[159],"all":[160],"tasks.":[161],"The":[162],"results":[163],"research":[166],"can":[167],"be":[168],"found":[169],"here.":[170]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
