{"id":"https://openalex.org/W7130728162","doi":"https://doi.org/10.1109/lra.2026.3666686","title":"VPIES: Variational Privileged Information Encoder as Scaffold for Legged Locomotion Learning","display_name":"VPIES: Variational Privileged Information Encoder as Scaffold for Legged Locomotion Learning","publication_year":2026,"publication_date":"2026-02-20","ids":{"openalex":"https://openalex.org/W7130728162","doi":"https://doi.org/10.1109/lra.2026.3666686"},"language":null,"primary_location":{"id":"doi:10.1109/lra.2026.3666686","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2026.3666686","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5030583825","display_name":"Yubiao Ma","orcid":null},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yubiao Ma","raw_affiliation_strings":["School of Automation, Beijing Institute of Technology, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Automation, Beijing Institute of Technology, Beijing, China","institution_ids":["https://openalex.org/I125839683"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126518550","display_name":"Han Yu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210126065","display_name":"Shanghai Electric (China)","ror":"https://ror.org/0314qy595","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210126065"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Han Yu","raw_affiliation_strings":["Humanoid Robotics (Shanghai) Company, Ltd., Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Humanoid Robotics (Shanghai) Company, Ltd., Shanghai, China","institution_ids":["https://openalex.org/I4210126065"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126506013","display_name":"Kai Guo","orcid":null},"institutions":[{"id":"https://openalex.org/I154099455","display_name":"Shandong University","ror":"https://ror.org/0207yh398","country_code":"CN","type":"education","lineage":["https://openalex.org/I154099455"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kai Guo","raw_affiliation_strings":["School of Mechanical Engineering, Shandong University, Jinan, China"],"affiliations":[{"raw_affiliation_string":"School of Mechanical Engineering, Shandong University, Jinan, China","institution_ids":["https://openalex.org/I154099455"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101754705","display_name":"Boyang Xing","orcid":"https://orcid.org/0000-0003-0495-8040"},"institutions":[{"id":"https://openalex.org/I4210126065","display_name":"Shanghai Electric (China)","ror":"https://ror.org/0314qy595","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210126065"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Boyang Xing","raw_affiliation_strings":["Humanoid Robotics (Shanghai) Company, Ltd., Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Humanoid Robotics (Shanghai) Company, Ltd., Shanghai, China","institution_ids":["https://openalex.org/I4210126065"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5122860625","display_name":"Xuemei Ren","orcid":null},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xuemei Ren","raw_affiliation_strings":["School of Automation, Beijing Institute of Technology, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Automation, Beijing Institute of Technology, Beijing, China","institution_ids":["https://openalex.org/I125839683"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5126450675","display_name":"Dongdong Zheng","orcid":null},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dongdong Zheng","raw_affiliation_strings":["School of Automation, Beijing Institute of Technology, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Automation, Beijing Institute of Technology, Beijing, China","institution_ids":["https://openalex.org/I125839683"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5030583825"],"corresponding_institution_ids":["https://openalex.org/I125839683"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.63526972,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"11","issue":"4","first_page":"5119","last_page":"5126"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.9768999814987183,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.9768999814987183,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10709","display_name":"Social Robot Interaction and HRI","score":0.003700000001117587,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.003100000089034438,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.670199990272522},{"id":"https://openalex.org/keywords/humanoid-robot","display_name":"Humanoid robot","score":0.5914999842643738},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.5764999985694885},{"id":"https://openalex.org/keywords/software-deployment","display_name":"Software deployment","score":0.489300012588501},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.4555000066757202},{"id":"https://openalex.org/keywords/agile-software-development","display_name":"Agile software development","score":0.4544999897480011},{"id":"https://openalex.org/keywords/terrain","display_name":"Terrain","score":0.4198000133037567},{"id":"https://openalex.org/keywords/inverted-pendulum","display_name":"Inverted pendulum","score":0.38769999146461487},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.38119998574256897}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6718999743461609},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.670199990272522},{"id":"https://openalex.org/C60692881","wikidata":"https://www.wikidata.org/wiki/Q584529","display_name":"Humanoid robot","level":3,"score":0.5914999842643738},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.5764999985694885},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.489300012588501},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.47620001435279846},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.4555000066757202},{"id":"https://openalex.org/C14185376","wikidata":"https://www.wikidata.org/wiki/Q30232","display_name":"Agile software development","level":2,"score":0.4544999897480011},{"id":"https://openalex.org/C161840515","wikidata":"https://www.wikidata.org/wiki/Q186131","display_name":"Terrain","level":2,"score":0.4198000133037567},{"id":"https://openalex.org/C192921069","wikidata":"https://www.wikidata.org/wiki/Q550134","display_name":"Inverted pendulum","level":3,"score":0.38769999146461487},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.38119998574256897},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3779999911785126},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.3626999855041504},{"id":"https://openalex.org/C101738243","wikidata":"https://www.wikidata.org/wiki/Q786435","display_name":"Autoencoder","level":3,"score":0.31700000166893005},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.31290000677108765},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.30809998512268066},{"id":"https://openalex.org/C145565327","wikidata":"https://www.wikidata.org/wiki/Q852514","display_name":"Motion control","level":3,"score":0.3034000098705292},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.3010999858379364},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.3001999855041504},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.29499998688697815},{"id":"https://openalex.org/C46686674","wikidata":"https://www.wikidata.org/wiki/Q466303","display_name":"Boosting (machine learning)","level":2,"score":0.2912999987602234},{"id":"https://openalex.org/C89429830","wikidata":"https://www.wikidata.org/wiki/Q735710","display_name":"Scaffold","level":2,"score":0.28130000829696655},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.27900001406669617},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.2718000113964081},{"id":"https://openalex.org/C2776319952","wikidata":"https://www.wikidata.org/wiki/Q2451755","display_name":"Stair climbing","level":2,"score":0.2696000039577484},{"id":"https://openalex.org/C74222875","wikidata":"https://www.wikidata.org/wiki/Q16000312","display_name":"Robot kinematics","level":4,"score":0.267300009727478},{"id":"https://openalex.org/C2780704645","wikidata":"https://www.wikidata.org/wiki/Q9251458","display_name":"Observer (physics)","level":2,"score":0.267300009727478},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2623000144958496},{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.25279998779296875}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/lra.2026.3666686","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2026.3666686","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":22,"referenced_works":["https://openalex.org/W1970209023","https://openalex.org/W2168359464","https://openalex.org/W2963223306","https://openalex.org/W3093922502","https://openalex.org/W3121342653","https://openalex.org/W3175254947","https://openalex.org/W3176131607","https://openalex.org/W4205430897","https://openalex.org/W4207072548","https://openalex.org/W4235114045","https://openalex.org/W4250058668","https://openalex.org/W4382365373","https://openalex.org/W4383108274","https://openalex.org/W4385430644","https://openalex.org/W4385430674","https://openalex.org/W4400314673","https://openalex.org/W4401070717","https://openalex.org/W4401415792","https://openalex.org/W4402354114","https://openalex.org/W4402401628","https://openalex.org/W4405786612","https://openalex.org/W4416749645"],"related_works":[],"abstract_inverted_index":{"Legged":[0],"robots":[1],"face":[2],"significant":[3],"challenges":[4],"in":[5],"complex":[6],"terrains":[7],"due":[8],"to":[9,133],"partial":[10],"observability.":[11],"While":[12],"teacher-student":[13],"frameworks":[14],"address":[15,31],"this":[16,78],"through":[17],"imitation,":[18],"they":[19],"often":[20],"cause":[21],"representation":[22],"mismatch":[23],"and":[24,55,88,125,147,155,164],"covariate":[25],"shift,":[26],"limiting":[27],"deployment":[28,148],"robustness.":[29],"To":[30,83],"these":[32],"limitations,":[33],"we":[34],"propose":[35],"the":[36,85,112,139,150,162],"Variational":[37],"Privileged":[38],"Information":[39],"Encoder":[40],"as":[41],"Scaffold":[42],"(VPIES),":[43],"a":[44,52,56,66,94],"single-stage":[45],"reinforcement":[46],"learning":[47],"framework":[48],"that":[49,75,98],"consists":[50],"of":[51,166],"variational":[53,67],"encoder":[54,97],"dual-timescale":[57,95],"proprioceptive":[58,96],"history":[59],"encoder.":[60],"VPIES":[61,92,120,167],"encodes":[62],"privileged":[63],"states":[64],"into":[65],"latent":[68],"for":[69,80,114,168],"guided":[70],"exploration,":[71],"with":[72,103],"adaptive":[73],"KL-annealing":[74],"progressively":[76],"removes":[77],"scaffold":[79],"privilege-free":[81],"deployment.":[82],"support":[84],"resulting":[86],"handover":[87],"capture":[89],"multi-scale":[90],"dynamics,":[91],"adopts":[93],"combines":[99],"short-horizon":[100],"reactive":[101],"control":[102],"long-horizon":[104],"phase-consistent":[105],"adaptation":[106],"from":[107],"proprioception":[108],"alone,":[109],"thereby":[110],"eliminating":[111],"need":[113],"explicit":[115],"environment":[116],"identification.":[117],"In":[118],"simulation,":[119],"reduces":[121],"velocity":[122],"tracking":[123],"error":[124],"improves":[126],"out-of-distribution":[127],"robustness":[128,165],"by":[129],"approximately":[130],"20%":[131],"compared":[132],"strong":[134],"baselines.":[135],"Real-world":[136],"experiments":[137],"on":[138,149],"Unitree":[140],"Go2":[141],"achieve":[142],"higher":[143],"terrain":[144],"success":[145],"rates,":[146],"humanoid":[151],"G1":[152],"demonstrates":[153],"stable":[154],"agile":[156],"locomotion,":[157],"including":[158],"stair":[159],"climbing,":[160],"confirming":[161],"practicality":[163],"legged":[169],"systems.":[170]},"counts_by_year":[],"updated_date":"2026-03-14T06:41:57.775601","created_date":"2026-02-21T00:00:00"}
