{"id":"https://openalex.org/W4414110571","doi":"https://doi.org/10.1109/lra.2025.3608637","title":"PPF: Pre-Training and Preservative Fine-Tuning of Humanoid Locomotion via Model-Assumption-Based Regularization","display_name":"PPF: Pre-Training and Preservative Fine-Tuning of Humanoid Locomotion via Model-Assumption-Based Regularization","publication_year":2025,"publication_date":"2025-09-10","ids":{"openalex":"https://openalex.org/W4414110571","doi":"https://doi.org/10.1109/lra.2025.3608637"},"language":"en","primary_location":{"id":"doi:10.1109/lra.2025.3608637","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2025.3608637","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2504.09833","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5086312555","display_name":"Hyunyoung Jung","orcid":"https://orcid.org/0009-0001-7382-9608"},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Hyunyoung Jung","raw_affiliation_strings":["Georgia Institute of Technology, Atlanta, GA, USA"],"raw_orcid":"https://orcid.org/0009-0001-7382-9608","affiliations":[{"raw_affiliation_string":"Georgia Institute of Technology, Atlanta, GA, USA","institution_ids":["https://openalex.org/I130701444"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022169367","display_name":"Zhaoyuan Gu","orcid":"https://orcid.org/0000-0003-0371-9005"},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zhaoyuan Gu","raw_affiliation_strings":["Georgia Institute of Technology, Atlanta, GA, USA"],"raw_orcid":"https://orcid.org/0000-0003-0371-9005","affiliations":[{"raw_affiliation_string":"Georgia Institute of Technology, Atlanta, GA, USA","institution_ids":["https://openalex.org/I130701444"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113946098","display_name":"Ye Zhao","orcid":"https://orcid.org/0000-0001-6402-5416"},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ye Zhao","raw_affiliation_strings":["Georgia Institute of Technology, Atlanta, GA, USA"],"raw_orcid":"https://orcid.org/0000-0001-6402-5416","affiliations":[{"raw_affiliation_string":"Georgia Institute of Technology, Atlanta, GA, USA","institution_ids":["https://openalex.org/I130701444"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090151532","display_name":"Hae-Won Park","orcid":"https://orcid.org/0000-0001-6130-6589"},"institutions":[{"id":"https://openalex.org/I157485424","display_name":"Korea Advanced Institute of Science and Technology","ror":"https://ror.org/05apxxy63","country_code":"KR","type":"education","lineage":["https://openalex.org/I157485424"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Hae-Won Park","raw_affiliation_strings":["Mechanical Engineering, Korea Advanced Institute of Science and Technology, Daejeon, South Korea","Mechanical Engineering, Korea Advanced Institute of Science and Technology, Yuseong-gu, Daejeon, Republic of Korea"],"raw_orcid":"https://orcid.org/0000-0001-6130-6589","affiliations":[{"raw_affiliation_string":"Mechanical Engineering, Korea Advanced Institute of Science and Technology, Daejeon, South Korea","institution_ids":["https://openalex.org/I157485424"]},{"raw_affiliation_string":"Mechanical Engineering, Korea Advanced Institute of Science and Technology, Yuseong-gu, Daejeon, Republic of Korea","institution_ids":["https://openalex.org/I157485424"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5064581452","display_name":"Sehoon Ha","orcid":"https://orcid.org/0000-0002-1972-328X"},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sehoon Ha","raw_affiliation_strings":["Georgia Institute of Technology, Atlanta, GA, USA"],"raw_orcid":"https://orcid.org/0000-0002-1972-328X","affiliations":[{"raw_affiliation_string":"Georgia Institute of Technology, Atlanta, GA, USA","institution_ids":["https://openalex.org/I130701444"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.19523278,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"10","issue":"11","first_page":"11466","last_page":"11473"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9965000152587891,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9902999997138977,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/humanoid-robot","display_name":"Humanoid robot","score":0.6628000140190125},{"id":"https://openalex.org/keywords/terrain","display_name":"Terrain","score":0.569599986076355},{"id":"https://openalex.org/keywords/regularization","display_name":"Regularization (linguistics)","score":0.5221999883651733},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.44909998774528503},{"id":"https://openalex.org/keywords/controller","display_name":"Controller (irrigation)","score":0.44290000200271606},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.41100001335144043},{"id":"https://openalex.org/keywords/imitation","display_name":"Imitation","score":0.3749000132083893}],"concepts":[{"id":"https://openalex.org/C60692881","wikidata":"https://www.wikidata.org/wiki/Q584529","display_name":"Humanoid robot","level":3,"score":0.6628000140190125},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5896999835968018},{"id":"https://openalex.org/C161840515","wikidata":"https://www.wikidata.org/wiki/Q186131","display_name":"Terrain","level":2,"score":0.569599986076355},{"id":"https://openalex.org/C2776135515","wikidata":"https://www.wikidata.org/wiki/Q17143721","display_name":"Regularization (linguistics)","level":2,"score":0.5221999883651733},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5194000005722046},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.44909998774528503},{"id":"https://openalex.org/C203479927","wikidata":"https://www.wikidata.org/wiki/Q5165939","display_name":"Controller (irrigation)","level":2,"score":0.44290000200271606},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.41100001335144043},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.4050999879837036},{"id":"https://openalex.org/C126388530","wikidata":"https://www.wikidata.org/wiki/Q1131737","display_name":"Imitation","level":2,"score":0.3749000132083893},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.3743000030517578},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.36570000648498535},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.3564000129699707},{"id":"https://openalex.org/C147764199","wikidata":"https://www.wikidata.org/wiki/Q6865248","display_name":"Minification","level":2,"score":0.3208000063896179},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.3028999865055084},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.2903999984264374},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.28929999470710754},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.28619998693466187},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.26019999384880066},{"id":"https://openalex.org/C31531917","wikidata":"https://www.wikidata.org/wiki/Q915157","display_name":"Robust control","level":3,"score":0.25699999928474426}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/lra.2025.3608637","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2025.3608637","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:2504.09833","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2504.09833","pdf_url":"https://arxiv.org/pdf/2504.09833","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2504.09833","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2504.09833","pdf_url":"https://arxiv.org/pdf/2504.09833","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3552727025","display_name":null,"funder_award_id":"2339076","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320334879","display_name":"Korea Evaluation Institute of Industrial Technology","ror":"https://ror.org/03z9cwa38"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4414110571.pdf","grobid_xml":"https://content.openalex.org/works/W4414110571.grobid-xml"},"referenced_works_count":34,"referenced_works":["https://openalex.org/W2061983716","https://openalex.org/W2138136244","https://openalex.org/W2143729862","https://openalex.org/W2158782408","https://openalex.org/W2539534359","https://openalex.org/W2738963603","https://openalex.org/W2907537824","https://openalex.org/W2911477000","https://openalex.org/W2972798201","https://openalex.org/W3039737909","https://openalex.org/W3093922502","https://openalex.org/W3175254947","https://openalex.org/W3176539729","https://openalex.org/W3206762371","https://openalex.org/W3206982864","https://openalex.org/W3207033168","https://openalex.org/W4205430897","https://openalex.org/W4283787029","https://openalex.org/W4285028015","https://openalex.org/W4286423847","https://openalex.org/W4297238282","https://openalex.org/W4311443585","https://openalex.org/W4312405101","https://openalex.org/W4385430486","https://openalex.org/W4385430644","https://openalex.org/W4385756627","https://openalex.org/W4387197141","https://openalex.org/W4392173735","https://openalex.org/W4394872716","https://openalex.org/W4401416934","https://openalex.org/W4402350775","https://openalex.org/W4404953355","https://openalex.org/W4405785534","https://openalex.org/W4405786155"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W230091440","https://openalex.org/W2390279801","https://openalex.org/W2233261550","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2810751659"],"abstract_inverted_index":{"Humanoid":[0],"locomotion":[1,40,58,144],"is":[2],"a":[3,31,38,47,130,136],"challenging":[4,63],"task":[5],"due":[6],"to":[7,19,21,54,113],"its":[8,52],"inherent":[9],"complexity":[10],"and":[11,23,65,87,126,142,152],"high-dimensional":[12],"dynamics,":[13],"as":[14,16,61],"well":[15],"the":[17,44,80,97,102,109,119],"need":[18],"adapt":[20],"diverse":[22,146],"unpredictable":[24],"environments.":[25],"In":[26,93],"this":[27],"work,":[28],"we":[29],"introduce":[30],"novel":[32],"learning":[33],"framework":[34,70,121],"for":[35],"effectively":[36],"training":[37],"humanoid":[39,132],"policy":[41,98],"that":[42],"imitates":[43],"behavior":[45],"of":[46,72,79,139],"model-based":[48,81,103],"controller":[49,104],"while":[50],"extending":[51],"capabilities":[53],"handle":[55],"more":[56,62],"complex":[57],"tasks,":[59],"such":[60],"terrain":[64],"higher":[66],"velocity":[67],"commands.":[68],"Our":[69],"consists":[71],"three":[73],"key":[74],"components:":[75],"pre-training":[76],"through":[77,122],"imitation":[78],"controller,":[82],"fine-tuning":[83],"via":[84],"reinforcement":[85],"learning,":[86],"model-assumption-based":[88],"regularization":[89],"(MAR)":[90],"during":[91],"fine-tuning.":[92],"particular,":[94],"MAR":[95],"aligns":[96],"with":[99],"actions":[100],"from":[101],"only":[105],"in":[106],"states":[107],"where":[108],"model":[110],"assumption":[111],"holds":[112],"prevent":[114],"catastrophic":[115],"forgetting.":[116],"We":[117],"evaluate":[118],"proposed":[120],"comprehensive":[123],"simulation":[124],"tests":[125],"hardware":[127],"experiments":[128],"on":[129],"full-size":[131],"robot,":[133],"Digit,":[134],"demonstrating":[135],"forward":[137],"speed":[138],"1.5":[140],"m/s":[141],"robust":[143],"across":[145],"terrains,":[147],"including":[148],"slippery,":[149],"sloped,":[150],"uneven,":[151],"sandy":[153],"terrains.":[154]},"counts_by_year":[],"updated_date":"2026-06-17T08:01:34.144755","created_date":"2025-10-10T00:00:00"}
