{"id":"https://openalex.org/W7134247770","doi":"https://doi.org/10.48550/arxiv.2603.05783","title":"Task-Level Decisions to Gait Level Control: A Hierarchical Policy Approach for Quadruped Navigation","display_name":"Task-Level Decisions to Gait Level Control: A Hierarchical Policy Approach for Quadruped Navigation","publication_year":2026,"publication_date":"2026-03-06","ids":{"openalex":"https://openalex.org/W7134247770","doi":"https://doi.org/10.48550/arxiv.2603.05783"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2603.05783","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5128626702","display_name":"Sijia Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Li, Sijia","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128455244","display_name":"Haoyu Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Haoyu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128455164","display_name":"Shenghai Yuan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yuan, Shenghai","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113700322","display_name":"Yizhuo Yang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Yizhuo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5084760653","display_name":"Thien\u2010Minh Nguyen","orcid":"https://orcid.org/0000-0003-1315-0967"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nguyen, Thien-Minh","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5128626702"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.4530999958515167,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.4530999958515167,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.06909999996423721,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.05730000138282776,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/terrain","display_name":"Terrain","score":0.6970000267028809},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6425999999046326},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.5460000038146973},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5396999716758728},{"id":"https://openalex.org/keywords/gait","display_name":"Gait","score":0.5307999849319458},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.45899999141693115},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.4377000033855438},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.42340001463890076}],"concepts":[{"id":"https://openalex.org/C161840515","wikidata":"https://www.wikidata.org/wiki/Q186131","display_name":"Terrain","level":2,"score":0.6970000267028809},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6425999999046326},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6129000186920166},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.5460000038146973},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5396999716758728},{"id":"https://openalex.org/C151800584","wikidata":"https://www.wikidata.org/wiki/Q2370000","display_name":"Gait","level":2,"score":0.5307999849319458},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.45899999141693115},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4433000087738037},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.4377000033855438},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.42340001463890076},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.4077000021934509},{"id":"https://openalex.org/C81074085","wikidata":"https://www.wikidata.org/wiki/Q366872","display_name":"Motion planning","level":3,"score":0.39890000224113464},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.38679999113082886},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.36250001192092896},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.3564999997615814},{"id":"https://openalex.org/C48677424","wikidata":"https://www.wikidata.org/wiki/Q6888088","display_name":"Mode (computer interface)","level":2,"score":0.34450000524520874},{"id":"https://openalex.org/C134181672","wikidata":"https://www.wikidata.org/wiki/Q21907045","display_name":"Quadrupedalism","level":2,"score":0.2946999967098236},{"id":"https://openalex.org/C203479927","wikidata":"https://www.wikidata.org/wiki/Q5165939","display_name":"Controller (irrigation)","level":2,"score":0.29179999232292175},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.28850001096725464},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.28839999437332153},{"id":"https://openalex.org/C2780297707","wikidata":"https://www.wikidata.org/wiki/Q4895393","display_name":"Landmark","level":2,"score":0.28060001134872437},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.2718999981880188},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.26669999957084656},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.2587999999523163}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2603.05783","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2603.05783","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.05783","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2603.05783","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Real-world":[0],"quadruped":[1],"navigation":[2,11],"is":[3],"constrained":[4],"by":[5,20],"a":[6,47,78,112,142],"scale":[7],"mismatch":[8],"between":[9],"high-level":[10,93],"decisions":[12,97],"and":[13,31,73,89,105,137,152,164],"low-level":[14,62,109],"gait":[15],"execution,":[16],"as":[17,19],"well":[18],"instabilities":[21],"under":[22],"out-of-distribution":[23,165],"environmental":[24,150],"changes.":[25],"Such":[26],"variations":[27],"challenge":[28],"sim-to-real":[29],"transfer":[30],"can":[32],"trigger":[33],"falls":[34],"when":[35],"policies":[36],"lack":[37],"explicit":[38,130],"interfaces":[39,131],"for":[40,51,132],"adaptation.":[41],"In":[42],"this":[43],"paper,":[44],"we":[45],"present":[46],"hierarchical":[48],"policy":[49,94,138],"architecture":[50,128],"quadrupedal":[52],"navigation,":[53],"termed":[54],"Task-level":[55],"Decision":[56],"to":[57,77],"Gait":[58],"Control":[59],"(TDGC).":[60],"A":[61,92],"policy,":[63],"trained":[64],"with":[65,145],"reinforcement":[66],"learning":[67],"in":[68],"simulation,":[69],"delivers":[70],"gait-conditioned":[71],"locomotion":[72],"maps":[74,118],"task":[75,158],"requirements":[76],"compact":[79],"set":[80],"of":[81],"controllable":[82],"behavior":[83],"parameters,":[84],"enabling":[85],"robust":[86],"mode":[87],"generation":[88],"smooth":[90],"switching.":[91],"makes":[95],"task-centric":[96],"from":[98,124],"sparse":[99],"semantic":[100],"or":[101,119],"geometric":[102],"terrain":[103,121],"cues":[104],"translates":[106],"them":[107],"into":[108],"targets,":[110],"forming":[111],"traceable":[113],"decision":[114],"pipeline":[115],"without":[116],"dense":[117],"high-resolution":[120],"reconstruction.":[122],"Different":[123],"end-to-end":[125],"approaches,":[126],"our":[127],"provides":[129],"deployment-time":[133],"tuning,":[134],"fault":[135],"diagnosis,":[136],"refinement.":[139],"We":[140],"introduce":[141],"structured":[143],"curriculum":[144],"performance-driven":[146],"progression":[147],"that":[148],"expands":[149],"difficulty":[151],"disturbance":[153],"ranges.":[154],"Experiments":[155],"show":[156],"higher":[157],"success":[159],"rates":[160],"on":[161],"mixed":[162],"terrains":[163],"tests.":[166]},"counts_by_year":[],"updated_date":"2026-05-05T08:41:31.759640","created_date":"2026-03-10T00:00:00"}
