{"id":"https://openalex.org/W7133362971","doi":"https://doi.org/10.48550/arxiv.2603.00948","title":"HierKick: Hierarchical Reinforcement Learning for Vision-Guided Soccer Robot Control","display_name":"HierKick: Hierarchical Reinforcement Learning for Vision-Guided Soccer Robot Control","publication_year":2026,"publication_date":"2026-03-01","ids":{"openalex":"https://openalex.org/W7133362971","doi":"https://doi.org/10.48550/arxiv.2603.00948"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.00948","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.00948","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.00948","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5127954160","display_name":"Yizhi Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Chen, Yizhi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128009076","display_name":"Zheng Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Zheng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022312971","display_name":"Zhanxiang Cao","orcid":"https://orcid.org/0009-0001-2961-2997"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cao, Zhanxiang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127882068","display_name":"Yihe Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Yihe","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091423247","display_name":"S. Fu","orcid":"https://orcid.org/0000-0001-8745-5291"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fu, Shengcheng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123454841","display_name":"Liyun Yan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yan, Liyun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127895506","display_name":"Yang Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Yang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082303610","display_name":"Jiali Liu","orcid":"https://orcid.org/0000-0001-5007-7813"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Jiali","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127949047","display_name":"Haoyang Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Haoyang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5128022439","display_name":"Yue Gao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gao, Yue","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":10,"corresponding_author_ids":["https://openalex.org/A5127954160"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.6546000242233276,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.6546000242233276,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.1339000016450882,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.07280000299215317,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7455000281333923},{"id":"https://openalex.org/keywords/modular-design","display_name":"Modular design","score":0.6525999903678894},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.6473000049591064},{"id":"https://openalex.org/keywords/soccer-robot","display_name":"Soccer robot","score":0.6148999929428101},{"id":"https://openalex.org/keywords/reuse","display_name":"Reuse","score":0.5054000020027161},{"id":"https://openalex.org/keywords/motion-planning","display_name":"Motion planning","score":0.5008999705314636},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.4993000030517578},{"id":"https://openalex.org/keywords/controller","display_name":"Controller (irrigation)","score":0.4812000095844269},{"id":"https://openalex.org/keywords/robot-control","display_name":"Robot control","score":0.44679999351501465}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7455000281333923},{"id":"https://openalex.org/C101468663","wikidata":"https://www.wikidata.org/wiki/Q1620158","display_name":"Modular design","level":2,"score":0.6525999903678894},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.6473000049591064},{"id":"https://openalex.org/C2781188825","wikidata":"https://www.wikidata.org/wiki/Q7550336","display_name":"Soccer robot","level":5,"score":0.6148999929428101},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5483999848365784},{"id":"https://openalex.org/C206588197","wikidata":"https://www.wikidata.org/wiki/Q846574","display_name":"Reuse","level":2,"score":0.5054000020027161},{"id":"https://openalex.org/C81074085","wikidata":"https://www.wikidata.org/wiki/Q366872","display_name":"Motion planning","level":3,"score":0.5008999705314636},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.4993000030517578},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4848000109195709},{"id":"https://openalex.org/C203479927","wikidata":"https://www.wikidata.org/wiki/Q5165939","display_name":"Controller (irrigation)","level":2,"score":0.4812000095844269},{"id":"https://openalex.org/C65401140","wikidata":"https://www.wikidata.org/wiki/Q7353385","display_name":"Robot control","level":4,"score":0.44679999351501465},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.4058000147342682},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.39959999918937683},{"id":"https://openalex.org/C188888258","wikidata":"https://www.wikidata.org/wiki/Q7353390","display_name":"Robot learning","level":4,"score":0.364300012588501},{"id":"https://openalex.org/C2777735758","wikidata":"https://www.wikidata.org/wiki/Q817765","display_name":"Path (computing)","level":2,"score":0.3594000041484833},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.353300005197525},{"id":"https://openalex.org/C124527596","wikidata":"https://www.wikidata.org/wiki/Q17029359","display_name":"Hierarchical control system","level":3,"score":0.3495999872684479},{"id":"https://openalex.org/C17500928","wikidata":"https://www.wikidata.org/wiki/Q959968","display_name":"Control system","level":2,"score":0.34630000591278076},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.33399999141693115},{"id":"https://openalex.org/C82327864","wikidata":"https://www.wikidata.org/wiki/Q835100","display_name":"Intelligent control","level":2,"score":0.3312000036239624},{"id":"https://openalex.org/C145565327","wikidata":"https://www.wikidata.org/wiki/Q852514","display_name":"Motion control","level":3,"score":0.2976999878883362},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.2973000109195709},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.27880001068115234},{"id":"https://openalex.org/C162947575","wikidata":"https://www.wikidata.org/wiki/Q2005645","display_name":"Social robot","level":5,"score":0.2745000123977661},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.26969999074935913},{"id":"https://openalex.org/C74222875","wikidata":"https://www.wikidata.org/wiki/Q16000312","display_name":"Robot kinematics","level":4,"score":0.26179999113082886},{"id":"https://openalex.org/C118974865","wikidata":"https://www.wikidata.org/wiki/Q7300773","display_name":"Real-time Control System","level":3,"score":0.25450000166893005}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.00948","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.00948","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.00948","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.00948","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.7242404222488403,"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Controlling":[0],"soccer":[1,34],"robots":[2],"involves":[3],"multi-time-scale":[4,132],"decision-making,":[5],"which":[6],"requires":[7],"balancing":[8],"long-term":[9],"tactical":[10],"planning":[11],"and":[12,62,69,93,112,138],"short-term":[13],"motion":[14],"execution.":[15],"Traditional":[16],"end-to-end":[17],"reinforcement":[18],"learning":[19],"(RL)":[20],"methods":[21],"face":[22],"challenges":[23],"in":[24,107,110,114,127],"complex":[25,128],"dynamic":[26],"environments.":[27],"This":[28],"paper":[29],"proposes":[30],"HierKick,":[31],"a":[32,46,51,66,70,142],"vision-guided":[33],"robot":[35,125,147],"control":[36,48,126],"framework":[37,44,84,104],"based":[38],"on":[39],"dual-frequency":[40],"hierarchical":[41,47,122],"RL.":[42],"The":[43],"adopts":[45],"architecture":[49],"featuring":[50],"5":[52],"Hz":[53,73],"high-level":[54],"policy":[55],"that":[56,98],"integrates":[57],"YOLOv8":[58],"for":[59,76,124,145],"real-time":[60],"detection":[61],"selects":[63],"tasks":[64],"via":[65],"coach":[67],"model,":[68],"pre-trained":[71],"50":[72],"low-level":[74],"controller":[75],"precise":[77],"joint":[78],"control.":[79,148],"Through":[80],"this":[81,103],"architecture,":[82],"the":[83,86,99,115],"achieves":[85],"four":[87],"steps":[88],"of":[89,102],"approaching,":[90],"aligning,":[91],"dribbling,":[92],"kicking.":[94],"Experimental":[95],"results":[96],"show":[97],"success":[100],"rates":[101],"are":[105],"95.2\\%":[106],"IsaacGym,":[108],"89.8\\%":[109],"Mujoco,":[111],"80\\%":[113],"real":[116],"world.":[117],"HierKick":[118],"provides":[119],"an":[120],"effective":[121],"paradigm":[123],"environments,":[129],"extendable":[130],"to":[131],"tasks,":[133],"with":[134],"its":[135],"modular":[136],"design":[137],"skill":[139],"reuse":[140],"offering":[141],"new":[143],"path":[144],"intelligent":[146]},"counts_by_year":[],"updated_date":"2026-03-04T07:09:34.246503","created_date":"2026-03-04T00:00:00"}
