{"id":"https://openalex.org/W7160441849","doi":"https://doi.org/10.48550/arxiv.2605.03363","title":"Learning Reactive Dexterous Grasping via Hierarchical Task-Space RL Planning and Joint-Space QP Control","display_name":"Learning Reactive Dexterous Grasping via Hierarchical Task-Space RL Planning and Joint-Space QP Control","publication_year":2026,"publication_date":"2026-05-05","ids":{"openalex":"https://openalex.org/W7160441849","doi":"https://doi.org/10.48550/arxiv.2605.03363"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.03363","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.03363","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.03363","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101809126","display_name":"Ho Jae Lee","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lee, Ho Jae","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135511170","display_name":"Yonghyeon Lee","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lee, Yonghyeon","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5120651328","display_name":"Alexander Alexiev","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Alexiev, Alexander","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101958946","display_name":"Tzu-Yuan Lin","orcid":"https://orcid.org/0000-0002-3442-8801"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lin, Tzu-Yuan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033224913","display_name":"Se Hwan Jeon","orcid":"https://orcid.org/0000-0002-2791-7850"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jeon, Se Hwan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5135452893","display_name":"Sangbae Kim","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kim, Sangbae","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9244999885559082,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9244999885559082,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10982","display_name":"Motor Control and Adaptation","score":0.029600000008940697,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.022600000724196434,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/kinematics","display_name":"Kinematics","score":0.6306999921798706},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5774000287055969},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.5465999841690063},{"id":"https://openalex.org/keywords/quadratic-programming","display_name":"Quadratic programming","score":0.4984999895095825},{"id":"https://openalex.org/keywords/trajectory","display_name":"Trajectory","score":0.4945000112056732},{"id":"https://openalex.org/keywords/convergence","display_name":"Convergence (economics)","score":0.49410000443458557},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.429500013589859},{"id":"https://openalex.org/keywords/robotic-arm","display_name":"Robotic arm","score":0.36899998784065247},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.36579999327659607},{"id":"https://openalex.org/keywords/planner","display_name":"Planner","score":0.3653999865055084}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6565999984741211},{"id":"https://openalex.org/C39920418","wikidata":"https://www.wikidata.org/wiki/Q11476","display_name":"Kinematics","level":2,"score":0.6306999921798706},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5774000287055969},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.5465999841690063},{"id":"https://openalex.org/C81845259","wikidata":"https://www.wikidata.org/wiki/Q290117","display_name":"Quadratic programming","level":2,"score":0.4984999895095825},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.4945000112056732},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.49410000443458557},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.44749999046325684},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.429500013589859},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.41940000653266907},{"id":"https://openalex.org/C150415221","wikidata":"https://www.wikidata.org/wiki/Q40687","display_name":"Robotic arm","level":2,"score":0.36899998784065247},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.36579999327659607},{"id":"https://openalex.org/C2776999362","wikidata":"https://www.wikidata.org/wiki/Q2349274","display_name":"Planner","level":2,"score":0.3653999865055084},{"id":"https://openalex.org/C2775960376","wikidata":"https://www.wikidata.org/wiki/Q1435859","display_name":"Grippers","level":2,"score":0.36390000581741333},{"id":"https://openalex.org/C18555067","wikidata":"https://www.wikidata.org/wiki/Q8375051","display_name":"Joint (building)","level":2,"score":0.3517000079154968},{"id":"https://openalex.org/C2775941552","wikidata":"https://www.wikidata.org/wiki/Q25212305","display_name":"Isolation (microbiology)","level":2,"score":0.34369999170303345},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.3400999903678894},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.32510000467300415},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.3163999915122986},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.3163999915122986},{"id":"https://openalex.org/C17500928","wikidata":"https://www.wikidata.org/wiki/Q959968","display_name":"Control system","level":2,"score":0.314300000667572},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.31220000982284546},{"id":"https://openalex.org/C2776650193","wikidata":"https://www.wikidata.org/wiki/Q264661","display_name":"Obstacle","level":2,"score":0.3091999888420105},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.2888000011444092},{"id":"https://openalex.org/C31531917","wikidata":"https://www.wikidata.org/wiki/Q915157","display_name":"Robust control","level":3,"score":0.2856000065803528},{"id":"https://openalex.org/C2778712577","wikidata":"https://www.wikidata.org/wiki/Q3505966","display_name":"Retraining","level":2,"score":0.28519999980926514},{"id":"https://openalex.org/C91575142","wikidata":"https://www.wikidata.org/wiki/Q1971426","display_name":"Optimal control","level":2,"score":0.28200000524520874},{"id":"https://openalex.org/C2780864053","wikidata":"https://www.wikidata.org/wiki/Q5147495","display_name":"Collision avoidance","level":3,"score":0.28130000829696655},{"id":"https://openalex.org/C2779038628","wikidata":"https://www.wikidata.org/wiki/Q7248497","display_name":"Programming by demonstration","level":3,"score":0.27630001306533813},{"id":"https://openalex.org/C81074085","wikidata":"https://www.wikidata.org/wiki/Q366872","display_name":"Motion planning","level":3,"score":0.2711000144481659},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.26910001039505005},{"id":"https://openalex.org/C112972136","wikidata":"https://www.wikidata.org/wiki/Q7595718","display_name":"Stability (learning theory)","level":2,"score":0.26350000500679016},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.25850000977516174},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.25440001487731934}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.03363","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.03363","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.03363","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.03363","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.6476701498031616,"id":"https://metadata.un.org/sdg/11","display_name":"Sustainable cities and communities"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"In":[0],"this":[1],"work,":[2],"we":[3],"propose":[4],"a":[5,26,41,56,119,127,132,145],"hybrid":[6],"hierarchical":[7],"control":[8],"framework":[9,117],"for":[10,141],"reactive":[11],"dexterous":[12,142],"grasping":[13,143],"that":[14,38],"explicitly":[15],"decouples":[16],"high-level":[17,42],"spatial":[18],"intent":[19],"from":[20,158],"low-level":[21],"joint":[22,66],"execution.":[23],"We":[24,112],"introduce":[25],"multi-agent":[27],"reinforcement":[28],"learning":[29],"architecture,":[30],"specialized":[31],"into":[32,64],"distinct":[33],"arm":[34,129],"and":[35,73,104],"hand":[36,135],"agents,":[37],"acts":[39],"as":[40],"planner":[43],"by":[44,55],"generating":[45],"desired":[46],"task-space":[47],"velocity":[48],"commands.":[49],"These":[50],"commands":[51],"are":[52],"then":[53],"processed":[54],"GPU-parallelized":[57],"quadratic":[58],"programming":[59],"controller,":[60],"which":[61],"translates":[62],"them":[63],"feasible":[65],"velocities":[67],"while":[68],"strictly":[69,86],"enforcing":[70],"kinematic":[71],"limits":[72],"collision":[74],"avoidance.":[75],"This":[76],"structural":[77],"isolation":[78],"not":[79],"only":[80],"accelerates":[81],"training":[82],"convergence":[83],"but":[84],"also":[85],"enforces":[87],"hardware":[88,124],"safety.":[89],"Furthermore,":[90],"the":[91,110,115,152],"architecture":[92],"unlocks":[93],"zero-shot":[94,139],"steerability,":[95],"allowing":[96],"system":[97],"operators":[98],"to":[99,144,155],"dynamically":[100],"adjust":[101],"safety":[102],"margins":[103],"avoid":[105],"dynamic":[106],"obstacles":[107],"without":[108],"retraining":[109],"policy.":[111],"extensively":[113],"validate":[114],"proposed":[116],"through":[118],"rigorous":[120],"simulation-to-reality":[121],"pipeline.":[122],"Real-world":[123],"experiments":[125],"on":[126],"7-DoF":[128],"equipped":[130],"with":[131],"20-DoF":[133],"anthropomorphic":[134],"demonstrate":[136],"highly":[137],"robust":[138],"transferability":[140],"diverse":[146],"set":[147],"of":[148],"unseen":[149],"objects,":[150],"highlighting":[151],"system's":[153],"ability":[154],"reactively":[156],"recover":[157],"unexpected":[159],"physical":[160],"disturbances":[161],"in":[162],"unstructured":[163],"environments.":[164]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-07T00:00:00"}
