{"id":"https://openalex.org/W2791359174","doi":"https://doi.org/10.1109/robio.2017.8324507","title":"Hierarchical robot learning for physical collaboration between humans and robots","display_name":"Hierarchical robot learning for physical collaboration between humans and robots","publication_year":2017,"publication_date":"2017-12-01","ids":{"openalex":"https://openalex.org/W2791359174","doi":"https://doi.org/10.1109/robio.2017.8324507","mag":"2791359174"},"language":"en","primary_location":{"id":"doi:10.1109/robio.2017.8324507","is_oa":false,"landing_page_url":"https://doi.org/10.1109/robio.2017.8324507","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE International Conference on Robotics and Biomimetics (ROBIO)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5005971230","display_name":"Zhen Deng","orcid":"https://orcid.org/0000-0002-0240-0919"},"institutions":[{"id":"https://openalex.org/I159176309","display_name":"Universit\u00e4t Hamburg","ror":"https://ror.org/00g30e956","country_code":"DE","type":"education","lineage":["https://openalex.org/I159176309"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Zhen Deng","raw_affiliation_strings":["TAMS group, informatics, University of Hamburg, Hamburg"],"affiliations":[{"raw_affiliation_string":"TAMS group, informatics, University of Hamburg, Hamburg","institution_ids":["https://openalex.org/I159176309"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030282812","display_name":"Jinpeng Mi","orcid":"https://orcid.org/0000-0002-0506-9707"},"institutions":[{"id":"https://openalex.org/I159176309","display_name":"Universit\u00e4t Hamburg","ror":"https://ror.org/00g30e956","country_code":"DE","type":"education","lineage":["https://openalex.org/I159176309"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Jinpeng Mi","raw_affiliation_strings":["TAMS group, informatics, University of Hamburg, Hamburg"],"affiliations":[{"raw_affiliation_string":"TAMS group, informatics, University of Hamburg, Hamburg","institution_ids":["https://openalex.org/I159176309"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064621294","display_name":"Dong Han","orcid":"https://orcid.org/0000-0002-5167-9143"},"institutions":[{"id":"https://openalex.org/I9842412","display_name":"Nanjing University of Aeronautics and Astronautics","ror":"https://ror.org/01scyh794","country_code":"CN","type":"education","lineage":["https://openalex.org/I9842412"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dong Han","raw_affiliation_strings":["State Key Laboratory of Mechanics and Control of Mechanical Structures, Nanjing University of Aeronautics and Astronautics, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Mechanics and Control of Mechanical Structures, Nanjing University of Aeronautics and Astronautics, Nanjing, China","institution_ids":["https://openalex.org/I9842412"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007231606","display_name":"Rui Huang","orcid":"https://orcid.org/0000-0001-7231-5042"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Rui Huang","raw_affiliation_strings":["Center for Robotics, University of Electronic Science and Technology of China, Chengdu, China"],"affiliations":[{"raw_affiliation_string":"Center for Robotics, University of Electronic Science and Technology of China, Chengdu, China","institution_ids":["https://openalex.org/I150229711"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072412582","display_name":"Xiaofeng Xiong","orcid":"https://orcid.org/0000-0001-5358-3498"},"institutions":[{"id":"https://openalex.org/I159176309","display_name":"Universit\u00e4t Hamburg","ror":"https://ror.org/00g30e956","country_code":"DE","type":"education","lineage":["https://openalex.org/I159176309"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Xiaofeng Xiong","raw_affiliation_strings":["TAMS group, informatics, University of Hamburg, Hamburg"],"affiliations":[{"raw_affiliation_string":"TAMS group, informatics, University of Hamburg, Hamburg","institution_ids":["https://openalex.org/I159176309"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100326970","display_name":"Jianwei Zhang","orcid":"https://orcid.org/0000-0002-7856-5760"},"institutions":[{"id":"https://openalex.org/I159176309","display_name":"Universit\u00e4t Hamburg","ror":"https://ror.org/00g30e956","country_code":"DE","type":"education","lineage":["https://openalex.org/I159176309"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Jianwei Zhang","raw_affiliation_strings":["TAMS group, informatics, University of Hamburg, Hamburg"],"affiliations":[{"raw_affiliation_string":"TAMS group, informatics, University of Hamburg, Hamburg","institution_ids":["https://openalex.org/I159176309"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5005971230"],"corresponding_institution_ids":["https://openalex.org/I159176309"],"apc_list":null,"apc_paid":null,"fwci":0.2012,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.57313042,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"750","last_page":"755"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9962000250816345,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.9703999757766724,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/robot-learning","display_name":"Robot learning","score":0.8372199535369873},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.7042104005813599},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6774189472198486},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6353722214698792},{"id":"https://openalex.org/keywords/human\u2013robot-interaction","display_name":"Human\u2013robot interaction","score":0.5844319462776184},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.4622172713279724},{"id":"https://openalex.org/keywords/active-learning","display_name":"Active learning (machine learning)","score":0.44968196749687195},{"id":"https://openalex.org/keywords/robot-control","display_name":"Robot control","score":0.4480220079421997},{"id":"https://openalex.org/keywords/robotics","display_name":"Robotics","score":0.44025421142578125},{"id":"https://openalex.org/keywords/cognitive-robotics","display_name":"Cognitive robotics","score":0.41153275966644287},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.38445931673049927},{"id":"https://openalex.org/keywords/mobile-robot","display_name":"Mobile robot","score":0.351546049118042}],"concepts":[{"id":"https://openalex.org/C188888258","wikidata":"https://www.wikidata.org/wiki/Q7353390","display_name":"Robot learning","level":4,"score":0.8372199535369873},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.7042104005813599},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6774189472198486},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6353722214698792},{"id":"https://openalex.org/C145460709","wikidata":"https://www.wikidata.org/wiki/Q859951","display_name":"Human\u2013robot interaction","level":3,"score":0.5844319462776184},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.4622172713279724},{"id":"https://openalex.org/C77967617","wikidata":"https://www.wikidata.org/wiki/Q4677561","display_name":"Active learning (machine learning)","level":2,"score":0.44968196749687195},{"id":"https://openalex.org/C65401140","wikidata":"https://www.wikidata.org/wiki/Q7353385","display_name":"Robot control","level":4,"score":0.4480220079421997},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.44025421142578125},{"id":"https://openalex.org/C192327766","wikidata":"https://www.wikidata.org/wiki/Q1038799","display_name":"Cognitive robotics","level":3,"score":0.41153275966644287},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.38445931673049927},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.351546049118042},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/robio.2017.8324507","is_oa":false,"landing_page_url":"https://doi.org/10.1109/robio.2017.8324507","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE International Conference on Robotics and Biomimetics (ROBIO)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W121023703","https://openalex.org/W1516801383","https://openalex.org/W2012392077","https://openalex.org/W2098441518","https://openalex.org/W2105925198","https://openalex.org/W2111967991","https://openalex.org/W2143496582","https://openalex.org/W2151074445","https://openalex.org/W2167117957","https://openalex.org/W2169033759","https://openalex.org/W2169513627","https://openalex.org/W2170043047","https://openalex.org/W2295029210","https://openalex.org/W2333632897","https://openalex.org/W2414517470","https://openalex.org/W2415177987","https://openalex.org/W2559960928","https://openalex.org/W2563088602","https://openalex.org/W2964068416","https://openalex.org/W3139474403","https://openalex.org/W4255876299","https://openalex.org/W6604963999","https://openalex.org/W6653435097","https://openalex.org/W6674812091","https://openalex.org/W6676560026","https://openalex.org/W6681398095"],"related_works":["https://openalex.org/W2626077511","https://openalex.org/W3133699834","https://openalex.org/W1989753795","https://openalex.org/W2122546011","https://openalex.org/W2094878326","https://openalex.org/W92815668","https://openalex.org/W196519796","https://openalex.org/W2809775952","https://openalex.org/W2542622692","https://openalex.org/W2134294860"],"abstract_inverted_index":{"Human-in-the-loop":[0],"robot":[1,22,29,53,82,111,144],"learning":[2,18,23,30,54,59,66,124,140],"is":[3,67,91,105,126],"an":[4,95,153],"important":[5],"ability":[6],"for":[7,61,73],"robotics":[8],"in":[9],"human-robot":[10],"collaborative":[11],"(HRC)":[12],"tasks.":[13,63,159],"The":[14,132],"research":[15],"of":[16,43,81,116,134],"interactive":[17,87],"mainly":[19],"focuses":[20],"on":[21,128],"with":[24,31,102,113,148],"human":[25,32,44,89,119,150],"cognitive":[26],"interaction.":[27],"However,":[28],"physical":[33],"interaction":[34],"remains":[35],"a":[36,51,129,149],"challenging":[37],"problem,":[38],"due":[39],"to":[40,68,107,145,156],"the":[41,70,78,109,114,117,122,138,143,157],"stochastic":[42],"control.":[45],"In":[46,85],"this":[47],"paper,":[48],"we":[49],"present":[50],"hierarchical":[52],"approach":[55,125,141],"that":[56],"includes":[57],"two":[58],"hierarchies":[60],"HRC":[62,158],"High-level":[64],"motion":[65,71],"learn":[69],"policy":[72],"objects":[74],"which":[75],"used":[76],"as":[77],"shared":[79],"plan":[80],"and":[83,151],"human.":[84],"low-level":[86],"learning,":[88],"action":[90,112],"first":[92],"predicted":[93,118],"by":[94],"Extend":[96],"Kalman":[97],"Filter":[98],"(EKF)":[99],"algorithm.":[100],"Q-learning":[101],"function":[103],"approximation":[104],"applied":[106],"select":[108],"optimal":[110],"guidance":[115],"action.":[120],"Finally,":[121],"proposed":[123],"validated":[127],"UR5":[130],"robot.":[131],"results":[133],"our":[135],"experiments":[136],"show":[137],"presented":[139],"enables":[142],"adaptively":[146],"coordinate":[147],"produce":[152],"active":[154],"contribution":[155]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":2},{"year":2020,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
