{"id":"https://openalex.org/W3090211586","doi":"https://doi.org/10.1109/icra40945.2020.9196924","title":"Towards Safe Human-Robot Collaboration Using Deep Reinforcement Learning","display_name":"Towards Safe Human-Robot Collaboration Using Deep Reinforcement Learning","publication_year":2020,"publication_date":"2020-05-01","ids":{"openalex":"https://openalex.org/W3090211586","doi":"https://doi.org/10.1109/icra40945.2020.9196924","mag":"3090211586"},"language":"en","primary_location":{"id":"doi:10.1109/icra40945.2020.9196924","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra40945.2020.9196924","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 IEEE International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5031175358","display_name":"Mohamed El-Shamouty","orcid":null},"institutions":[{"id":"https://openalex.org/I3018473509","display_name":"Fraunhofer Institute for Manufacturing Engineering and Automation","ror":"https://ror.org/01rvqha10","country_code":"DE","type":"facility","lineage":["https://openalex.org/I3018473509","https://openalex.org/I4923324"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Mohamed El-Shamouty","raw_affiliation_strings":["Fraunhofer IPA,Department of Robot and Assistive Systems","Department of Robot and Assistive Systems, Fraunhofer IPA"],"affiliations":[{"raw_affiliation_string":"Fraunhofer IPA,Department of Robot and Assistive Systems","institution_ids":["https://openalex.org/I3018473509"]},{"raw_affiliation_string":"Department of Robot and Assistive Systems, Fraunhofer IPA","institution_ids":["https://openalex.org/I3018473509"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023442148","display_name":"Xinyang Wu","orcid":"https://orcid.org/0000-0002-8912-2041"},"institutions":[{"id":"https://openalex.org/I3018473509","display_name":"Fraunhofer Institute for Manufacturing Engineering and Automation","ror":"https://ror.org/01rvqha10","country_code":"DE","type":"facility","lineage":["https://openalex.org/I3018473509","https://openalex.org/I4923324"]},{"id":"https://openalex.org/I4210127444","display_name":"Fraunhofer Institute for Cognitive Systems","ror":"https://ror.org/02fez3815","country_code":"DE","type":"facility","lineage":["https://openalex.org/I4210127444","https://openalex.org/I4923324"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Xinyang Wu","raw_affiliation_strings":["Fraunhofer IPA,Center for Cyber Cognitive Intelligence","Center for Cyber Cognitive Intelligence, Fraunhofer IPA"],"affiliations":[{"raw_affiliation_string":"Fraunhofer IPA,Center for Cyber Cognitive Intelligence","institution_ids":["https://openalex.org/I4210127444"]},{"raw_affiliation_string":"Center for Cyber Cognitive Intelligence, Fraunhofer IPA","institution_ids":["https://openalex.org/I3018473509"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049948049","display_name":"Shanqi Yang","orcid":null},"institutions":[{"id":"https://openalex.org/I3018473509","display_name":"Fraunhofer Institute for Manufacturing Engineering and Automation","ror":"https://ror.org/01rvqha10","country_code":"DE","type":"facility","lineage":["https://openalex.org/I3018473509","https://openalex.org/I4923324"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Shanqi Yang","raw_affiliation_strings":["Fraunhofer IPA,Department of Robot and Assistive Systems","Department of Robot and Assistive Systems, Fraunhofer IPA"],"affiliations":[{"raw_affiliation_string":"Fraunhofer IPA,Department of Robot and Assistive Systems","institution_ids":["https://openalex.org/I3018473509"]},{"raw_affiliation_string":"Department of Robot and Assistive Systems, Fraunhofer IPA","institution_ids":["https://openalex.org/I3018473509"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000203676","display_name":"Marcel Albus","orcid":"https://orcid.org/0000-0002-7390-4081"},"institutions":[{"id":"https://openalex.org/I3018473509","display_name":"Fraunhofer Institute for Manufacturing Engineering and Automation","ror":"https://ror.org/01rvqha10","country_code":"DE","type":"facility","lineage":["https://openalex.org/I3018473509","https://openalex.org/I4923324"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Marcel Albus","raw_affiliation_strings":["Fraunhofer IPA,Department of Robot and Assistive Systems","Department of Robot and Assistive Systems, Fraunhofer IPA"],"affiliations":[{"raw_affiliation_string":"Fraunhofer IPA,Department of Robot and Assistive Systems","institution_ids":["https://openalex.org/I3018473509"]},{"raw_affiliation_string":"Department of Robot and Assistive Systems, Fraunhofer IPA","institution_ids":["https://openalex.org/I3018473509"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5031354877","display_name":"Marco F. Huber","orcid":"https://orcid.org/0000-0002-8250-2092"},"institutions":[{"id":"https://openalex.org/I4210127444","display_name":"Fraunhofer Institute for Cognitive Systems","ror":"https://ror.org/02fez3815","country_code":"DE","type":"facility","lineage":["https://openalex.org/I4210127444","https://openalex.org/I4923324"]},{"id":"https://openalex.org/I3018473509","display_name":"Fraunhofer Institute for Manufacturing Engineering and Automation","ror":"https://ror.org/01rvqha10","country_code":"DE","type":"facility","lineage":["https://openalex.org/I3018473509","https://openalex.org/I4923324"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Marco F. Huber","raw_affiliation_strings":["Fraunhofer IPA,Center for Cyber Cognitive Intelligence","Center for Cyber Cognitive Intelligence, Fraunhofer IPA"],"affiliations":[{"raw_affiliation_string":"Fraunhofer IPA,Center for Cyber Cognitive Intelligence","institution_ids":["https://openalex.org/I4210127444"]},{"raw_affiliation_string":"Center for Cyber Cognitive Intelligence, Fraunhofer IPA","institution_ids":["https://openalex.org/I3018473509"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5031175358"],"corresponding_institution_ids":["https://openalex.org/I3018473509"],"apc_list":null,"apc_paid":null,"fwci":4.0775,"has_fulltext":false,"cited_by_count":62,"citation_normalized_percentile":{"value":0.94984751,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"4899","last_page":"4905"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.994700014591217,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10883","display_name":"Ethics and Social Impacts of AI","score":0.9625999927520752,"subfield":{"id":"https://openalex.org/subfields/3311","display_name":"Safety Research"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8168423771858215},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.7357653379440308},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7200657725334167},{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.6543712019920349},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.6311803460121155},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5444603562355042},{"id":"https://openalex.org/keywords/control-reconfiguration","display_name":"Control reconfiguration","score":0.5006473064422607},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.48518115282058716},{"id":"https://openalex.org/keywords/collision-avoidance","display_name":"Collision avoidance","score":0.4221314489841461},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.34513890743255615},{"id":"https://openalex.org/keywords/collision","display_name":"Collision","score":0.22668448090553284},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.20425915718078613},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.19645124673843384},{"id":"https://openalex.org/keywords/systems-engineering","display_name":"Systems engineering","score":0.19420939683914185},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.11911231279373169}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8168423771858215},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.7357653379440308},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7200657725334167},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.6543712019920349},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.6311803460121155},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5444603562355042},{"id":"https://openalex.org/C119701452","wikidata":"https://www.wikidata.org/wiki/Q5165881","display_name":"Control reconfiguration","level":2,"score":0.5006473064422607},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.48518115282058716},{"id":"https://openalex.org/C2780864053","wikidata":"https://www.wikidata.org/wiki/Q5147495","display_name":"Collision avoidance","level":3,"score":0.4221314489841461},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.34513890743255615},{"id":"https://openalex.org/C121704057","wikidata":"https://www.wikidata.org/wiki/Q352070","display_name":"Collision","level":2,"score":0.22668448090553284},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.20425915718078613},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.19645124673843384},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.19420939683914185},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.11911231279373169},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/icra40945.2020.9196924","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra40945.2020.9196924","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 IEEE International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"},{"id":"pmh:oai:fraunhofer.de:N-608506","is_oa":false,"landing_page_url":"http://publica.fraunhofer.de/documents/N-608506.html","pdf_url":null,"source":{"id":"https://openalex.org/S4306400801","display_name":"Publikationsdatenbank der Fraunhofer-Gesellschaft (Fraunhofer-Gesellschaft)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4923324","host_organization_name":"Fraunhofer-Gesellschaft","host_organization_lineage":["https://openalex.org/I4923324"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Fraunhofer IPA","raw_type":"Conference Paper"},{"id":"pmh:oai:publica.fraunhofer.de:publica/409142","is_oa":false,"landing_page_url":"https://publica.fraunhofer.de/handle/publica/409142","pdf_url":null,"source":{"id":"https://openalex.org/S4306400318","display_name":"Fraunhofer-Publica (Fraunhofer-Gesellschaft)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4923324","host_organization_name":"Fraunhofer-Gesellschaft","host_organization_lineage":["https://openalex.org/I4923324"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"conference paper"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure","score":0.6100000143051147}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":60,"referenced_works":["https://openalex.org/W749877177","https://openalex.org/W1845972764","https://openalex.org/W1944528098","https://openalex.org/W1967821692","https://openalex.org/W2055672407","https://openalex.org/W2121863487","https://openalex.org/W2122410182","https://openalex.org/W2145339207","https://openalex.org/W2155007355","https://openalex.org/W2155027007","https://openalex.org/W2158782408","https://openalex.org/W2173248099","https://openalex.org/W2284548247","https://openalex.org/W2462906003","https://openalex.org/W2575705757","https://openalex.org/W2611616978","https://openalex.org/W2618852836","https://openalex.org/W2624731731","https://openalex.org/W2736601468","https://openalex.org/W2746597156","https://openalex.org/W2753092418","https://openalex.org/W2754517384","https://openalex.org/W2783712532","https://openalex.org/W2784465508","https://openalex.org/W2796290181","https://openalex.org/W2899059606","https://openalex.org/W2915877178","https://openalex.org/W2944221325","https://openalex.org/W2950892788","https://openalex.org/W2962803570","https://openalex.org/W2962879844","https://openalex.org/W2963040191","https://openalex.org/W2963120839","https://openalex.org/W2963293747","https://openalex.org/W2963731007","https://openalex.org/W2963864421","https://openalex.org/W2964001908","https://openalex.org/W2964161785","https://openalex.org/W3008885639","https://openalex.org/W3104515094","https://openalex.org/W3107489946","https://openalex.org/W4214717370","https://openalex.org/W4229856339","https://openalex.org/W4293275986","https://openalex.org/W4293545785","https://openalex.org/W4300799055","https://openalex.org/W6682849425","https://openalex.org/W6683204974","https://openalex.org/W6684921986","https://openalex.org/W6695920968","https://openalex.org/W6718836005","https://openalex.org/W6737893269","https://openalex.org/W6740801417","https://openalex.org/W6741002519","https://openalex.org/W6744086685","https://openalex.org/W6747790125","https://openalex.org/W6755421158","https://openalex.org/W6761557609","https://openalex.org/W6762143477","https://openalex.org/W6780559895"],"related_works":["https://openalex.org/W2595172197","https://openalex.org/W1981002473","https://openalex.org/W2084856301","https://openalex.org/W2127970246","https://openalex.org/W2357657342","https://openalex.org/W2885125400","https://openalex.org/W1989889224","https://openalex.org/W4382618745","https://openalex.org/W2356280555","https://openalex.org/W2742483371"],"abstract_inverted_index":{"Safety":[0],"in":[1,10,41,81,159],"Human-Robot":[2],"Collaboration":[3],"(HRC)":[4],"is":[5],"a":[6,63,95],"bottleneck":[7],"to":[8,48,56,73,98,133],"HRC-productivity":[9],"industry.":[11,134],"With":[12],"robots":[13,80,154],"being":[14],"the":[15,54,79,90,100,136,138,142,160],"main":[16],"source":[17],"of":[18,53,78,107,144],"hazards,":[19],"safety":[20,24,77,103],"engineers":[21],"use":[22],"over-emphasized":[23],"measures,":[25],"and":[26,30,51,76,102,105,122],"carry":[27],"out":[28],"lengthy":[29],"expensive":[31],"risk":[32],"assessment":[33],"processes":[34],"on":[35,152],"each":[36],"HRC-layout":[37],"reconfiguration.":[38],"Recent":[39],"advances":[40],"deep":[42,67,145],"Reinforcement":[43],"Learning":[44],"(RL)":[45],"offer":[46],"solutions":[47],"add":[49],"intelligence":[50,75],"comprehensibility":[52],"environment":[55],"robots.":[57,91],"In":[58,135],"this":[59],"paper,":[60],"we":[61],"propose":[62],"framework":[64,93,113,140],"that":[65],"uses":[66],"RL":[68,110,146],"as":[69,119,157],"an":[70],"enabling":[71],"technology":[72],"enhance":[74],"HRC":[82],"scenarios":[83],"and,":[84],"thus,":[85],"reduce":[86],"hazards":[87],"incurred":[88],"by":[89],"The":[92,112],"offers":[94],"systematic":[96],"methodology":[97],"encode":[99],"task":[101],"requirements":[104],"context":[106],"applicability":[108],"into":[109],"settings.":[111],"also":[114],"considers":[115],"core":[116],"components,":[117],"such":[118],"behavior":[120],"explainer":[121],"verifier,":[123],"which":[124],"aim":[125],"for":[126],"transferring":[127],"learned":[128],"behaviors":[129],"from":[130],"research":[131],"labs":[132],"evaluations,":[137],"proposed":[139],"shows":[141],"capability":[143],"agents":[147],"learning":[148],"collision-free":[149],"point-to-point":[150],"motion":[151],"different":[153],"inside":[155],"simulation,":[156],"shown":[158],"supplementary":[161],"video.":[162]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":11},{"year":2024,"cited_by_count":18},{"year":2023,"cited_by_count":12},{"year":2022,"cited_by_count":12},{"year":2021,"cited_by_count":5},{"year":2020,"cited_by_count":1}],"updated_date":"2026-04-21T08:09:41.155169","created_date":"2025-10-10T00:00:00"}
