{"id":"https://openalex.org/W4294975945","doi":"https://doi.org/10.1109/mmar55195.2022.9874304","title":"Sim2Real Deep Reinforcement Learning of Compliance-based Robotic Assembly Operations","display_name":"Sim2Real Deep Reinforcement Learning of Compliance-based Robotic Assembly Operations","publication_year":2022,"publication_date":"2022-08-22","ids":{"openalex":"https://openalex.org/W4294975945","doi":"https://doi.org/10.1109/mmar55195.2022.9874304"},"language":"en","primary_location":{"id":"doi:10.1109/mmar55195.2022.9874304","is_oa":false,"landing_page_url":"https://doi.org/10.1109/mmar55195.2022.9874304","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 26th International Conference on Methods and Models in Automation and Robotics (MMAR)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5018580542","display_name":"Oliver Petrovi\u0107","orcid":"https://orcid.org/0000-0002-4861-1332"},"institutions":[{"id":"https://openalex.org/I887968799","display_name":"RWTH Aachen University","ror":"https://ror.org/04xfq0f34","country_code":"DE","type":"education","lineage":["https://openalex.org/I887968799"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Oliver Petrovic","raw_affiliation_strings":["RWTH Aachen University,Laboratory for Machine Tools and Production Engineering (WZL),Department of Automation and Control Chair of Machine Tools,Aachen,Germany,52074"],"affiliations":[{"raw_affiliation_string":"RWTH Aachen University,Laboratory for Machine Tools and Production Engineering (WZL),Department of Automation and Control Chair of Machine Tools,Aachen,Germany,52074","institution_ids":["https://openalex.org/I887968799"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102746855","display_name":"Lukas Sch\u00e4per","orcid":"https://orcid.org/0000-0003-3767-3084"},"institutions":[{"id":"https://openalex.org/I887968799","display_name":"RWTH Aachen University","ror":"https://ror.org/04xfq0f34","country_code":"DE","type":"education","lineage":["https://openalex.org/I887968799"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Lukas Schaper","raw_affiliation_strings":["RWTH Aachen University,Laboratory for Machine Tools and Production Engineering (WZL),Department of Automation and Control Chair of Machine Tools,Aachen,Germany,52074"],"affiliations":[{"raw_affiliation_string":"RWTH Aachen University,Laboratory for Machine Tools and Production Engineering (WZL),Department of Automation and Control Chair of Machine Tools,Aachen,Germany,52074","institution_ids":["https://openalex.org/I887968799"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038342733","display_name":"Simon Roggendorf","orcid":null},"institutions":[{"id":"https://openalex.org/I887968799","display_name":"RWTH Aachen University","ror":"https://ror.org/04xfq0f34","country_code":"DE","type":"education","lineage":["https://openalex.org/I887968799"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Simon Roggendorf","raw_affiliation_strings":["RWTH Aachen University,Laboratory for Machine Tools and Production Engineering (WZL),Department of Automation and Control Chair of Machine Tools,Aachen,Germany,52074"],"affiliations":[{"raw_affiliation_string":"RWTH Aachen University,Laboratory for Machine Tools and Production Engineering (WZL),Department of Automation and Control Chair of Machine Tools,Aachen,Germany,52074","institution_ids":["https://openalex.org/I887968799"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108724527","display_name":"Simon Storms","orcid":null},"institutions":[{"id":"https://openalex.org/I887968799","display_name":"RWTH Aachen University","ror":"https://ror.org/04xfq0f34","country_code":"DE","type":"education","lineage":["https://openalex.org/I887968799"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Simon Storms","raw_affiliation_strings":["RWTH Aachen University,Laboratory for Machine Tools and Production Engineering (WZL),Department of Automation and Control Chair of Machine Tools,Aachen,Germany,52074"],"affiliations":[{"raw_affiliation_string":"RWTH Aachen University,Laboratory for Machine Tools and Production Engineering (WZL),Department of Automation and Control Chair of Machine Tools,Aachen,Germany,52074","institution_ids":["https://openalex.org/I887968799"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5067996292","display_name":"Christian Brecher","orcid":"https://orcid.org/0000-0002-8049-3364"},"institutions":[{"id":"https://openalex.org/I887968799","display_name":"RWTH Aachen University","ror":"https://ror.org/04xfq0f34","country_code":"DE","type":"education","lineage":["https://openalex.org/I887968799"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Christian Brecher","raw_affiliation_strings":["RWTH Aachen University,Laboratory for Machine Tools and Production Engineering (WZL),Department of Automation and Control Chair of Machine Tools,Aachen,Germany,52074"],"affiliations":[{"raw_affiliation_string":"RWTH Aachen University,Laboratory for Machine Tools and Production Engineering (WZL),Department of Automation and Control Chair of Machine Tools,Aachen,Germany,52074","institution_ids":["https://openalex.org/I887968799"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5018580542"],"corresponding_institution_ids":["https://openalex.org/I887968799"],"apc_list":null,"apc_paid":null,"fwci":0.964,"has_fulltext":false,"cited_by_count":8,"citation_normalized_percentile":{"value":0.74004168,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"300","last_page":"305"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12784","display_name":"Modular Robots and Swarm Intelligence","score":0.9848999977111816,"subfield":{"id":"https://openalex.org/subfields/2210","display_name":"Mechanical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7828015089035034},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.7129718065261841},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.6873652935028076},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6433203220367432},{"id":"https://openalex.org/keywords/workspace","display_name":"Workspace","score":0.5676319003105164},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4636681377887726},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.43250036239624023},{"id":"https://openalex.org/keywords/control-engineering","display_name":"Control engineering","score":0.4021160304546356},{"id":"https://openalex.org/keywords/simulation","display_name":"Simulation","score":0.3480517566204071},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.20634576678276062}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7828015089035034},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.7129718065261841},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.6873652935028076},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6433203220367432},{"id":"https://openalex.org/C58581272","wikidata":"https://www.wikidata.org/wiki/Q12741163","display_name":"Workspace","level":3,"score":0.5676319003105164},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4636681377887726},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.43250036239624023},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.4021160304546356},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.3480517566204071},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.20634576678276062},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/mmar55195.2022.9874304","is_oa":false,"landing_page_url":"https://doi.org/10.1109/mmar55195.2022.9874304","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 26th International Conference on Methods and Models in Automation and Robotics (MMAR)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W2155007355","https://openalex.org/W2167340365","https://openalex.org/W2772607898","https://openalex.org/W2781726626","https://openalex.org/W2904246096","https://openalex.org/W2952526277","https://openalex.org/W2963184939","https://openalex.org/W2963940579","https://openalex.org/W2964006217","https://openalex.org/W2968116426","https://openalex.org/W3004070224","https://openalex.org/W3012366945","https://openalex.org/W3081200565","https://openalex.org/W3100789280","https://openalex.org/W3101875589","https://openalex.org/W3130451601","https://openalex.org/W3130984490","https://openalex.org/W3131031071","https://openalex.org/W3132082252","https://openalex.org/W3207601508","https://openalex.org/W6639949747","https://openalex.org/W6682849425","https://openalex.org/W6747473740","https://openalex.org/W6757592117","https://openalex.org/W6760698134","https://openalex.org/W6785056100"],"related_works":["https://openalex.org/W2024276883","https://openalex.org/W3008208197","https://openalex.org/W2943265406","https://openalex.org/W4288361573","https://openalex.org/W3186042173","https://openalex.org/W1541885547","https://openalex.org/W4200097666","https://openalex.org/W2765383930","https://openalex.org/W3216202865","https://openalex.org/W2483341005"],"abstract_inverted_index":{"Reinforcement":[0],"learning":[1,63],"(RL)":[2],"enables":[3],"robots":[4],"to":[5,26,32,53,89,107,145,165,171],"learn":[6,54],"goal-oriented":[7],"behavior.":[8],"In":[9,46],"production":[10],"processes":[11],"with":[12],"high":[13],"variances,":[14],"such":[15],"as":[16],"joining":[17],"operations":[18],"in":[19,74,82,128,132,156],"end-of-line":[20],"assembly,":[21],"this":[22,47],"is":[23,42,152],"particularly":[24],"interesting":[25],"save":[27],"significant":[28],"programming":[29],"effort.":[30],"Due":[31],"a":[33,55,66,121,162],"large":[34],"amount":[35],"of":[36,86,95,103],"required":[37],"training":[38,41,109,143],"data,":[39],"simulative":[40],"becoming":[43],"increasingly":[44],"important.":[45],"paper,":[48],"we":[49],"present":[50],"an":[51,117],"approach":[52],"contact-rich":[56],"peg-in-hole":[57],"assembly":[58],"task":[59],"utilizing":[60],"deep":[61],"reinforcement":[62],"(DRL)":[64],"and":[65,80,93,106,135,160],"compliant":[67],"robot":[68],"controller.":[69],"The":[70,149],"DRL-Agent":[71],"learns":[72],"directly":[73],"the":[75,83,87,91,96,101,104,133,137,141,157],"Cartesian":[76],"space":[77,85],"(task":[78],"space)":[79],"not":[81],"joint":[84],"robot,":[88,139,164],"increase":[90,100],"robustness":[92,102],"efficiency":[94],"algorithms.":[97],"To":[98],"further":[99],"policy":[105,151],"shorten":[108],"times,":[110],"geometric":[111],"limitations":[112,126],"are":[113],"imposed":[114],"by":[115],"introducing":[116],"admissible":[118],"workspace":[119],"using":[120],"trajectory":[122],"generator.":[123],"Furthermore,":[124],"these":[125],"result":[127],"nearly":[129],"identical":[130],"behavior":[131],"simulation":[134,158,170],"on":[136,161],"real":[138,163],"allowing":[140],"DRL":[142],"process":[144],"be":[146],"purely":[147],"simulative.":[148],"learned":[150],"experimentally":[153],"investigated":[154],"both":[155],"environment":[159],"evaluate":[166],"its":[167],"transferability":[168],"from":[169],"reality":[172],"(sim2real).":[173]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
