{"id":"https://openalex.org/W3195643803","doi":"https://doi.org/10.1109/iros51168.2021.9636426","title":"Monolithic vs. hybrid controller for multi-objective Sim-to-Real learning","display_name":"Monolithic vs. hybrid controller for multi-objective Sim-to-Real learning","publication_year":2021,"publication_date":"2021-09-27","ids":{"openalex":"https://openalex.org/W3195643803","doi":"https://doi.org/10.1109/iros51168.2021.9636426","mag":"3195643803"},"language":"en","primary_location":{"id":"doi:10.1109/iros51168.2021.9636426","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros51168.2021.9636426","pdf_url":null,"source":{"id":"https://openalex.org/S4363607734","display_name":"2021 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5040763124","display_name":"Atakan Dag","orcid":null},"institutions":[{"id":"https://openalex.org/I166825849","display_name":"Tampere University","ror":"https://ror.org/033003e23","country_code":"FI","type":"education","lineage":["https://openalex.org/I166825849"]}],"countries":["FI"],"is_corresponding":false,"raw_author_name":"Atakan Dag","raw_affiliation_strings":["Computing Sciences, Tampere University, Finland"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Computing Sciences, Tampere University, Finland","institution_ids":["https://openalex.org/I166825849"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066519992","display_name":"Alexandre Angleraud","orcid":"https://orcid.org/0000-0002-2291-1329"},"institutions":[{"id":"https://openalex.org/I166825849","display_name":"Tampere University","ror":"https://ror.org/033003e23","country_code":"FI","type":"education","lineage":["https://openalex.org/I166825849"]}],"countries":["FI"],"is_corresponding":false,"raw_author_name":"Alexandre Angleraud","raw_affiliation_strings":["Automation Technology and Mechanical Engineering, Tampere University, Finland"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Automation Technology and Mechanical Engineering, Tampere University, Finland","institution_ids":["https://openalex.org/I166825849"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108053789","display_name":"Wenyan Yang","orcid":"https://orcid.org/0000-0003-0016-4921"},"institutions":[{"id":"https://openalex.org/I166825849","display_name":"Tampere University","ror":"https://ror.org/033003e23","country_code":"FI","type":"education","lineage":["https://openalex.org/I166825849"]}],"countries":["FI"],"is_corresponding":false,"raw_author_name":"Wenyan Yang","raw_affiliation_strings":["Computing Sciences, Tampere University, Finland"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Computing Sciences, Tampere University, Finland","institution_ids":["https://openalex.org/I166825849"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048830674","display_name":"Nataliya Strokina","orcid":"https://orcid.org/0000-0002-7352-445X"},"institutions":[{"id":"https://openalex.org/I166825849","display_name":"Tampere University","ror":"https://ror.org/033003e23","country_code":"FI","type":"education","lineage":["https://openalex.org/I166825849"]}],"countries":["FI"],"is_corresponding":false,"raw_author_name":"Nataliya Strokina","raw_affiliation_strings":["Computing Sciences, Tampere University, Finland"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Computing Sciences, Tampere University, Finland","institution_ids":["https://openalex.org/I166825849"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077269216","display_name":"Roel Pieters","orcid":"https://orcid.org/0000-0001-6728-304X"},"institutions":[{"id":"https://openalex.org/I166825849","display_name":"Tampere University","ror":"https://ror.org/033003e23","country_code":"FI","type":"education","lineage":["https://openalex.org/I166825849"]}],"countries":["FI"],"is_corresponding":false,"raw_author_name":"Roel S. Pieters","raw_affiliation_strings":["Automation Technology and Mechanical Engineering, Tampere University, Finland"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Automation Technology and Mechanical Engineering, Tampere University, Finland","institution_ids":["https://openalex.org/I166825849"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034363573","display_name":"Minna Lanz","orcid":"https://orcid.org/0000-0003-2182-4669"},"institutions":[{"id":"https://openalex.org/I166825849","display_name":"Tampere University","ror":"https://ror.org/033003e23","country_code":"FI","type":"education","lineage":["https://openalex.org/I166825849"]}],"countries":["FI"],"is_corresponding":false,"raw_author_name":"Minna Lanz","raw_affiliation_strings":["Automation Technology and Mechanical Engineering, Tampere University, Finland"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Automation Technology and Mechanical Engineering, Tampere University, Finland","institution_ids":["https://openalex.org/I166825849"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5054822570","display_name":"Joni\u2010Kristian K\u00e4m\u00e4r\u00e4inen","orcid":"https://orcid.org/0000-0002-5801-4371"},"institutions":[{"id":"https://openalex.org/I166825849","display_name":"Tampere University","ror":"https://ror.org/033003e23","country_code":"FI","type":"education","lineage":["https://openalex.org/I166825849"]}],"countries":["FI"],"is_corresponding":false,"raw_author_name":"Joni-Kristian Kamarainen","raw_affiliation_strings":["Computing Sciences, Tampere University, Finland"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Computing Sciences, Tampere University, Finland","institution_ids":["https://openalex.org/I166825849"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.08022181,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"4576","last_page":"4582"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.996999979019165,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.996999979019165,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10142","display_name":"Formal Methods in Verification","score":0.9882000088691711,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12810","display_name":"Real-time simulation and control systems","score":0.9869999885559082,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7261085510253906},{"id":"https://openalex.org/keywords/controller","display_name":"Controller (irrigation)","score":0.7018451690673828},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6943148374557495},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5842540264129639},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5783241987228394},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.5504608154296875},{"id":"https://openalex.org/keywords/obstacle","display_name":"Obstacle","score":0.5405089259147644},{"id":"https://openalex.org/keywords/scheme","display_name":"Scheme (mathematics)","score":0.49414828419685364},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.45545923709869385},{"id":"https://openalex.org/keywords/control-engineering","display_name":"Control engineering","score":0.42075905203819275},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.41202592849731445},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3293432891368866},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.28862571716308594},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.15803003311157227},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.08127698302268982}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7261085510253906},{"id":"https://openalex.org/C203479927","wikidata":"https://www.wikidata.org/wiki/Q5165939","display_name":"Controller (irrigation)","level":2,"score":0.7018451690673828},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6943148374557495},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5842540264129639},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5783241987228394},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.5504608154296875},{"id":"https://openalex.org/C2776650193","wikidata":"https://www.wikidata.org/wiki/Q264661","display_name":"Obstacle","level":2,"score":0.5405089259147644},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.49414828419685364},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.45545923709869385},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.42075905203819275},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.41202592849731445},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3293432891368866},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.28862571716308594},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.15803003311157227},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.08127698302268982},{"id":"https://openalex.org/C78458016","wikidata":"https://www.wikidata.org/wiki/Q840400","display_name":"Evolutionary biology","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C6557445","wikidata":"https://www.wikidata.org/wiki/Q173113","display_name":"Agronomy","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iros51168.2021.9636426","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros51168.2021.9636426","pdf_url":null,"source":{"id":"https://openalex.org/S4363607734","display_name":"2021 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":50,"referenced_works":["https://openalex.org/W41554520","https://openalex.org/W1987725948","https://openalex.org/W1998649829","https://openalex.org/W2091565802","https://openalex.org/W2100677568","https://openalex.org/W2119717200","https://openalex.org/W2121863487","https://openalex.org/W2155027007","https://openalex.org/W2165150801","https://openalex.org/W2534269850","https://openalex.org/W2565233142","https://openalex.org/W2733961795","https://openalex.org/W2767050701","https://openalex.org/W2810519341","https://openalex.org/W2899460553","https://openalex.org/W2901136733","https://openalex.org/W2902067689","https://openalex.org/W2921851574","https://openalex.org/W2952629144","https://openalex.org/W2954718200","https://openalex.org/W2963293747","https://openalex.org/W2963504951","https://openalex.org/W2963864421","https://openalex.org/W2991403870","https://openalex.org/W3000059385","https://openalex.org/W3004325772","https://openalex.org/W3005431655","https://openalex.org/W3011120880","https://openalex.org/W3025701928","https://openalex.org/W3034757316","https://openalex.org/W3038610377","https://openalex.org/W3041202696","https://openalex.org/W3089353688","https://openalex.org/W3101442004","https://openalex.org/W4297686387","https://openalex.org/W4300799055","https://openalex.org/W4302570325","https://openalex.org/W6647175844","https://openalex.org/W6683204974","https://openalex.org/W6684205842","https://openalex.org/W6684921986","https://openalex.org/W6728925229","https://openalex.org/W6740801417","https://openalex.org/W6752330529","https://openalex.org/W6752818329","https://openalex.org/W6756486208","https://openalex.org/W6756581457","https://openalex.org/W6764769363","https://openalex.org/W6775686901","https://openalex.org/W6779795787"],"related_works":["https://openalex.org/W2794103424","https://openalex.org/W4245435724","https://openalex.org/W3028317537","https://openalex.org/W2389515972","https://openalex.org/W1996530509","https://openalex.org/W2376554934","https://openalex.org/W2077790809","https://openalex.org/W2906246018","https://openalex.org/W1505959757","https://openalex.org/W2055301889"],"abstract_inverted_index":{"Simulation":[0],"to":[1,8,17,20,70,119],"real":[2,158],"(Sim-to-Real)":[3],"is":[4,69,137],"an":[5,125],"attractive":[6],"approach":[7],"construct":[9],"controllers":[10,94,150],"for":[11,29],"robotic":[12],"tasks":[13,30],"that":[14,130],"are":[15],"easier":[16,138],"simulate":[18],"than":[19,145],"analytically":[21],"solve.":[22],"Working":[23],"Sim-to-Real":[24],"solutions":[25],"have":[26],"been":[27],"demonstrated":[28],"with":[31],"a":[32,75,81,86,96,116,121,134,141,146,157],"clear":[33],"single":[34,82,92],"objective":[35,93],"such":[36,51],"as":[37,52],"\"reach":[38,53],"the":[39,54,63,112,131],"target\".":[40],"Real":[41],"world":[42],"applications,":[43],"however,":[44],"often":[45],"consist":[46],"of":[47,65,115,133],"multiple":[48,72],"simultaneous":[49],"objectives":[50,73],"target\"":[55],"but":[56],"\"avoid":[57],"obstacles\".":[58],"A":[59],"straightforward":[60],"solution":[61,88],"in":[62,111,152],"context":[64],"reinforcement":[66],"learning":[67],"(RL)":[68],"combine":[71],"into":[74],"multi-term":[76],"reward":[77],"function":[78],"and":[79,95,139],"train":[80],"monolithic":[83,147],"controller.":[84,148],"Recently,":[85],"hybrid":[87,135],"based":[89],"on":[90],"pre-trained":[91],"switching":[97],"rule":[98],"between":[99],"them":[100],"was":[101],"proposed.":[102],"In":[103],"this":[104],"work,":[105],"we":[106],"compare":[107],"these":[108],"two":[109],"approaches":[110],"multi-objective":[113],"setting":[114],"robot":[117],"manipulator":[118],"reach":[120],"target":[122],"while":[123],"avoiding":[124],"obstacle.":[126],"Our":[127],"findings":[128],"show":[129],"training":[132],"controller":[136],"obtains":[140],"better":[142],"success-failure":[143],"trade-off":[144],"The":[149],"trained":[151],"simulator":[153],"were":[154],"verified":[155],"by":[156],"set-up.":[159]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
