{"id":"https://openalex.org/W4390939340","doi":"https://doi.org/10.1109/access.2024.3355311","title":"Data-Efficient Reinforcement Learning for Variable Impedance Control","display_name":"Data-Efficient Reinforcement Learning for Variable Impedance Control","publication_year":2024,"publication_date":"2024-01-01","ids":{"openalex":"https://openalex.org/W4390939340","doi":"https://doi.org/10.1109/access.2024.3355311"},"language":"en","primary_location":{"id":"doi:10.1109/access.2024.3355311","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2024.3355311","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/10401924.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/10401924.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5046127916","display_name":"Akhil S Anand","orcid":"https://orcid.org/0000-0002-3121-578X"},"institutions":[{"id":"https://openalex.org/I204778367","display_name":"Norwegian University of Science and Technology","ror":"https://ror.org/05xg72x27","country_code":"NO","type":"education","lineage":["https://openalex.org/I204778367"]}],"countries":["NO"],"is_corresponding":true,"raw_author_name":"Akhil S. Anand","raw_affiliation_strings":["Department of Engineering Cybernetics, Norwegian University of Science and Technology (NTNU), Trondheim, Norway"],"raw_orcid":"https://orcid.org/0000-0002-3121-578X","affiliations":[{"raw_affiliation_string":"Department of Engineering Cybernetics, Norwegian University of Science and Technology (NTNU), Trondheim, Norway","institution_ids":["https://openalex.org/I204778367"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072492839","display_name":"Rituraj Kaushik","orcid":"https://orcid.org/0000-0003-2598-8804"},"institutions":[{"id":"https://openalex.org/I9927081","display_name":"Aalto University","ror":"https://ror.org/020hwjq30","country_code":"FI","type":"education","lineage":["https://openalex.org/I9927081"]}],"countries":["FI"],"is_corresponding":false,"raw_author_name":"Rituraj Kaushik","raw_affiliation_strings":["Department of Electrical Engineering and Automation (EEA), Intelligent Robotics Group, Aalto University, Espoo, Finland"],"raw_orcid":"https://orcid.org/0000-0003-2598-8804","affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering and Automation (EEA), Intelligent Robotics Group, Aalto University, Espoo, Finland","institution_ids":["https://openalex.org/I9927081"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034485872","display_name":"Jan Tommy Gravdahl","orcid":"https://orcid.org/0000-0002-5663-0795"},"institutions":[{"id":"https://openalex.org/I204778367","display_name":"Norwegian University of Science and Technology","ror":"https://ror.org/05xg72x27","country_code":"NO","type":"education","lineage":["https://openalex.org/I204778367"]}],"countries":["NO"],"is_corresponding":false,"raw_author_name":"Jan Tommy Gravdahl","raw_affiliation_strings":["Department of Engineering Cybernetics, Norwegian University of Science and Technology (NTNU), Trondheim, Norway"],"raw_orcid":"https://orcid.org/0000-0002-5663-0795","affiliations":[{"raw_affiliation_string":"Department of Engineering Cybernetics, Norwegian University of Science and Technology (NTNU), Trondheim, Norway","institution_ids":["https://openalex.org/I204778367"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5017337432","display_name":"Fares J. Abu\u2010Dakka","orcid":"https://orcid.org/0000-0001-9062-9416"},"institutions":[{"id":"https://openalex.org/I162361429","display_name":"Mondragon Unibertsitatea","ror":"https://ror.org/00wvqgd19","country_code":"ES","type":"education","lineage":["https://openalex.org/I162361429"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Fares J. Abu-Dakka","raw_affiliation_strings":["Department of Electronic and Informatics, Faculty of Engineering, Mondragon University, Arrasate, Spain","Electronic and Informatics Department, Faculty of Engineering, Mondragon Unibertsitatea, Arrasate, Spain"],"raw_orcid":"https://orcid.org/0000-0001-9062-9416","affiliations":[{"raw_affiliation_string":"Department of Electronic and Informatics, Faculty of Engineering, Mondragon University, Arrasate, Spain","institution_ids":["https://openalex.org/I162361429"]},{"raw_affiliation_string":"Electronic and Informatics Department, Faculty of Engineering, Mondragon Unibertsitatea, Arrasate, Spain","institution_ids":["https://openalex.org/I162361429"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5046127916"],"corresponding_institution_ids":["https://openalex.org/I204778367"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":1.8554,"has_fulltext":true,"cited_by_count":6,"citation_normalized_percentile":{"value":0.84190983,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":"12","issue":null,"first_page":"15631","last_page":"15641"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10784","display_name":"Muscle activation and electromyography studies","score":0.9954000115394592,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14011","display_name":"Elevator Systems and Control","score":0.9948999881744385,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.668613851070404},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6642402410507202},{"id":"https://openalex.org/keywords/variable","display_name":"Variable (mathematics)","score":0.47891175746917725},{"id":"https://openalex.org/keywords/electrical-impedance","display_name":"Electrical impedance","score":0.4100019335746765},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.39701661467552185},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.18025881052017212},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.09726822376251221},{"id":"https://openalex.org/keywords/electrical-engineering","display_name":"Electrical engineering","score":0.0883902907371521}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.668613851070404},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6642402410507202},{"id":"https://openalex.org/C182365436","wikidata":"https://www.wikidata.org/wiki/Q50701","display_name":"Variable (mathematics)","level":2,"score":0.47891175746917725},{"id":"https://openalex.org/C17829176","wikidata":"https://www.wikidata.org/wiki/Q179043","display_name":"Electrical impedance","level":2,"score":0.4100019335746765},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.39701661467552185},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.18025881052017212},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.09726822376251221},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0883902907371521},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1109/access.2024.3355311","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2024.3355311","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/10401924.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:ebiltegia.mondragon.edu:20.500.11984/6359","is_oa":true,"landing_page_url":"https://katalogoa.mondragon.edu/janium-bin/janium_login_opac.pl?find&amp;ficha_no=174317","pdf_url":null,"source":{"id":"https://openalex.org/S4377196532","display_name":"eRepository Mondragon University (Mondragon University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I162361429","host_organization_name":"Mondragon Unibertsitatea","host_organization_lineage":["https://openalex.org/I162361429"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access Vol 12","raw_type":""},{"id":"pmh:oai:aaltodoc.aalto.fi:123456789/126678","is_oa":true,"landing_page_url":"https://research.aalto.fi/en/publications/1378c5fa-26f0-4ede-93d4-bbb29f52f0fd","pdf_url":null,"source":{"id":"https://openalex.org/S4306401662","display_name":"Aaltodoc (Aalto University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I9927081","host_organization_name":"Aalto University","host_organization_lineage":["https://openalex.org/I9927081"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"publishedVersion"},{"id":"pmh:oai:doaj.org/article:1e0d71a81c084173882f960d0a067b18","is_oa":true,"landing_page_url":"https://doaj.org/article/1e0d71a81c084173882f960d0a067b18","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 12, Pp 15631-15641 (2024)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2024.3355311","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2024.3355311","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/10401924.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.5699999928474426,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[{"id":"https://openalex.org/G3167903563","display_name":null,"funder_award_id":"270941","funder_id":"https://openalex.org/F4320323299","funder_display_name":"Norges Forskningsr\u00e5d"},{"id":"https://openalex.org/G3761947859","display_name":null,"funder_award_id":"Proflow KK-2022/00024","funder_id":"https://openalex.org/F4320321705","funder_display_name":"Eusko Jaurlaritza"},{"id":"https://openalex.org/G4185420230","display_name":null,"funder_award_id":"KK-2023/00055","funder_id":"https://openalex.org/F4320321705","funder_display_name":"Eusko Jaurlaritza"},{"id":"https://openalex.org/G5403502131","display_name":null,"funder_award_id":"HELDU KK-2023/00055","funder_id":"https://openalex.org/F4320321705","funder_display_name":"Eusko Jaurlaritza"}],"funders":[{"id":"https://openalex.org/F4320321705","display_name":"Eusko Jaurlaritza","ror":"https://ror.org/00pz2fp31"},{"id":"https://openalex.org/F4320323299","display_name":"Norges Forskningsr\u00e5d","ror":"https://ror.org/00epmv149"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4390939340.pdf","grobid_xml":"https://content.openalex.org/works/W4390939340.grobid-xml"},"referenced_works_count":50,"referenced_works":["https://openalex.org/W779291494","https://openalex.org/W1500588313","https://openalex.org/W1575312501","https://openalex.org/W1892385946","https://openalex.org/W1974849157","https://openalex.org/W1978023077","https://openalex.org/W2063182199","https://openalex.org/W2078763164","https://openalex.org/W2097263684","https://openalex.org/W2100235553","https://openalex.org/W2104578628","https://openalex.org/W2112036188","https://openalex.org/W2112474089","https://openalex.org/W2124267516","https://openalex.org/W2126319939","https://openalex.org/W2133932631","https://openalex.org/W2139704669","https://openalex.org/W2156106639","https://openalex.org/W2296438681","https://openalex.org/W2604382266","https://openalex.org/W2604883922","https://openalex.org/W2885700861","https://openalex.org/W2909404881","https://openalex.org/W2950574370","https://openalex.org/W2954337773","https://openalex.org/W3000615405","https://openalex.org/W3003524200","https://openalex.org/W3003629310","https://openalex.org/W3012211643","https://openalex.org/W3028308378","https://openalex.org/W3044718039","https://openalex.org/W3081200565","https://openalex.org/W3100172161","https://openalex.org/W3101875589","https://openalex.org/W3115157241","https://openalex.org/W3202864130","https://openalex.org/W4205658840","https://openalex.org/W4211049957","https://openalex.org/W4221120003","https://openalex.org/W4250391287","https://openalex.org/W4287331155","https://openalex.org/W4324106947","https://openalex.org/W4387007853","https://openalex.org/W6680657880","https://openalex.org/W6680987236","https://openalex.org/W6702989015","https://openalex.org/W6771484861","https://openalex.org/W6790607543","https://openalex.org/W6790844918","https://openalex.org/W7048497977"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4306904969","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2138720691","https://openalex.org/W2376932109"],"abstract_inverted_index":{"One":[0],"of":[1,109,132,238],"the":[2,18,25,39,66,72,102,110,125,136,153,158,162,168,178,211,231,239,244],"most":[3],"crucial":[4],"steps":[5],"toward":[6,223],"achieving":[7],"human-like":[8],"manipulation":[9,208,227],"skills":[10,228],"in":[11,81,120,210,230,243],"robots":[12],"is":[13,143,164,219,241],"to":[14,51,78,100,146,167,176],"incorporate":[15],"compliance":[16,54,67],"into":[17],"robot":[19,50,126,175],"controller.":[20],"Compliance":[21],"not":[22],"only":[23,182],"makes":[24,31],"robot\u2019s":[26,154],"behaviour":[27],"safe":[28],"but":[29],"also":[30],"it":[32,187],"more":[33],"energy":[34],"efficient.":[35],"In":[36,83,192],"this":[37,84],"direction,":[38],"variable":[40,103],"impedance":[41,61,104,155],"control":[42],"(VIC)":[43],"approach":[44,92,119],"provides":[45],"a":[46,49,75,88,116,129,148,174,183,200,220],"framework":[47],"for":[48,161,189,206],"adapt":[52],"its":[53,133],"during":[55],"execution":[56],"by":[57,71],"employing":[58],"an":[59],"adaptive":[60],"law.":[62],"Nevertheless,":[63],"autonomously":[64,224],"adapting":[65],"profile":[68],"as":[69],"demanded":[70],"task":[73,163],"remains":[74],"challenging":[76],"problem":[77],"be":[79],"solved":[80],"practice.":[82],"work,":[85],"we":[86,114,196],"introduce":[87],"reinforcement":[89],"learning":[90,225],"(RL)-based":[91],"called":[93],"DEVILC":[94,172,198,218],"(Data-Efficient":[95],"Variable":[96],"Impedance":[97],"Learning":[98],"Controller)":[99],"learn":[101,177],"controller":[105],"through":[106,234],"real-world":[107,190],"interaction":[108],"robot.":[111],"More":[112],"concretely,":[113],"use":[115],"model-based":[117,169],"RL":[118,170],"which,":[121],"after":[122],"every":[123],"interaction,":[124],"iteratively":[127],"learns":[128],"probabilistic":[130],"model":[131,142],"dynamics":[134],"using":[135],"Gaussian":[137],"process":[138],"regression":[139],"model.":[140],"The":[141,214],"then":[144],"used":[145],"optimize":[147],"neural-network":[149],"policy":[150,180],"that":[151,157,217],"modulates":[152],"such":[156],"long-term":[159],"reward":[160],"maximized.":[165],"Thanks":[166],"framework,":[171],"allows":[173],"VIC":[179],"with":[181],"few":[184],"interactions,":[185],"making":[186],"practical":[188],"applications.":[191],"simulations":[193],"and":[194],"experiments,":[195],"evaluate":[197],"on":[199],"Franka":[201],"Emika":[202],"Panda":[203],"robotic":[204],"manipulator":[205],"different":[207],"tasks":[209],"Cartesian":[212],"space.":[213],"results":[215],"show":[216],"promising":[221],"direction":[222],"compliant":[226],"directly":[229],"real":[232],"world":[233],"interactions.":[235],"A":[236],"video":[237],"experiments":[240],"available":[242],"link:":[245],"https://youtu.be/_uyr0Vye5no":[246]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":1}],"updated_date":"2026-05-06T08:25:59.206177","created_date":"2025-10-10T00:00:00"}
