{"id":"https://openalex.org/W2958619454","doi":"https://doi.org/10.1109/lra.2020.3011379","title":"Learning Variable Impedance Control for Contact Sensitive Tasks","display_name":"Learning Variable Impedance Control for Contact Sensitive Tasks","publication_year":2020,"publication_date":"2020-07-23","ids":{"openalex":"https://openalex.org/W2958619454","doi":"https://doi.org/10.1109/lra.2020.3011379","mag":"2958619454"},"language":"en","primary_location":{"id":"doi:10.1109/lra.2020.3011379","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2020.3011379","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/1907.07500","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5032586525","display_name":"Miroslav Bogdanovi\u0107","orcid":"https://orcid.org/0000-0001-7255-7658"},"institutions":[{"id":"https://openalex.org/I4210135521","display_name":"Max Planck Institute for Intelligent Systems","ror":"https://ror.org/04fq9j139","country_code":"DE","type":"facility","lineage":["https://openalex.org/I149899117","https://openalex.org/I4210135521"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Miroslav Bogdanovic","raw_affiliation_strings":["Max-Planck Institute for Intelligent Systems, T\u00fcbingen, Germany","[Max-Planck Institute for Intelligent Systems, Tubingen, Germany]"],"raw_orcid":"https://orcid.org/0000-0001-7255-7658","affiliations":[{"raw_affiliation_string":"Max-Planck Institute for Intelligent Systems, T\u00fcbingen, Germany","institution_ids":["https://openalex.org/I4210135521"]},{"raw_affiliation_string":"[Max-Planck Institute for Intelligent Systems, Tubingen, Germany]","institution_ids":["https://openalex.org/I4210135521"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043216529","display_name":"Majid Khadiv","orcid":"https://orcid.org/0000-0001-9889-6543"},"institutions":[{"id":"https://openalex.org/I4210135521","display_name":"Max Planck Institute for Intelligent Systems","ror":"https://ror.org/04fq9j139","country_code":"DE","type":"facility","lineage":["https://openalex.org/I149899117","https://openalex.org/I4210135521"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Majid Khadiv","raw_affiliation_strings":["Max-Planck Institute for Intelligent Systems, T\u00fcbingen, Germany","[Max-Planck Institute for Intelligent Systems, Tubingen, Germany]"],"raw_orcid":"https://orcid.org/0000-0001-9889-6543","affiliations":[{"raw_affiliation_string":"Max-Planck Institute for Intelligent Systems, T\u00fcbingen, Germany","institution_ids":["https://openalex.org/I4210135521"]},{"raw_affiliation_string":"[Max-Planck Institute for Intelligent Systems, Tubingen, Germany]","institution_ids":["https://openalex.org/I4210135521"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5026007843","display_name":"Ludovic Righetti","orcid":"https://orcid.org/0000-0002-6458-9112"},"institutions":[{"id":"https://openalex.org/I149899117","display_name":"Max Planck Society","ror":"https://ror.org/01hhn8329","country_code":"DE","type":"nonprofit","lineage":["https://openalex.org/I149899117"]},{"id":"https://openalex.org/I4210135521","display_name":"Max Planck Institute for Intelligent Systems","ror":"https://ror.org/04fq9j139","country_code":"DE","type":"facility","lineage":["https://openalex.org/I149899117","https://openalex.org/I4210135521"]},{"id":"https://openalex.org/I57206974","display_name":"New York University","ror":"https://ror.org/0190ak572","country_code":"US","type":"education","lineage":["https://openalex.org/I57206974"]}],"countries":["DE","US"],"is_corresponding":false,"raw_author_name":"Ludovic Righetti","raw_affiliation_strings":["Max-Planck Institute for Intelligent Systems, T\u00fcbingen, Germany","Tandon School of Engineering, New York University, New York, USA","Max-Planck-Society"],"raw_orcid":"https://orcid.org/0000-0002-6458-9112","affiliations":[{"raw_affiliation_string":"Max-Planck Institute for Intelligent Systems, T\u00fcbingen, Germany","institution_ids":["https://openalex.org/I4210135521"]},{"raw_affiliation_string":"Tandon School of Engineering, New York University, New York, USA","institution_ids":["https://openalex.org/I57206974"]},{"raw_affiliation_string":"Max-Planck-Society","institution_ids":["https://openalex.org/I149899117"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5032586525"],"corresponding_institution_ids":["https://openalex.org/I4210135521"],"apc_list":null,"apc_paid":null,"fwci":0.5951,"has_fulltext":true,"cited_by_count":4,"citation_normalized_percentile":{"value":0.65451078,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":"5","issue":"4","first_page":"6129","last_page":"6136"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":1.0,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":1.0,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10868","display_name":"Soft Robotics and Applications","score":0.9793000221252441,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/interpretability","display_name":"Interpretability","score":0.8653686046600342},{"id":"https://openalex.org/keywords/impedance-control","display_name":"Impedance control","score":0.7927099466323853},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6625306010246277},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6384725570678711},{"id":"https://openalex.org/keywords/torque","display_name":"Torque","score":0.5676347017288208},{"id":"https://openalex.org/keywords/position","display_name":"Position (finance)","score":0.5579288005828857},{"id":"https://openalex.org/keywords/robotics","display_name":"Robotics","score":0.5437880158424377},{"id":"https://openalex.org/keywords/variable","display_name":"Variable (mathematics)","score":0.5139910578727722},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5113248229026794},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.5111387372016907},{"id":"https://openalex.org/keywords/space","display_name":"Space (punctuation)","score":0.4869714677333832},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.47314441204071045},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.459827184677124},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.40107738971710205},{"id":"https://openalex.org/keywords/control-engineering","display_name":"Control engineering","score":0.3363885283470154},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.175441712141037},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.14321252703666687}],"concepts":[{"id":"https://openalex.org/C2781067378","wikidata":"https://www.wikidata.org/wiki/Q17027399","display_name":"Interpretability","level":2,"score":0.8653686046600342},{"id":"https://openalex.org/C2777984285","wikidata":"https://www.wikidata.org/wiki/Q17098134","display_name":"Impedance control","level":3,"score":0.7927099466323853},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6625306010246277},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6384725570678711},{"id":"https://openalex.org/C144171764","wikidata":"https://www.wikidata.org/wiki/Q48103","display_name":"Torque","level":2,"score":0.5676347017288208},{"id":"https://openalex.org/C198082294","wikidata":"https://www.wikidata.org/wiki/Q3399648","display_name":"Position (finance)","level":2,"score":0.5579288005828857},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.5437880158424377},{"id":"https://openalex.org/C182365436","wikidata":"https://www.wikidata.org/wiki/Q50701","display_name":"Variable (mathematics)","level":2,"score":0.5139910578727722},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5113248229026794},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.5111387372016907},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.4869714677333832},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.47314441204071045},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.459827184677124},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.40107738971710205},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.3363885283470154},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.175441712141037},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.14321252703666687},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C10138342","wikidata":"https://www.wikidata.org/wiki/Q43015","display_name":"Finance","level":1,"score":0.0},{"id":"https://openalex.org/C97355855","wikidata":"https://www.wikidata.org/wiki/Q11473","display_name":"Thermodynamics","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1109/lra.2020.3011379","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2020.3011379","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:1907.07500","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1907.07500","pdf_url":"https://arxiv.org/pdf/1907.07500","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":null},{"id":"doi:10.48550/arxiv.1907.07500","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.1907.07500","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"},{"id":"mag:2958619454","is_oa":false,"landing_page_url":null,"pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":null}],"best_oa_location":{"id":"pmh:oai:arXiv.org:1907.07500","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1907.07500","pdf_url":"https://arxiv.org/pdf/1907.07500","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":null},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2958619454.pdf","grobid_xml":"https://content.openalex.org/works/W2958619454.grobid-xml"},"referenced_works_count":30,"referenced_works":["https://openalex.org/W1499277207","https://openalex.org/W1978023077","https://openalex.org/W2061350632","https://openalex.org/W2064173399","https://openalex.org/W2068923975","https://openalex.org/W2100235553","https://openalex.org/W2125602005","https://openalex.org/W2133932631","https://openalex.org/W2169187067","https://openalex.org/W2284232578","https://openalex.org/W2517641405","https://openalex.org/W2546975091","https://openalex.org/W2762329249","https://openalex.org/W2767050701","https://openalex.org/W2911087563","https://openalex.org/W2919187111","https://openalex.org/W2949275450","https://openalex.org/W2949658140","https://openalex.org/W2963864421","https://openalex.org/W2968268581","https://openalex.org/W2977389550","https://openalex.org/W3003524200","https://openalex.org/W3003629310","https://openalex.org/W3007035358","https://openalex.org/W3101442004","https://openalex.org/W3101870171","https://openalex.org/W3105320065","https://openalex.org/W3151089333","https://openalex.org/W4300892751","https://openalex.org/W6684921986"],"related_works":["https://openalex.org/W3105320065","https://openalex.org/W3093541907","https://openalex.org/W2999490157","https://openalex.org/W2968021416","https://openalex.org/W2399469065","https://openalex.org/W1555368087","https://openalex.org/W2513373085","https://openalex.org/W2895958971","https://openalex.org/W2919334316","https://openalex.org/W3024554557","https://openalex.org/W2735268712","https://openalex.org/W2953082648","https://openalex.org/W2100370041","https://openalex.org/W2796496570","https://openalex.org/W2944714385","https://openalex.org/W1965226337","https://openalex.org/W2565122071","https://openalex.org/W2985871261","https://openalex.org/W2569873438","https://openalex.org/W23935843"],"abstract_inverted_index":{"Reinforcement":[0],"learning":[1,92],"algorithms":[2],"have":[3],"shown":[4],"great":[5],"success":[6],"in":[7,32,49,66,85,102,150,158],"solving":[8],"different":[9,118],"problems":[10],"ranging":[11],"from":[12],"playing":[13],"video":[14],"games":[15],"to":[16,21,43,45,57,112,129,143],"robotics.":[17],"However,":[18],"they":[19],"struggle":[20],"solve":[22,59],"delicate":[23],"robotic":[24],"problems,":[25],"especially":[26],"those":[27],"involving":[28,160],"contact":[29,88,119,161],"interactions.":[30],"Though":[31],"principle":[33],"a":[34,93,173],"policy":[35,94],"directly":[36],"outputting":[37],"joint":[38,103],"torques":[39],"should":[40],"be":[41,179],"able":[42],"learn":[44],"perform":[46],"these":[47,131],"tasks,":[48],"practice":[50],"we":[51,73,122],"see":[52],"that":[53,110],"it":[54],"has":[55],"difficulty":[56],"robustly":[58],"the":[60,67,76,107,169],"problem":[61],"without":[62],"any":[63],"given":[64],"structure":[65],"action":[68,79],"space.":[69],"In":[70],"this":[71],"letter,":[72],"investigate":[74],"how":[75],"choice":[77],"of":[78,87,109,152],"space":[80,104],"can":[81,178],"give":[82],"robust":[83],"performance":[84,108],"presence":[86],"uncertainties.":[89,120],"We":[90,146],"propose":[91,123],"giving":[95,136],"as":[96,163,165],"output":[97],"impedance":[98,133],"and":[99,105,114,139,155],"desired":[100],"position":[101,115],"compare":[106],"approach":[111],"torque":[113],"control":[116,134],"under":[117],"Furthermore,":[121],"an":[124],"additional":[125],"reward":[126],"term":[127],"designed":[128],"regularize":[130],"variable":[132],"policies,":[135],"them":[137],"interpretability":[138],"facilitating":[140],"their":[141],"transfer":[142],"real":[144,174],"systems.":[145],"present":[147],"extensive":[148],"experiments":[149],"simulation":[151],"both":[153],"floating":[154],"fixed-base":[156],"systems":[157],"tasks":[159],"uncertainties,":[162],"well":[164],"results":[166],"for":[167],"running":[168],"learned":[170],"policies":[171],"on":[172],"system":[175],"(accompanying":[176],"videos":[177],"seen":[180],"here:":[181],"https://youtu.be/AQuuQ-h4dBM).":[182]},"counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
