{"id":"https://openalex.org/W4280630155","doi":"https://doi.org/10.1109/icra46639.2022.9812376","title":"Disturbance-injected Robust Imitation Learning with Task Achievement","display_name":"Disturbance-injected Robust Imitation Learning with Task Achievement","publication_year":2022,"publication_date":"2022-05-23","ids":{"openalex":"https://openalex.org/W4280630155","doi":"https://doi.org/10.1109/icra46639.2022.9812376"},"language":"en","primary_location":{"id":"doi:10.1109/icra46639.2022.9812376","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra46639.2022.9812376","pdf_url":null,"source":{"id":"https://openalex.org/S4363607759","display_name":"2022 International Conference on Robotics and Automation (ICRA)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5081093202","display_name":"Hirotaka Tahara","orcid":null},"institutions":[{"id":"https://openalex.org/I75917431","display_name":"Nara Institute of Science and Technology","ror":"https://ror.org/05bhada84","country_code":"JP","type":"education","lineage":["https://openalex.org/I75917431"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Hirotaka Tahara","raw_affiliation_strings":["Graduate School of Science and Technology, Nara Institute of Science and Technology,Division of Information Science,Japan","Division of Information Science, Graduate School of Science and Technology, Nara Institute of Science and Technology, Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Graduate School of Science and Technology, Nara Institute of Science and Technology,Division of Information Science,Japan","institution_ids":["https://openalex.org/I75917431"]},{"raw_affiliation_string":"Division of Information Science, Graduate School of Science and Technology, Nara Institute of Science and Technology, Japan","institution_ids":["https://openalex.org/I75917431"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007321577","display_name":"Hikaru Sasaki","orcid":"https://orcid.org/0000-0001-7380-1931"},"institutions":[{"id":"https://openalex.org/I75917431","display_name":"Nara Institute of Science and Technology","ror":"https://ror.org/05bhada84","country_code":"JP","type":"education","lineage":["https://openalex.org/I75917431"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Hikaru Sasaki","raw_affiliation_strings":["Graduate School of Science and Technology, Nara Institute of Science and Technology,Division of Information Science,Japan","Division of Information Science, Graduate School of Science and Technology, Nara Institute of Science and Technology, Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Graduate School of Science and Technology, Nara Institute of Science and Technology,Division of Information Science,Japan","institution_ids":["https://openalex.org/I75917431"]},{"raw_affiliation_string":"Division of Information Science, Graduate School of Science and Technology, Nara Institute of Science and Technology, Japan","institution_ids":["https://openalex.org/I75917431"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084521287","display_name":"Hanbit Oh","orcid":"https://orcid.org/0009-0000-8024-9778"},"institutions":[{"id":"https://openalex.org/I75917431","display_name":"Nara Institute of Science and Technology","ror":"https://ror.org/05bhada84","country_code":"JP","type":"education","lineage":["https://openalex.org/I75917431"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Hanbit Oh","raw_affiliation_strings":["Graduate School of Science and Technology, Nara Institute of Science and Technology,Division of Information Science,Japan","Division of Information Science, Graduate School of Science and Technology, Nara Institute of Science and Technology, Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Graduate School of Science and Technology, Nara Institute of Science and Technology,Division of Information Science,Japan","institution_ids":["https://openalex.org/I75917431"]},{"raw_affiliation_string":"Division of Information Science, Graduate School of Science and Technology, Nara Institute of Science and Technology, Japan","institution_ids":["https://openalex.org/I75917431"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064634210","display_name":"Brendan Michael","orcid":"https://orcid.org/0000-0002-5631-9913"},"institutions":[{"id":"https://openalex.org/I75917431","display_name":"Nara Institute of Science and Technology","ror":"https://ror.org/05bhada84","country_code":"JP","type":"education","lineage":["https://openalex.org/I75917431"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Brendan Michael","raw_affiliation_strings":["Graduate School of Science and Technology, Nara Institute of Science and Technology,Division of Information Science,Japan","Division of Information Science, Graduate School of Science and Technology, Nara Institute of Science and Technology, Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Graduate School of Science and Technology, Nara Institute of Science and Technology,Division of Information Science,Japan","institution_ids":["https://openalex.org/I75917431"]},{"raw_affiliation_string":"Division of Information Science, Graduate School of Science and Technology, Nara Institute of Science and Technology, Japan","institution_ids":["https://openalex.org/I75917431"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5042074952","display_name":"Takamitsu Matsubara","orcid":"https://orcid.org/0000-0003-3545-4814"},"institutions":[{"id":"https://openalex.org/I75917431","display_name":"Nara Institute of Science and Technology","ror":"https://ror.org/05bhada84","country_code":"JP","type":"education","lineage":["https://openalex.org/I75917431"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Takamitsu Matsubara","raw_affiliation_strings":["Graduate School of Science and Technology, Nara Institute of Science and Technology,Division of Information Science,Japan","Division of Information Science, Graduate School of Science and Technology, Nara Institute of Science and Technology, Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Graduate School of Science and Technology, Nara Institute of Science and Technology,Division of Information Science,Japan","institution_ids":["https://openalex.org/I75917431"]},{"raw_affiliation_string":"Division of Information Science, Graduate School of Science and Technology, Nara Institute of Science and Technology, Japan","institution_ids":["https://openalex.org/I75917431"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.806,"has_fulltext":false,"cited_by_count":9,"citation_normalized_percentile":{"value":0.92211713,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"2466","last_page":"2472"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9968000054359436,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9923999905586243,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/robustification","display_name":"Robustification","score":0.7712154388427734},{"id":"https://openalex.org/keywords/imitation","display_name":"Imitation","score":0.7676866054534912},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6881375908851624},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6841378808021545},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6018131971359253},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.5401723384857178},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5119855999946594},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.49743011593818665},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.49336734414100647},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.45583653450012207},{"id":"https://openalex.org/keywords/disturbance","display_name":"Disturbance (geology)","score":0.45162928104400635},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.44020533561706543},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.14831414818763733}],"concepts":[{"id":"https://openalex.org/C2778584072","wikidata":"https://www.wikidata.org/wiki/Q7353545","display_name":"Robustification","level":3,"score":0.7712154388427734},{"id":"https://openalex.org/C126388530","wikidata":"https://www.wikidata.org/wiki/Q1131737","display_name":"Imitation","level":2,"score":0.7676866054534912},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6881375908851624},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6841378808021545},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6018131971359253},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.5401723384857178},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5119855999946594},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.49743011593818665},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.49336734414100647},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.45583653450012207},{"id":"https://openalex.org/C2777601987","wikidata":"https://www.wikidata.org/wiki/Q5283581","display_name":"Disturbance (geology)","level":2,"score":0.45162928104400635},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.44020533561706543},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.14831414818763733},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C79337645","wikidata":"https://www.wikidata.org/wiki/Q779824","display_name":"Outlier","level":2,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icra46639.2022.9812376","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra46639.2022.9812376","pdf_url":null,"source":{"id":"https://openalex.org/S4363607759","display_name":"2022 International Conference on Robotics and Automation (ICRA)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G811202408","display_name":null,"funder_award_id":"JPMJMS2032","funder_id":"https://openalex.org/F4320320907","funder_display_name":"Japan Science and Technology Corporation"}],"funders":[{"id":"https://openalex.org/F4320320907","display_name":"Japan Science and Technology Corporation","ror":"https://ror.org/00097mb19"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":39,"referenced_works":["https://openalex.org/W1479682106","https://openalex.org/W1845972764","https://openalex.org/W1931877416","https://openalex.org/W2051228319","https://openalex.org/W2071841410","https://openalex.org/W2109169869","https://openalex.org/W2121490003","https://openalex.org/W2135043890","https://openalex.org/W2142641780","https://openalex.org/W2171054284","https://openalex.org/W2403171414","https://openalex.org/W2574076163","https://openalex.org/W2597234992","https://openalex.org/W2952691404","https://openalex.org/W2952996256","https://openalex.org/W2963669336","https://openalex.org/W2964120017","https://openalex.org/W3035366536","https://openalex.org/W3036472058","https://openalex.org/W3037625705","https://openalex.org/W3049481978","https://openalex.org/W3093784762","https://openalex.org/W3100789280","https://openalex.org/W3101780148","https://openalex.org/W3129803046","https://openalex.org/W3132694240","https://openalex.org/W3168354865","https://openalex.org/W3205195733","https://openalex.org/W4288284400","https://openalex.org/W6639175102","https://openalex.org/W6640174482","https://openalex.org/W6680724558","https://openalex.org/W6747311492","https://openalex.org/W6759312711","https://openalex.org/W6768977950","https://openalex.org/W6769174716","https://openalex.org/W6779370943","https://openalex.org/W6785034342","https://openalex.org/W6791770056"],"related_works":["https://openalex.org/W4387497383","https://openalex.org/W3183948672","https://openalex.org/W3173606202","https://openalex.org/W3110381201","https://openalex.org/W2948807893","https://openalex.org/W2935909890","https://openalex.org/W2778153218","https://openalex.org/W2758277628","https://openalex.org/W1531601525","https://openalex.org/W3174019841"],"abstract_inverted_index":{"Robust":[0],"imitation":[1,60],"learning":[2,61,78,87],"using":[3,115],"disturbance":[4,39,80],"injections":[5],"overcomes":[6],"issues":[7],"of":[8,36,102,107,145],"limited":[9],"variation":[10],"in":[11,119,127,154],"demonstrations.":[12,138],"However,":[13],"these":[14],"methods":[15],"assume":[16],"demonstrations":[17,33,149],"are":[18,34,131],"optimal,":[19],"and":[20,38,68,79,122,134],"that":[21,45,63,130],"policy":[22,66,77],"stabilization":[23],"can":[24],"be":[25],"learned":[26],"via":[27],"simple":[28],"augmentations.":[29],"In":[30,139],"real-world":[31],"scenarios,":[32],"often":[35],"diverse-quality,":[37],"injection":[40,81],"instead":[41],"learns":[42],"sub-optimal":[43,148],"policies":[44,129],"fail":[46],"to":[47,83,98,136],"replicate":[48],"desired":[49],"behavior.":[50],"To":[51],"address":[52],"this":[53,55,73,141],"issue,":[54],"paper":[56],"proposes":[57],"a":[58,123],"novel":[59],"framework":[62],"combines":[64],"both":[65,120],"robustification":[67],"optimal":[69],"demonstration":[70],"learning.":[71],"Specifically,":[72],"combinatorial":[74],"approach":[75],"forces":[76],"optimization":[82],"focus":[84],"on":[85],"mainly":[86],"from":[88],"high":[89],"task":[90,118],"achievement":[91,96],"demonstrations,":[92],"while":[93],"utilizing":[94],"low":[95],"ones":[97],"decrease":[99],"the":[100,108,146],"number":[101],"samples":[103],"needed.":[104],"The":[105],"effectiveness":[106],"proposed":[109],"method":[110,142],"is":[111],"verified":[112],"through":[113],"experiments":[114],"an":[116],"excavation":[117],"simulations":[121],"real":[124],"robot,":[125],"resulting":[126,153],"high-achieving":[128],"more":[132],"stable":[133],"robust":[135],"diverse-quality":[137],"addition,":[140],"utilizes":[143],"all":[144],"weighted":[147],"without":[150],"eliminating":[151],"them,":[152],"practical":[155],"data":[156],"efficiency":[157],"benefits.":[158]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
