{"id":"https://openalex.org/W4400877404","doi":"https://doi.org/10.1109/tro.2024.3431988","title":"Efficient Deep Learning of Robust Policies From MPC Using Imitation and Tube-Guided Data Augmentation","display_name":"Efficient Deep Learning of Robust Policies From MPC Using Imitation and Tube-Guided Data Augmentation","publication_year":2024,"publication_date":"2024-01-01","ids":{"openalex":"https://openalex.org/W4400877404","doi":"https://doi.org/10.1109/tro.2024.3431988"},"language":"en","primary_location":{"id":"doi:10.1109/tro.2024.3431988","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tro.2024.3431988","pdf_url":null,"source":{"id":"https://openalex.org/S144620930","display_name":"IEEE Transactions on Robotics","issn_l":"1552-3098","issn":["1552-3098","1941-0468"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Robotics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102712548","display_name":"Andrea Tagliabue","orcid":"https://orcid.org/0000-0003-3376-4114"},"institutions":[{"id":"https://openalex.org/I46020346","display_name":"American Institute of Aeronautics and Astronautics","ror":"https://ror.org/00a1rzv11","country_code":"US","type":"other","lineage":["https://openalex.org/I46020346"]},{"id":"https://openalex.org/I63966007","display_name":"Massachusetts Institute of Technology","ror":"https://ror.org/042nb2s44","country_code":"US","type":"education","lineage":["https://openalex.org/I63966007"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Andrea Tagliabue","raw_affiliation_strings":["Department of Aeronautics and Astronautics, Massachusetts Institute of Technology, Cambridge, MA, USA"],"affiliations":[{"raw_affiliation_string":"Department of Aeronautics and Astronautics, Massachusetts Institute of Technology, Cambridge, MA, USA","institution_ids":["https://openalex.org/I46020346","https://openalex.org/I63966007"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5011665886","display_name":"Jonathan P. How","orcid":"https://orcid.org/0000-0001-8576-1930"},"institutions":[{"id":"https://openalex.org/I46020346","display_name":"American Institute of Aeronautics and Astronautics","ror":"https://ror.org/00a1rzv11","country_code":"US","type":"other","lineage":["https://openalex.org/I46020346"]},{"id":"https://openalex.org/I63966007","display_name":"Massachusetts Institute of Technology","ror":"https://ror.org/042nb2s44","country_code":"US","type":"education","lineage":["https://openalex.org/I63966007"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jonathan P. How","raw_affiliation_strings":["Department of Aeronautics and Astronautics, Massachusetts Institute of Technology, Cambridge, MA, USA"],"affiliations":[{"raw_affiliation_string":"Department of Aeronautics and Astronautics, Massachusetts Institute of Technology, Cambridge, MA, USA","institution_ids":["https://openalex.org/I46020346","https://openalex.org/I63966007"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5102712548"],"corresponding_institution_ids":["https://openalex.org/I46020346","https://openalex.org/I63966007"],"apc_list":null,"apc_paid":null,"fwci":7.3281,"has_fulltext":false,"cited_by_count":21,"citation_normalized_percentile":{"value":0.97762858,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":100},"biblio":{"volume":"40","issue":null,"first_page":"4301","last_page":"4321"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10791","display_name":"Advanced Control Systems Optimization","score":0.9352999925613403,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10791","display_name":"Advanced Control Systems Optimization","score":0.9352999925613403,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/imitation","display_name":"Imitation","score":0.64308762550354},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6131682395935059},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5316458344459534},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.4619600772857666},{"id":"https://openalex.org/keywords/tube","display_name":"Tube (container)","score":0.43964022397994995},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.32357025146484375},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.26285699009895325},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.18526864051818848},{"id":"https://openalex.org/keywords/mechanical-engineering","display_name":"Mechanical engineering","score":0.09888318181037903}],"concepts":[{"id":"https://openalex.org/C126388530","wikidata":"https://www.wikidata.org/wiki/Q1131737","display_name":"Imitation","level":2,"score":0.64308762550354},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6131682395935059},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5316458344459534},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.4619600772857666},{"id":"https://openalex.org/C2777551473","wikidata":"https://www.wikidata.org/wiki/Q2093072","display_name":"Tube (container)","level":2,"score":0.43964022397994995},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.32357025146484375},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.26285699009895325},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.18526864051818848},{"id":"https://openalex.org/C78519656","wikidata":"https://www.wikidata.org/wiki/Q101333","display_name":"Mechanical engineering","level":1,"score":0.09888318181037903},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tro.2024.3431988","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tro.2024.3431988","pdf_url":null,"source":{"id":"https://openalex.org/S144620930","display_name":"IEEE Transactions on Robotics","issn_l":"1552-3098","issn":["1552-3098","1941-0468"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Robotics","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.4099999964237213,"id":"https://metadata.un.org/sdg/2","display_name":"Zero hunger"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":83,"referenced_works":["https://openalex.org/W195033972","https://openalex.org/W1522301498","https://openalex.org/W1763790326","https://openalex.org/W1873756947","https://openalex.org/W1923344279","https://openalex.org/W1977164425","https://openalex.org/W1980969546","https://openalex.org/W1981723834","https://openalex.org/W2025752438","https://openalex.org/W2043837315","https://openalex.org/W2066425650","https://openalex.org/W2080407798","https://openalex.org/W2093187605","https://openalex.org/W2117402460","https://openalex.org/W2163045496","https://openalex.org/W2167224731","https://openalex.org/W2342840547","https://openalex.org/W2410617946","https://openalex.org/W2559336140","https://openalex.org/W2618092744","https://openalex.org/W2749680651","https://openalex.org/W2758653969","https://openalex.org/W2767050701","https://openalex.org/W2768748954","https://openalex.org/W2769646558","https://openalex.org/W2907380995","https://openalex.org/W2925761457","https://openalex.org/W2963966702","https://openalex.org/W2964070888","https://openalex.org/W2968116426","https://openalex.org/W2972830116","https://openalex.org/W2972864268","https://openalex.org/W2979863294","https://openalex.org/W2982095652","https://openalex.org/W2997406364","https://openalex.org/W3033405912","https://openalex.org/W3038825904","https://openalex.org/W3039984786","https://openalex.org/W3095839831","https://openalex.org/W3097841467","https://openalex.org/W3100238596","https://openalex.org/W3100769368","https://openalex.org/W3101442004","https://openalex.org/W3101780148","https://openalex.org/W3101798601","https://openalex.org/W3102552342","https://openalex.org/W3105570727","https://openalex.org/W3107452320","https://openalex.org/W3130833653","https://openalex.org/W3148417208","https://openalex.org/W3155272911","https://openalex.org/W3158675508","https://openalex.org/W3181621367","https://openalex.org/W3185165122","https://openalex.org/W3197225143","https://openalex.org/W3201459714","https://openalex.org/W3207305612","https://openalex.org/W3208705304","https://openalex.org/W3212975979","https://openalex.org/W3217056046","https://openalex.org/W4205550208","https://openalex.org/W4206101760","https://openalex.org/W4214717370","https://openalex.org/W4285163488","https://openalex.org/W4286372820","https://openalex.org/W4306850145","https://openalex.org/W4312187283","https://openalex.org/W4313679833","https://openalex.org/W4364322337","https://openalex.org/W4379116938","https://openalex.org/W4386718967","https://openalex.org/W6631190155","https://openalex.org/W6640174482","https://openalex.org/W6675999342","https://openalex.org/W6684338915","https://openalex.org/W6704559304","https://openalex.org/W6747311492","https://openalex.org/W6757304564","https://openalex.org/W6772071412","https://openalex.org/W6784826119","https://openalex.org/W6800464454","https://openalex.org/W6855355228","https://openalex.org/W7065631163"],"related_works":["https://openalex.org/W2731899572","https://openalex.org/W3215138031","https://openalex.org/W2058170566","https://openalex.org/W2755342338","https://openalex.org/W2772917594","https://openalex.org/W2775347418","https://openalex.org/W2166024367","https://openalex.org/W3009238340","https://openalex.org/W3116076068","https://openalex.org/W2229312674"],"abstract_inverted_index":{"Imitation":[0],"learning":[1],"(IL)":[2],"can":[3],"generate":[4,117],"computationally":[5,58,96],"efficient":[6,97],"policies":[7,37],"from":[8,91,135],"demonstrations":[9,111],"provided":[10],"by":[11],"model":[12,164],"predictive":[13],"control":[14],"(MPC).":[15],"However,":[16],"IL":[17,50,189],"methods":[18,100],"often":[19],"require":[20],"extensive":[21],"data-collection":[22],"and":[23,34,88,112,171,193,202,214],"training-efforts,":[24],"limiting":[25],"changes":[26],"to":[27,41,52,72,116,156,204],"the":[28,31,82,92,107,124,212],"policy":[29,66,133],"if":[30],"task":[32],"changes,":[33],"they":[35],"produce":[36],"with":[38,160],"limited":[39],"robustness":[40,203],"new":[42,158],"disturbances.":[43,75],"In":[44],"this":[45],"work,":[46],"we":[47,94],"propose":[48],"an":[49],"strategy":[51],"<italic":[53,69,127],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[54,70,128],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">efficiently</i>":[55],"compress":[56],"a":[57,62,78,103,118,132,136,142,147,150,153,157,178],"expensive":[59],"MPC":[60,110,138,173],"into":[61],"deep":[63],"neural":[64],"network":[65],"that":[67,101,181],"is":[68],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">robust</i>":[71],"previously":[73,161],"unseen":[74,162,206],"By":[76],"using":[77,169],"robust":[79,85,119],"variant":[80],"of":[81,106,109,126,131,198],"MPC,":[83,87],"called":[84],"tube":[86],"leveraging":[89],"properties":[90],"controller,":[93],"introduce":[95],"data":[98],"augmentation":[99],"enable":[102],"significant":[104],"reduction":[105],"number":[108],"training":[113,200],"efforts":[114],"required":[115],"policy.":[120],"Our":[121],"approach":[122],"opens":[123],"possibility":[125],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">zero-shot</i>":[129],"transfer":[130],"trained":[134],"single":[137],"demonstration":[139],"collected":[140],"in":[141,152,188,196],"nominal":[143],"domain,":[144],"such":[145],"as":[146,191],"simulation":[148],"or":[149],"robot":[151],"lab/controlled":[154],"environment,":[155],"domain":[159,194],"bounded":[163],"errors/perturbations.":[165],"Numerical":[166],"evaluations":[167,210],"performed":[168],"linear":[170],"nonlinear":[172],"for":[174],"agile":[175],"flight":[176],"on":[177],"multirotor":[179],"show":[180],"our":[182],"method":[183],"outperforms":[184],"strategies":[185],"commonly":[186],"employed":[187],"(such":[190],"dataset-aggregation":[192],"randomization)":[195],"terms":[197],"demonstration-efficiency,":[199],"time,":[201],"perturbations":[205],"during":[207],"training.":[208],"Experimental":[209],"validate":[211],"efficiency":[213],"real-world":[215],"robustness.":[216]},"counts_by_year":[{"year":2026,"cited_by_count":4},{"year":2025,"cited_by_count":16},{"year":2024,"cited_by_count":1}],"updated_date":"2026-02-25T23:00:34.991745","created_date":"2025-10-10T00:00:00"}
