{"id":"https://openalex.org/W4312301659","doi":"https://doi.org/10.1109/iros47612.2022.9981810","title":"Reshaping Robot Trajectories Using Natural Language Commands: A Study of Multi-Modal Data Alignment Using Transformers","display_name":"Reshaping Robot Trajectories Using Natural Language Commands: A Study of Multi-Modal Data Alignment Using Transformers","publication_year":2022,"publication_date":"2022-10-23","ids":{"openalex":"https://openalex.org/W4312301659","doi":"https://doi.org/10.1109/iros47612.2022.9981810"},"language":"en","primary_location":{"id":"doi:10.1109/iros47612.2022.9981810","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros47612.2022.9981810","pdf_url":null,"source":{"id":"https://openalex.org/S4363607704","display_name":"2022 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5089730590","display_name":"Arthur Bucker","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Arthur Bucker","raw_affiliation_strings":["Technische Universit&#x00E4;t M&#x00FC;nchen"],"affiliations":[{"raw_affiliation_string":"Technische Universit&#x00E4;t M&#x00FC;nchen","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040790541","display_name":"Luis Figueredo","orcid":"https://orcid.org/0000-0002-0759-3000"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Luis Figueredo","raw_affiliation_strings":["Technische Universit&#x00E4;t M&#x00FC;nchen"],"affiliations":[{"raw_affiliation_string":"Technische Universit&#x00E4;t M&#x00FC;nchen","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009345502","display_name":"Sami Haddadinl","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sami Haddadinl","raw_affiliation_strings":["Technische Universit&#x00E4;t M&#x00FC;nchen"],"affiliations":[{"raw_affiliation_string":"Technische Universit&#x00E4;t M&#x00FC;nchen","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046810768","display_name":"Ashish Kapoor","orcid":"https://orcid.org/0000-0002-4686-394X"},"institutions":[{"id":"https://openalex.org/I4210164937","display_name":"Microsoft Research (United Kingdom)","ror":"https://ror.org/05k87vq12","country_code":"GB","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210164937"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Ashish Kapoor","raw_affiliation_strings":["Microsoft"],"affiliations":[{"raw_affiliation_string":"Microsoft","institution_ids":["https://openalex.org/I4210164937"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100529011","display_name":"Shuang Ma","orcid":null},"institutions":[{"id":"https://openalex.org/I4210164937","display_name":"Microsoft Research (United Kingdom)","ror":"https://ror.org/05k87vq12","country_code":"GB","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210164937"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Shuang Ma","raw_affiliation_strings":["Microsoft"],"affiliations":[{"raw_affiliation_string":"Microsoft","institution_ids":["https://openalex.org/I4210164937"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5062522127","display_name":"Rogerio Bonatti","orcid":"https://orcid.org/0000-0003-3015-9613"},"institutions":[{"id":"https://openalex.org/I4210164937","display_name":"Microsoft Research (United Kingdom)","ror":"https://ror.org/05k87vq12","country_code":"GB","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210164937"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Rogerio Bonatti","raw_affiliation_strings":["Microsoft"],"affiliations":[{"raw_affiliation_string":"Microsoft","institution_ids":["https://openalex.org/I4210164937"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5089730590"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.2702,"has_fulltext":false,"cited_by_count":43,"citation_normalized_percentile":{"value":0.92015614,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"978","last_page":"984"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9955999851226807,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9930999875068665,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8300143480300903},{"id":"https://openalex.org/keywords/natural-language","display_name":"Natural language","score":0.6394291520118713},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.5700693130493164},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.5275698900222778},{"id":"https://openalex.org/keywords/trajectory","display_name":"Trajectory","score":0.47794631123542786},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4721265733242035},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.45229730010032654},{"id":"https://openalex.org/keywords/interface","display_name":"Interface (matter)","score":0.43965643644332886},{"id":"https://openalex.org/keywords/robotics","display_name":"Robotics","score":0.42653968930244446},{"id":"https://openalex.org/keywords/natural-language-understanding","display_name":"Natural language understanding","score":0.4114443063735962},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.10816437005996704}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8300143480300903},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.6394291520118713},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.5700693130493164},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.5275698900222778},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.47794631123542786},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4721265733242035},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.45229730010032654},{"id":"https://openalex.org/C113843644","wikidata":"https://www.wikidata.org/wiki/Q901882","display_name":"Interface (matter)","level":4,"score":0.43965643644332886},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.42653968930244446},{"id":"https://openalex.org/C2779439875","wikidata":"https://www.wikidata.org/wiki/Q1078276","display_name":"Natural language understanding","level":3,"score":0.4114443063735962},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.10816437005996704},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C157915830","wikidata":"https://www.wikidata.org/wiki/Q2928001","display_name":"Bubble","level":2,"score":0.0},{"id":"https://openalex.org/C129307140","wikidata":"https://www.wikidata.org/wiki/Q6795880","display_name":"Maximum bubble pressure method","level":3,"score":0.0},{"id":"https://openalex.org/C1276947","wikidata":"https://www.wikidata.org/wiki/Q333","display_name":"Astronomy","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/iros47612.2022.9981810","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros47612.2022.9981810","pdf_url":null,"source":{"id":"https://openalex.org/S4363607704","display_name":"2022 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},{"id":"pmh:oai:mediatum.ub.tum.de:node/1700074","is_oa":false,"landing_page_url":"https://mediatum.ub.tum.de/1700074","pdf_url":null,"source":{"id":"https://openalex.org/S4377196330","display_name":"mediaTUM  (Technical University of Munich)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I62916508","host_organization_name":"Technical University of Munich","host_organization_lineage":["https://openalex.org/I62916508"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"ConferencePaper"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","score":0.5699999928474426,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":64,"referenced_works":["https://openalex.org/W1424654272","https://openalex.org/W1602500555","https://openalex.org/W2003331882","https://openalex.org/W2073787051","https://openalex.org/W2099893201","https://openalex.org/W2295357975","https://openalex.org/W2896457183","https://openalex.org/W2914112028","https://openalex.org/W2962744691","https://openalex.org/W2963800628","https://openalex.org/W2966715458","https://openalex.org/W2969876226","https://openalex.org/W2970340522","https://openalex.org/W2981851019","https://openalex.org/W2990408345","https://openalex.org/W2995435108","https://openalex.org/W2997591391","https://openalex.org/W3003205975","https://openalex.org/W3033090297","https://openalex.org/W3034500398","https://openalex.org/W3098201885","https://openalex.org/W3109097593","https://openalex.org/W3160050461","https://openalex.org/W3165533860","https://openalex.org/W3167645943","https://openalex.org/W3169291081","https://openalex.org/W3175995235","https://openalex.org/W3176484337","https://openalex.org/W3195577433","https://openalex.org/W3206641383","https://openalex.org/W3207832698","https://openalex.org/W3212977909","https://openalex.org/W3215626407","https://openalex.org/W4221152848","https://openalex.org/W4221167110","https://openalex.org/W4249736682","https://openalex.org/W4287112297","https://openalex.org/W4287126489","https://openalex.org/W4292779060","https://openalex.org/W4312289535","https://openalex.org/W4385245566","https://openalex.org/W6636408305","https://openalex.org/W6739901393","https://openalex.org/W6755207826","https://openalex.org/W6759380828","https://openalex.org/W6762287338","https://openalex.org/W6765527290","https://openalex.org/W6766904570","https://openalex.org/W6767211374","https://openalex.org/W6770805772","https://openalex.org/W6778883912","https://openalex.org/W6780226713","https://openalex.org/W6784155536","https://openalex.org/W6791353385","https://openalex.org/W6796289742","https://openalex.org/W6796420931","https://openalex.org/W6797065961","https://openalex.org/W6800751262","https://openalex.org/W6801810553","https://openalex.org/W6803872405","https://openalex.org/W6803939559","https://openalex.org/W6804244202","https://openalex.org/W6809509765","https://openalex.org/W6810296985"],"related_works":["https://openalex.org/W4390722570","https://openalex.org/W4288263119","https://openalex.org/W3015724364","https://openalex.org/W3094085917","https://openalex.org/W2967994095","https://openalex.org/W4287631637","https://openalex.org/W3099576124","https://openalex.org/W4285240985","https://openalex.org/W2900126711","https://openalex.org/W4286930972"],"abstract_inverted_index":{"Natural":[0],"language":[1,21,41,90,127,143,184,210],"is":[2,22],"the":[3,39,86,97,114,131,149,200],"most":[4,37],"intuitive":[5,215],"medium":[6],"for":[7,64,75],"us":[8],"to":[9,30,71,95,141],"interact":[10],"with":[11,46,105,173],"other":[12],"people":[13],"when":[14,27],"expressing":[15],"commands":[16],"and":[17,53,93,100,129,156,219],"instructions.":[18],"However,":[19],"using":[20,108,116],"seldom":[23],"an":[24,76],"easy":[25],"task":[26],"humans":[28],"need":[29],"express":[31],"their":[32],"intent":[33],"towards":[34,212],"robots,":[35],"since":[36],"of":[38,50,82,88,162,202,207],"current":[40],"interfaces":[42,216],"require":[43],"rigid":[44],"templates":[45],"a":[47,60,69,120,136,158,174],"static":[48],"set":[49],"action":[51],"targets":[52],"commands.":[54],"In":[55,168],"this":[56],"work,":[57],"we":[58],"provide":[59],"flexible":[61],"language-based":[62],"interface":[63,185],"human-robot":[65],"collaboration,":[66],"which":[67],"allows":[68],"user":[70,98],"reshape":[72],"existing":[73],"trajectories":[74,124],"autonomous":[77],"agent.":[78],"We":[79,112,147],"take":[80,205],"advantage":[81,206],"recent":[83],"advancements":[84],"in":[85,151],"field":[87,201],"large":[89,208],"models":[91,211],"(BERT":[92],"CLIP)":[94],"encode":[96],"command,":[99],"then":[101],"combine":[102],"these":[103],"features":[104],"trajectory":[106,132,154],"information":[107],"multi-modal":[109],"attention":[110],"transformers.":[111],"train":[113],"model":[115,164],"imitation":[117],"learning":[118],"over":[119,165,186],"dataset":[121],"containing":[122],"robot":[123,175],"modified":[125],"by":[126],"commands,":[128],"treat":[130],"generation":[133,144],"process":[134],"as":[135,190],"sequence":[137],"prediction":[138],"problem,":[139],"analogously":[140],"how":[142,199],"architectures":[145],"operate.":[146],"evaluate":[148],"system":[150],"multiple":[152],"simulated":[153],"scenarios,":[155],"show":[157,177],"significant":[159],"performance":[160],"increase":[161],"our":[163,170,182],"baseline":[166],"approaches.":[167],"addition,":[169],"real-world":[171],"experiments":[172],"arm":[176],"that":[178],"users":[179],"significantly":[180],"prefer":[181],"natural":[183],"traditional":[187],"methods":[188],"such":[189],"kinesthetic":[191],"teaching":[192],"or":[193],"cost-function":[194],"programming.":[195],"Our":[196],"study":[197],"shows":[198],"robotics":[203],"can":[204],"pre-trained":[209],"creating":[213],"more":[214],"between":[217],"robots":[218],"machines.":[220],"Project":[221],"webpage:":[222],"https://arthurfenderbucker.github.io/NL_trajectory_reshaper/":[223]},"counts_by_year":[{"year":2026,"cited_by_count":5},{"year":2025,"cited_by_count":6},{"year":2024,"cited_by_count":18},{"year":2023,"cited_by_count":13},{"year":2022,"cited_by_count":1}],"updated_date":"2026-03-27T14:29:43.386196","created_date":"2025-10-10T00:00:00"}
