{"id":"https://openalex.org/W4402968400","doi":"https://doi.org/10.1109/lra.2024.3471457","title":"ReplanVLM: Replanning Robotic Tasks With Visual Language Models","display_name":"ReplanVLM: Replanning Robotic Tasks With Visual Language Models","publication_year":2024,"publication_date":"2024-09-30","ids":{"openalex":"https://openalex.org/W4402968400","doi":"https://doi.org/10.1109/lra.2024.3471457"},"language":"en","primary_location":{"id":"doi:10.1109/lra.2024.3471457","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2024.3471457","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5105820351","display_name":"Aoran Mei","orcid":null},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Aoran Mei","raw_affiliation_strings":["Academy for Engineering and Technology, Fudan University, Shanghai, China"],"raw_orcid":"https://orcid.org/0009-0002-6737-8983","affiliations":[{"raw_affiliation_string":"Academy for Engineering and Technology, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050027236","display_name":"Guo\u2010Niu Zhu","orcid":"https://orcid.org/0000-0003-2421-740X"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guo-Niu Zhu","raw_affiliation_strings":["Academy for Engineering and Technology, Fudan University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0003-2421-740X","affiliations":[{"raw_affiliation_string":"Academy for Engineering and Technology, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Huaxiang Zhang","orcid":"https://orcid.org/0009-0002-4175-7547"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Huaxiang Zhang","raw_affiliation_strings":["Academy for Engineering and Technology, Fudan University, Shanghai, China"],"raw_orcid":"https://orcid.org/0009-0002-4175-7547","affiliations":[{"raw_affiliation_string":"Academy for Engineering and Technology, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5103131528","display_name":"Zhongxue Gan","orcid":"https://orcid.org/0000-0003-1365-396X"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhongxue Gan","raw_affiliation_strings":["Academy for Engineering and Technology, Fudan University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0003-1365-396X","affiliations":[{"raw_affiliation_string":"Academy for Engineering and Technology, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I24943067"],"apc_list":null,"apc_paid":null,"fwci":7.7128,"has_fulltext":false,"cited_by_count":36,"citation_normalized_percentile":{"value":0.98248305,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":"9","issue":"11","first_page":"10201","last_page":"10208"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9764999747276306,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9764999747276306,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9678000211715698,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13382","display_name":"Robotics and Automated Systems","score":0.9459999799728394,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.670323371887207},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5006630420684814},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.48982712626457214},{"id":"https://openalex.org/keywords/cognitive-science","display_name":"Cognitive science","score":0.34677132964134216},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.34553152322769165},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.2690550684928894}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.670323371887207},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5006630420684814},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.48982712626457214},{"id":"https://openalex.org/C188147891","wikidata":"https://www.wikidata.org/wiki/Q147638","display_name":"Cognitive science","level":1,"score":0.34677132964134216},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.34553152322769165},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.2690550684928894}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/lra.2024.3471457","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2024.3471457","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":22,"referenced_works":["https://openalex.org/W4224912544","https://openalex.org/W4383108457","https://openalex.org/W4388720459","https://openalex.org/W4389665575","https://openalex.org/W4389665836","https://openalex.org/W4389666115","https://openalex.org/W4390099597","https://openalex.org/W4391678022","https://openalex.org/W4392517027","https://openalex.org/W4393160795","https://openalex.org/W4401415710","https://openalex.org/W4401417048","https://openalex.org/W4401687172","https://openalex.org/W6851513886","https://openalex.org/W6852253340","https://openalex.org/W6853111285","https://openalex.org/W6854929498","https://openalex.org/W6856817465","https://openalex.org/W6857785731","https://openalex.org/W6858576426","https://openalex.org/W6859297042","https://openalex.org/W6860060064"],"related_works":["https://openalex.org/W2058170566","https://openalex.org/W2755342338","https://openalex.org/W2772917594","https://openalex.org/W2775347418","https://openalex.org/W2166024367","https://openalex.org/W3116076068","https://openalex.org/W2229312674","https://openalex.org/W2951359407","https://openalex.org/W2079911747","https://openalex.org/W1969923398"],"abstract_inverted_index":{"Large":[0],"language":[1,66],"models":[2,67],"(LLMs)":[3],"have":[4,40,174],"gained":[5],"increasing":[6],"popularity":[7],"in":[8,17,35,171,191],"robotic":[9,83,118],"task":[10,84,98,119,162],"planning":[11],"due":[12],"to":[13,49,143,154],"their":[14,25],"exceptional":[15],"abilities":[16],"text":[18],"analytics":[19],"and":[20,135,170,186],"generation,":[21],"as":[22,24,94],"well":[23],"broad":[26],"knowledge":[27],"of":[28,44,53,57,64,82,178],"the":[29,45,54,58,62,80,95,176,179],"world.":[30,59],"However,":[31],"they":[32],"fall":[33],"short":[34],"decoding":[36],"visual":[37,65,74],"cues.":[38],"LLMs":[39],"limited":[41],"direct":[42],"perception":[43,75],"world,":[46],"which":[47,77],"leads":[48],"a":[50,114],"deficient":[51],"grasp":[52],"current":[55],"state":[56],"By":[60],"contrast,":[61],"emergence":[63],"(VLMs)":[68],"fills":[69],"this":[70,111,122],"gap":[71],"by":[72],"integrating":[73],"modules,":[76],"can":[78],"enhance":[79],"autonomy":[81],"planning.":[85,120],"Despite":[86],"these":[87],"advancements,":[88],"VLMs":[89],"still":[90],"face":[91],"challenges,":[92],"such":[93,109],"potential":[96],"for":[97,117],"execution":[99,163],"errors,":[100],"even":[101],"when":[102,161],"provided":[103],"with":[104,182],"accurate":[105],"instructions.":[106],"To":[107],"address":[108],"issues,":[110],"letter":[112],"proposes":[113],"ReplanVLM":[115],"framework":[116],"In":[121],"study,":[123],"we":[124],"focus":[125],"on":[126,167],"error":[127,132,138,159,188],"correction":[128,133,139,189],"interventions.":[129],"An":[130],"internal":[131],"mechanism":[134,140],"an":[136],"external":[137],"are":[141],"presented":[142],"correct":[144,158],"errors":[145],"under":[146],"corresponding":[147],"phases.":[148],"A":[149],"replan":[150,155],"strategy":[151],"is":[152],"developed":[153],"tasks":[156],"or":[157],"codes":[160],"fails.":[164],"Experimental":[165],"results":[166],"real":[168],"robots":[169],"simulation":[172],"environments":[173],"demonstrated":[175],"superiority":[177],"proposed":[180],"framework,":[181],"higher":[183],"success":[184],"rates":[185],"robust":[187],"capabilities":[190],"open-world":[192],"tasks.":[193]},"counts_by_year":[{"year":2026,"cited_by_count":9},{"year":2025,"cited_by_count":25},{"year":2024,"cited_by_count":2}],"updated_date":"2026-06-26T08:34:08.712188","created_date":"2025-10-10T00:00:00"}
