{"id":"https://openalex.org/W4416251895","doi":"https://doi.org/10.1109/ijcnn64981.2025.11228672","title":"LLM-based Interactive Imitation Learning for Robotic Manipulation","display_name":"LLM-based Interactive Imitation Learning for Robotic Manipulation","publication_year":2025,"publication_date":"2025-06-30","ids":{"openalex":"https://openalex.org/W4416251895","doi":"https://doi.org/10.1109/ijcnn64981.2025.11228672"},"language":null,"primary_location":{"id":"doi:10.1109/ijcnn64981.2025.11228672","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn64981.2025.11228672","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5064003089","display_name":"Jonas Werner","orcid":"https://orcid.org/0000-0002-4068-0018"},"institutions":[{"id":"https://openalex.org/I159176309","display_name":"Universit\u00e4t Hamburg","ror":"https://ror.org/00g30e956","country_code":"DE","type":"education","lineage":["https://openalex.org/I159176309"]},{"id":"https://openalex.org/I884043246","display_name":"Hamburg University of Technology","ror":"https://ror.org/04bs1pb34","country_code":"DE","type":"education","lineage":["https://openalex.org/I884043246"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Jonas Werner","raw_affiliation_strings":["University of Hamburg,Knowledge Technology,Department of Informatics,Hamburg,Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Hamburg,Knowledge Technology,Department of Informatics,Hamburg,Germany","institution_ids":["https://openalex.org/I159176309","https://openalex.org/I884043246"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055384333","display_name":"Kun Chu","orcid":null},"institutions":[{"id":"https://openalex.org/I159176309","display_name":"Universit\u00e4t Hamburg","ror":"https://ror.org/00g30e956","country_code":"DE","type":"education","lineage":["https://openalex.org/I159176309"]},{"id":"https://openalex.org/I884043246","display_name":"Hamburg University of Technology","ror":"https://ror.org/04bs1pb34","country_code":"DE","type":"education","lineage":["https://openalex.org/I884043246"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Kun Chu","raw_affiliation_strings":["University of Hamburg,Knowledge Technology,Department of Informatics,Hamburg,Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Hamburg,Knowledge Technology,Department of Informatics,Hamburg,Germany","institution_ids":["https://openalex.org/I159176309","https://openalex.org/I884043246"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102025003","display_name":"Cornelius Weber","orcid":"https://orcid.org/0000-0001-5163-938X"},"institutions":[{"id":"https://openalex.org/I159176309","display_name":"Universit\u00e4t Hamburg","ror":"https://ror.org/00g30e956","country_code":"DE","type":"education","lineage":["https://openalex.org/I159176309"]},{"id":"https://openalex.org/I884043246","display_name":"Hamburg University of Technology","ror":"https://ror.org/04bs1pb34","country_code":"DE","type":"education","lineage":["https://openalex.org/I884043246"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Cornelius Weber","raw_affiliation_strings":["University of Hamburg,Knowledge Technology,Department of Informatics,Hamburg,Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Hamburg,Knowledge Technology,Department of Informatics,Hamburg,Germany","institution_ids":["https://openalex.org/I159176309","https://openalex.org/I884043246"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5076224149","display_name":"Stefan Wermter","orcid":null},"institutions":[{"id":"https://openalex.org/I159176309","display_name":"Universit\u00e4t Hamburg","ror":"https://ror.org/00g30e956","country_code":"DE","type":"education","lineage":["https://openalex.org/I159176309"]},{"id":"https://openalex.org/I884043246","display_name":"Hamburg University of Technology","ror":"https://ror.org/04bs1pb34","country_code":"DE","type":"education","lineage":["https://openalex.org/I884043246"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Stefan Wermter","raw_affiliation_strings":["University of Hamburg,Knowledge Technology,Department of Informatics,Hamburg,Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Hamburg,Knowledge Technology,Department of Informatics,Hamburg,Germany","institution_ids":["https://openalex.org/I159176309","https://openalex.org/I884043246"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5064003089"],"corresponding_institution_ids":["https://openalex.org/I159176309","https://openalex.org/I884043246"],"apc_list":null,"apc_paid":null,"fwci":2.1886,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.90128344,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"9"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.38499999046325684,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.38499999046325684,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.21549999713897705,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.07039999961853027,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.5139999985694885},{"id":"https://openalex.org/keywords/imitation","display_name":"Imitation","score":0.5005000233650208},{"id":"https://openalex.org/keywords/python","display_name":"Python (programming language)","score":0.4438000023365021},{"id":"https://openalex.org/keywords/human\u2013robot-interaction","display_name":"Human\u2013robot interaction","score":0.4189000129699707},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.40790000557899475},{"id":"https://openalex.org/keywords/interactive-learning","display_name":"Interactive Learning","score":0.3741999864578247},{"id":"https://openalex.org/keywords/robotics","display_name":"Robotics","score":0.367900013923645}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7218000292778015},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5921000242233276},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.5860999822616577},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.5139999985694885},{"id":"https://openalex.org/C126388530","wikidata":"https://www.wikidata.org/wiki/Q1131737","display_name":"Imitation","level":2,"score":0.5005000233650208},{"id":"https://openalex.org/C519991488","wikidata":"https://www.wikidata.org/wiki/Q28865","display_name":"Python (programming language)","level":2,"score":0.4438000023365021},{"id":"https://openalex.org/C145460709","wikidata":"https://www.wikidata.org/wiki/Q859951","display_name":"Human\u2013robot interaction","level":3,"score":0.4189000129699707},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.40790000557899475},{"id":"https://openalex.org/C2776716048","wikidata":"https://www.wikidata.org/wiki/Q6045290","display_name":"Interactive Learning","level":2,"score":0.3741999864578247},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.367900013923645},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.3352999985218048},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3343000113964081},{"id":"https://openalex.org/C121050878","wikidata":"https://www.wikidata.org/wiki/Q5135020","display_name":"Cloning (programming)","level":2,"score":0.3160000145435333},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.29510000348091125},{"id":"https://openalex.org/C188888258","wikidata":"https://www.wikidata.org/wiki/Q7353390","display_name":"Robot learning","level":4,"score":0.2815000116825104},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.2799000144004822},{"id":"https://openalex.org/C179518139","wikidata":"https://www.wikidata.org/wiki/Q5140297","display_name":"Coding (social sciences)","level":2,"score":0.27799999713897705},{"id":"https://openalex.org/C2779305910","wikidata":"https://www.wikidata.org/wiki/Q5172809","display_name":"Corrective feedback","level":2,"score":0.2653999924659729},{"id":"https://openalex.org/C77967617","wikidata":"https://www.wikidata.org/wiki/Q4677561","display_name":"Active learning (machine learning)","level":2,"score":0.2581999897956848}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ijcnn64981.2025.11228672","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn64981.2025.11228672","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320322725","display_name":"China Scholarship Council","ror":"https://ror.org/04atp4p48"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":19,"referenced_works":["https://openalex.org/W2031571562","https://openalex.org/W2053910308","https://openalex.org/W2076337359","https://openalex.org/W2174803659","https://openalex.org/W2792217087","https://openalex.org/W2794908222","https://openalex.org/W3007769740","https://openalex.org/W3185341429","https://openalex.org/W3202542428","https://openalex.org/W4312361190","https://openalex.org/W4383097638","https://openalex.org/W4383108457","https://openalex.org/W4385245566","https://openalex.org/W4385572162","https://openalex.org/W4389665575","https://openalex.org/W4394828156","https://openalex.org/W4399374221","https://openalex.org/W4404953341","https://openalex.org/W4413925071"],"related_works":[],"abstract_inverted_index":{"Recent":[0],"advancements":[1],"in":[2,20,52,98,142,146,203,224],"machine":[3],"learning":[4,226],"provide":[5],"methods":[6,172],"to":[7,32,65,83,120],"train":[8],"autonomous":[9],"agents":[10,30,64],"capable":[11],"of":[12,17,86,93,213,218],"handling":[13],"the":[14,45,84,90,126,140,164,204,216,231],"increasing":[15],"complexity":[16],"sequential":[18],"decision-making":[19],"robotics.":[21],"Imitation":[22,56],"Learning":[23,57],"(IL)":[24],"is":[25],"a":[26,108,134,144,151,183,188],"prominent":[27],"approach,":[28],"where":[29],"learn":[31,66],"control":[33],"robots":[34],"based":[35],"on":[36,128,191,239],"human":[37,71,87,129,189],"demonstrations.":[38],"However,":[39],"IL":[40,179],"commonly":[41],"suffers":[42],"from":[43,67,70],"violating":[44],"independent":[46],"and":[47,100,159,181,207,244],"identically":[48],"distributed":[49],"(i.i.d)":[50],"assumption":[51],"robotic":[53,193],"tasks.":[54,195,241],"Interactive":[55],"(IIL)":[58],"achieves":[59,208],"improved":[60],"performance":[61,123],"by":[62,236],"allowing":[63],"interactive":[68,118,225],"feedback":[69,154,161],"teachers.":[72],"Despite":[73],"these":[74],"improvements,":[75],"both":[76],"approaches":[77],"come":[78],"with":[79,150],"significant":[80],"costs":[81],"due":[82],"necessity":[85],"involvement.":[88],"Leveraging":[89],"emergent":[91],"capabilities":[92],"Large":[94],"Language":[95],"Models":[96],"(LLMs)":[97],"reasoning":[99],"generating":[101,143],"human-like":[102,222],"responses,":[103],"we":[104],"introduce":[105],"LLM-iTeach":[106,132,156,169,200],"\u2014":[107],"novel":[109],"IIL":[110,185],"framework":[111],"that":[112,138,199,212],"utilizes":[113],"an":[114,117,178],"LLM":[115,141],"as":[116,174,220],"teacher":[119],"enhance":[121],"agent":[122],"while":[124],"alleviating":[125],"dependence":[127],"resources.":[130],"Firstly,":[131],"uses":[133],"hierarchical":[135],"prompting":[136],"strategy":[137],"guides":[139],"policy":[145],"Python":[147],"code.":[148],"Then,":[149],"designed":[152],"similarity-based":[153],"mechanism,":[155],"provides":[157],"corrective":[158],"evaluative":[160],"interactively":[162],"during":[163],"agent\u2019s":[165],"training.":[166],"We":[167,228],"evaluate":[168],"against":[170],"baseline":[171],"such":[173],"Behavior":[175],"Cloning":[176],"(BC),":[177],"method,":[180],"CEILing,":[182,214],"state-of-the-art":[184],"method":[186],"using":[187],"teacher,":[190],"various":[192],"manipulation":[194],"Our":[196],"results":[197],"demonstrate":[198,230],"surpasses":[201],"BC":[202],"success":[205],"rate":[206],"or":[209],"even":[210],"outscores":[211],"highlighting":[215],"potential":[217,233],"LLMs":[219],"cost-effective,":[221],"teachers":[223],"environments.":[227],"further":[229],"method\u2019s":[232],"for":[234],"generalization":[235],"evaluating":[237],"it":[238],"additional":[240],"The":[242],"code":[243],"prompts":[245],"are":[246],"provided":[247],"at:":[248],"https://github.com/Tubicor/LLM-iTeach.":[249]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1}],"updated_date":"2026-05-05T08:41:31.759640","created_date":"2025-11-14T00:00:00"}
