{"id":"https://openalex.org/W4405785418","doi":"https://doi.org/10.1109/iros58592.2024.10801466","title":"Visual Imitation Learning of Task-Oriented Object Grasping and Rearrangement","display_name":"Visual Imitation Learning of Task-Oriented Object Grasping and Rearrangement","publication_year":2024,"publication_date":"2024-10-14","ids":{"openalex":"https://openalex.org/W4405785418","doi":"https://doi.org/10.1109/iros58592.2024.10801466"},"language":"en","primary_location":{"id":"doi:10.1109/iros58592.2024.10801466","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros58592.2024.10801466","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101889418","display_name":"Yichen Cai","orcid":"https://orcid.org/0000-0003-0950-3504"},"institutions":[{"id":"https://openalex.org/I102335020","display_name":"Karlsruhe Institute of Technology","ror":"https://ror.org/04t3en479","country_code":"DE","type":"education","lineage":["https://openalex.org/I102335020","https://openalex.org/I1305996414"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Yichen Cai","raw_affiliation_strings":["Karlsruhe Institute of Technology,Institute for Anthropomatics and Robotics,Karlsruhe,Germany"],"affiliations":[{"raw_affiliation_string":"Karlsruhe Institute of Technology,Institute for Anthropomatics and Robotics,Karlsruhe,Germany","institution_ids":["https://openalex.org/I102335020"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047233371","display_name":"Jianfeng Gao","orcid":"https://orcid.org/0000-0002-6371-505X"},"institutions":[{"id":"https://openalex.org/I102335020","display_name":"Karlsruhe Institute of Technology","ror":"https://ror.org/04t3en479","country_code":"DE","type":"education","lineage":["https://openalex.org/I102335020","https://openalex.org/I1305996414"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Jianfeng Gao","raw_affiliation_strings":["Karlsruhe Institute of Technology,Institute for Anthropomatics and Robotics,Karlsruhe,Germany"],"affiliations":[{"raw_affiliation_string":"Karlsruhe Institute of Technology,Institute for Anthropomatics and Robotics,Karlsruhe,Germany","institution_ids":["https://openalex.org/I102335020"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061699262","display_name":"Christoph Pohl","orcid":"https://orcid.org/0000-0002-4206-3312"},"institutions":[{"id":"https://openalex.org/I102335020","display_name":"Karlsruhe Institute of Technology","ror":"https://ror.org/04t3en479","country_code":"DE","type":"education","lineage":["https://openalex.org/I102335020","https://openalex.org/I1305996414"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Christoph Pohl","raw_affiliation_strings":["Karlsruhe Institute of Technology,Institute for Anthropomatics and Robotics,Karlsruhe,Germany"],"affiliations":[{"raw_affiliation_string":"Karlsruhe Institute of Technology,Institute for Anthropomatics and Robotics,Karlsruhe,Germany","institution_ids":["https://openalex.org/I102335020"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5012730104","display_name":"Tamim Asfour","orcid":"https://orcid.org/0000-0003-4879-7680"},"institutions":[{"id":"https://openalex.org/I102335020","display_name":"Karlsruhe Institute of Technology","ror":"https://ror.org/04t3en479","country_code":"DE","type":"education","lineage":["https://openalex.org/I102335020","https://openalex.org/I1305996414"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Tamim Asfour","raw_affiliation_strings":["Karlsruhe Institute of Technology,Institute for Anthropomatics and Robotics,Karlsruhe,Germany"],"affiliations":[{"raw_affiliation_string":"Karlsruhe Institute of Technology,Institute for Anthropomatics and Robotics,Karlsruhe,Germany","institution_ids":["https://openalex.org/I102335020"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5101889418"],"corresponding_institution_ids":["https://openalex.org/I102335020"],"apc_list":null,"apc_paid":null,"fwci":1.7438,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.8574076,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":97,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"364","last_page":"371"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9926000237464905,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9926000237464905,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.954200029373169,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9103000164031982,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.680736243724823},{"id":"https://openalex.org/keywords/imitation","display_name":"Imitation","score":0.6585770845413208},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6369059681892395},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.531014621257782},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.48328402638435364},{"id":"https://openalex.org/keywords/cognitive-psychology","display_name":"Cognitive psychology","score":0.46470728516578674},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.4362139105796814},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.430868923664093},{"id":"https://openalex.org/keywords/cognitive-science","display_name":"Cognitive science","score":0.4062165915966034},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.29632365703582764},{"id":"https://openalex.org/keywords/neuroscience","display_name":"Neuroscience","score":0.14912796020507812},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.09634906053543091}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.680736243724823},{"id":"https://openalex.org/C126388530","wikidata":"https://www.wikidata.org/wiki/Q1131737","display_name":"Imitation","level":2,"score":0.6585770845413208},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6369059681892395},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.531014621257782},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.48328402638435364},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.46470728516578674},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.4362139105796814},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.430868923664093},{"id":"https://openalex.org/C188147891","wikidata":"https://www.wikidata.org/wiki/Q147638","display_name":"Cognitive science","level":1,"score":0.4062165915966034},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.29632365703582764},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.14912796020507812},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.09634906053543091},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iros58592.2024.10801466","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros58592.2024.10801466","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities","score":0.4399999976158142}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":49,"referenced_works":["https://openalex.org/W2550600634","https://openalex.org/W2772168088","https://openalex.org/W2773765248","https://openalex.org/W2783693550","https://openalex.org/W2798314605","https://openalex.org/W2802065399","https://openalex.org/W2889668339","https://openalex.org/W2925241625","https://openalex.org/W2963627347","https://openalex.org/W2963677766","https://openalex.org/W2963926543","https://openalex.org/W2969694596","https://openalex.org/W2970710335","https://openalex.org/W2976611405","https://openalex.org/W2982369787","https://openalex.org/W3003783003","https://openalex.org/W3004105558","https://openalex.org/W3035872421","https://openalex.org/W3127246939","https://openalex.org/W3133699737","https://openalex.org/W3134664367","https://openalex.org/W3135359526","https://openalex.org/W3158545781","https://openalex.org/W3175388581","https://openalex.org/W3201312429","https://openalex.org/W3207187156","https://openalex.org/W3207755626","https://openalex.org/W4214684804","https://openalex.org/W4221149779","https://openalex.org/W4285102336","https://openalex.org/W4297846303","https://openalex.org/W4313003756","https://openalex.org/W4383108370","https://openalex.org/W4385062417","https://openalex.org/W4387350597","https://openalex.org/W4387790173","https://openalex.org/W4390872744","https://openalex.org/W4390874575","https://openalex.org/W4401414765","https://openalex.org/W4404612908","https://openalex.org/W6687484953","https://openalex.org/W6752823625","https://openalex.org/W6784172082","https://openalex.org/W6800004206","https://openalex.org/W6843515625","https://openalex.org/W6846496272","https://openalex.org/W6854050737","https://openalex.org/W6856840598","https://openalex.org/W6875719230"],"related_works":["https://openalex.org/W3183948672","https://openalex.org/W3173606202","https://openalex.org/W3110381201","https://openalex.org/W2778153218","https://openalex.org/W1531601525","https://openalex.org/W2732813147","https://openalex.org/W2143460112","https://openalex.org/W2042906257","https://openalex.org/W3196817267","https://openalex.org/W1976600725"],"abstract_inverted_index":{"Task-oriented":[0],"object":[1,47,59,77,88,113],"grasping":[2,114],"and":[3,29,57,97,115,138,151],"rearrangement":[4,116],"are":[5],"key":[6],"skills":[7],"for":[8,136],"robots,":[9],"which":[10],"have":[11],"to":[12,23,110],"perform":[13],"versatile":[14],"real-world":[15],"manipulation":[16,156],"tasks.":[17,157],"However,":[18],"they":[19],"remain":[20],"challenging":[21],"due":[22],"partial":[24,92],"observations":[25],"of":[26,146,155],"the":[27,40,76,133,144],"objects":[28],"shape":[30,89,94],"variations":[31],"in":[32,60,80,87,126,149],"categorical":[33],"objects.":[34,102],"In":[35],"this":[36],"paper,":[37],"we":[38,106],"present":[39],"Multi-feature":[41],"Implicit":[42],"Model":[43],"(MIMO),":[44],"a":[45,55,67,108],"novel":[46],"representation":[48],"that":[49,73,129],"encodes":[50],"multiple":[51,70,120],"spatial":[52,99],"features":[53,71],"between":[54,101],"point":[56],"an":[58,61],"implicit":[62],"neural":[63],"field.":[64],"Training":[65],"such":[66],"model":[68],"on":[69,104],"ensures":[72],"it":[74],"embeds":[75],"shapes":[78],"consistently":[79],"different":[81],"aspects,":[82],"thus":[83],"improving":[84],"its":[85],"performance":[86],"reconstruction":[90],"from":[91,117],"observation,":[93],"similarity":[95],"measure,":[96],"modeling":[98],"relations":[100],"Based":[103],"MIMO,":[105],"propose":[107],"framework":[109],"learn":[111],"task-oriented":[112],"single":[118],"or":[119],"human":[121],"demonstration":[122],"videos.":[123],"The":[124],"evaluations":[125],"simulation":[127],"show":[128],"our":[130,147],"approach":[131,148],"outperforms":[132],"state-of-the-art":[134],"methods":[135],"multi-":[137],"single-view":[139],"observations.":[140],"Real-world":[141],"experiments":[142],"demonstrate":[143],"efficacy":[145],"one-":[150],"few-shot":[152],"imitation":[153],"learning":[154]},"counts_by_year":[{"year":2025,"cited_by_count":5}],"updated_date":"2025-12-23T23:11:35.936235","created_date":"2025-10-10T00:00:00"}
