{"id":"https://openalex.org/W4406629159","doi":"https://doi.org/10.1017/s0263574724001322","title":"A multi-modal learning method for pick-and-place task based on human demonstration","display_name":"A multi-modal learning method for pick-and-place task based on human demonstration","publication_year":2024,"publication_date":"2024-10-01","ids":{"openalex":"https://openalex.org/W4406629159","doi":"https://doi.org/10.1017/s0263574724001322"},"language":"en","primary_location":{"id":"doi:10.1017/s0263574724001322","is_oa":false,"landing_page_url":"https://doi.org/10.1017/s0263574724001322","pdf_url":null,"source":{"id":"https://openalex.org/S92163612","display_name":"Robotica","issn_l":"0263-5747","issn":["0263-5747","1469-8668"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311721","host_organization_name":"Cambridge University Press","host_organization_lineage":["https://openalex.org/P4310311721","https://openalex.org/P4310311702"],"host_organization_lineage_names":["Cambridge University Press","University of Cambridge"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Robotica","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5107886677","display_name":"David Yu","orcid":"https://orcid.org/0009-0003-6198-5130"},"institutions":[{"id":"https://openalex.org/I55712492","display_name":"Zhejiang University of Technology","ror":"https://ror.org/02djqfd08","country_code":"CN","type":"education","lineage":["https://openalex.org/I55712492"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Diqing Yu","raw_affiliation_strings":["Zhejiang University of Technology, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Zhejiang University of Technology, Hangzhou, China","institution_ids":["https://openalex.org/I55712492"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056303212","display_name":"Xinggang Fan","orcid":"https://orcid.org/0000-0001-5325-1231"},"institutions":[{"id":"https://openalex.org/I55712492","display_name":"Zhejiang University of Technology","ror":"https://ror.org/02djqfd08","country_code":"CN","type":"education","lineage":["https://openalex.org/I55712492"]},{"id":"https://openalex.org/I4210104064","display_name":"Shenzhen Academy of Robotics","ror":"https://ror.org/01h027j09","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210104064"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xinggang Fan","raw_affiliation_strings":["Shenzhen Academy of Robotics, Shenzhen, China","Zhejiang University of Technology, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Shenzhen Academy of Robotics, Shenzhen, China","institution_ids":["https://openalex.org/I4210104064"]},{"raw_affiliation_string":"Zhejiang University of Technology, Hangzhou, China","institution_ids":["https://openalex.org/I55712492"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036718385","display_name":"Yaonan Li","orcid":null},"institutions":[{"id":"https://openalex.org/I4210104064","display_name":"Shenzhen Academy of Robotics","ror":"https://ror.org/01h027j09","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210104064"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yaonan Li","raw_affiliation_strings":["Shenzhen Academy of Robotics, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Shenzhen Academy of Robotics, Shenzhen, China","institution_ids":["https://openalex.org/I4210104064"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101688278","display_name":"Heping Chen","orcid":"https://orcid.org/0000-0002-1045-8977"},"institutions":[{"id":"https://openalex.org/I4210104064","display_name":"Shenzhen Academy of Robotics","ror":"https://ror.org/01h027j09","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210104064"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Heping Chen","raw_affiliation_strings":["Shenzhen Academy of Robotics, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Shenzhen Academy of Robotics, Shenzhen, China","institution_ids":["https://openalex.org/I4210104064"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113212378","display_name":"Han Li","orcid":"https://orcid.org/0009-0008-6668-0906"},"institutions":[{"id":"https://openalex.org/I55712492","display_name":"Zhejiang University of Technology","ror":"https://ror.org/02djqfd08","country_code":"CN","type":"education","lineage":["https://openalex.org/I55712492"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Han Li","raw_affiliation_strings":["Zhejiang University of Technology, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Zhejiang University of Technology, Hangzhou, China","institution_ids":["https://openalex.org/I55712492"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5109712901","display_name":"Yongrui Jin","orcid":null},"institutions":[{"id":"https://openalex.org/I4210104064","display_name":"Shenzhen Academy of Robotics","ror":"https://ror.org/01h027j09","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210104064"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuao Jin","raw_affiliation_strings":["Shenzhen Academy of Robotics, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Shenzhen Academy of Robotics, Shenzhen, China","institution_ids":["https://openalex.org/I4210104064"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5036718385"],"corresponding_institution_ids":["https://openalex.org/I4210104064"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.26696977,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"42","issue":"10","first_page":"3302","last_page":"3323"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11398","display_name":"Hand Gesture Recognition Systems","score":0.9726999998092651,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11398","display_name":"Hand Gesture Recognition Systems","score":0.9726999998092651,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11707","display_name":"Gaze Tracking and Assistive Technology","score":0.9430999755859375,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/modal","display_name":"Modal","score":0.7087740898132324},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6790252923965454},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6711519956588745},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.543212354183197},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.5163522958755493},{"id":"https://openalex.org/keywords/smt-placement-equipment","display_name":"SMT placement equipment","score":0.4775843918323517},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3313307762145996},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.23444345593452454},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.17978596687316895},{"id":"https://openalex.org/keywords/systems-engineering","display_name":"Systems engineering","score":0.16682583093643188}],"concepts":[{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.7087740898132324},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6790252923965454},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6711519956588745},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.543212354183197},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.5163522958755493},{"id":"https://openalex.org/C17511633","wikidata":"https://www.wikidata.org/wiki/Q830694","display_name":"SMT placement equipment","level":3,"score":0.4775843918323517},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3313307762145996},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.23444345593452454},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.17978596687316895},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.16682583093643188},{"id":"https://openalex.org/C188027245","wikidata":"https://www.wikidata.org/wiki/Q750446","display_name":"Polymer chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1017/s0263574724001322","is_oa":false,"landing_page_url":"https://doi.org/10.1017/s0263574724001322","pdf_url":null,"source":{"id":"https://openalex.org/S92163612","display_name":"Robotica","issn_l":"0263-5747","issn":["0263-5747","1469-8668"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311721","host_organization_name":"Cambridge University Press","host_organization_lineage":["https://openalex.org/P4310311721","https://openalex.org/P4310311702"],"host_organization_lineage_names":["Cambridge University Press","University of Cambridge"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Robotica","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W3119180176","https://openalex.org/W2786561194","https://openalex.org/W2379392295","https://openalex.org/W3160965418","https://openalex.org/W3196817267","https://openalex.org/W1976600725","https://openalex.org/W2052750075","https://openalex.org/W3045301645","https://openalex.org/W2039843023","https://openalex.org/W1595374691"],"abstract_inverted_index":{"Abstract":[0],"Robot":[1],"pick-and-place":[2,25,76,98],"for":[3,20],"unknown":[4],"objects":[5],"is":[6,107],"still":[7],"a":[8,16],"very":[9],"challenging":[10],"research":[11],"topic.":[12],"This":[13,27],"paper":[14],"proposes":[15],"multi-modal":[17,84],"learning":[18],"method":[19,28,49,53,82],"robot":[21,93],"one-shot":[22,47],"imitation":[23,48],"of":[24,34,41,75,91,116],"tasks.":[26],"aims":[29],"to":[30,70,109],"enhance":[31],"the":[32,39,46,81,89,92,96,111],"generality":[33],"industrial":[35,101,128],"robots":[36],"while":[37],"reducing":[38],"amount":[40],"data":[42],"and":[43,62,86,94,120,127,133,142,149,155],"training":[44],"costs":[45],"relies":[50],"on.":[51],"The":[52,113],"first":[54],"categorizes":[55],"human":[56,117],"demonstration":[57,118],"videos":[58,119],"into":[59,67],"different":[60],"tasks,":[61,129],"these":[63],"tasks":[64,77],"are":[65],"classified":[66],"six":[68],"types":[69,74],"symbolize":[71],"as":[72,78],"many":[73],"possible.":[79],"Second,":[80],"generates":[83],"prompts":[85],"finally":[87],"predicts":[88],"action":[90],"completes":[95],"symbolic":[97],"task":[99],"in":[100,146],"production.":[102],"A":[103],"carefully":[104],"curated":[105],"dataset":[106,114],"created":[108],"complement":[110],"method.":[112],"consists":[115],"instance":[121],"images":[122],"focused":[123],"on":[124],"real-world":[125,150],"scenes":[126],"which":[130],"fosters":[131],"adaptable":[132],"efficient":[134],"learning.":[135],"Experimental":[136],"results":[137,144],"demonstrate":[138],"favorable":[139],"success":[140],"rates":[141],"loss":[143],"both":[145],"simulation":[147],"environments":[148],"experiments,":[151],"confirming":[152],"its":[153],"effectiveness":[154],"practicality.":[156]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
