{"id":"https://openalex.org/W4417189940","doi":"https://doi.org/10.1145/3761668.3761711","title":"LLM and VLM-Assisted Human-Robot Collaboration Framework for Smart Assembly Cells","display_name":"LLM and VLM-Assisted Human-Robot Collaboration Framework for Smart Assembly Cells","publication_year":2025,"publication_date":"2025-06-13","ids":{"openalex":"https://openalex.org/W4417189940","doi":"https://doi.org/10.1145/3761668.3761711"},"language":null,"primary_location":{"id":"doi:10.1145/3761668.3761711","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3761668.3761711","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 17th International Conference on Computer Modeling and Simulation","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3761668.3761711","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5120740188","display_name":"Wenbin Liang","orcid":"https://orcid.org/0009-0009-0432-2297"},"institutions":[{"id":"https://openalex.org/I159948400","display_name":"Jinan University","ror":"https://ror.org/02xe5ns62","country_code":"CN","type":"education","lineage":["https://openalex.org/I159948400"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Wenbin Liang","raw_affiliation_strings":["School of Intelligent Systems Science and Engineering, Jinan University, Zhuhai, China"],"affiliations":[{"raw_affiliation_string":"School of Intelligent Systems Science and Engineering, Jinan University, Zhuhai, China","institution_ids":["https://openalex.org/I159948400"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108312456","display_name":"Yufei Shen","orcid":"https://orcid.org/0009-0005-8554-4158"},"institutions":[{"id":"https://openalex.org/I159948400","display_name":"Jinan University","ror":"https://ror.org/02xe5ns62","country_code":"CN","type":"education","lineage":["https://openalex.org/I159948400"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yufei Shen","raw_affiliation_strings":["School of Intelligent Systems Science and Engineering, Jinan University, Zhuhai, China"],"affiliations":[{"raw_affiliation_string":"School of Intelligent Systems Science and Engineering, Jinan University, Zhuhai, China","institution_ids":["https://openalex.org/I159948400"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036472198","display_name":"Li Yin","orcid":"https://orcid.org/0009-0001-9319-403X"},"institutions":[{"id":"https://openalex.org/I159948400","display_name":"Jinan University","ror":"https://ror.org/02xe5ns62","country_code":"CN","type":"education","lineage":["https://openalex.org/I159948400"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Li Yin","raw_affiliation_strings":["School of Intelligent Systems Science and Engineering, Jinan University, Zhuhai, China"],"affiliations":[{"raw_affiliation_string":"School of Intelligent Systems Science and Engineering, Jinan University, Zhuhai, China","institution_ids":["https://openalex.org/I159948400"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111904560","display_name":"Shu-Chun Yang","orcid":"https://orcid.org/0009-0004-6496-7795"},"institutions":[{"id":"https://openalex.org/I159948400","display_name":"Jinan University","ror":"https://ror.org/02xe5ns62","country_code":"CN","type":"education","lineage":["https://openalex.org/I159948400"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shanglang Yang","raw_affiliation_strings":["School of Intelligent Systems Science and Engineering, Jinan University, Zhuhai, China"],"affiliations":[{"raw_affiliation_string":"School of Intelligent Systems Science and Engineering, Jinan University, Zhuhai, China","institution_ids":["https://openalex.org/I159948400"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100732083","display_name":"Mingxing Li","orcid":"https://orcid.org/0000-0003-3202-0877"},"institutions":[{"id":"https://openalex.org/I159948400","display_name":"Jinan University","ror":"https://ror.org/02xe5ns62","country_code":"CN","type":"education","lineage":["https://openalex.org/I159948400"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mingxing Li","raw_affiliation_strings":["School of Intelligent Systems Science and Engineering, Jinan University, Zhuhai, China"],"affiliations":[{"raw_affiliation_string":"School of Intelligent Systems Science and Engineering, Jinan University, Zhuhai, China","institution_ids":["https://openalex.org/I159948400"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5021504878","display_name":"Ting Qu","orcid":"https://orcid.org/0000-0003-1012-2856"},"institutions":[{"id":"https://openalex.org/I159948400","display_name":"Jinan University","ror":"https://ror.org/02xe5ns62","country_code":"CN","type":"education","lineage":["https://openalex.org/I159948400"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ting Qu","raw_affiliation_strings":["School of Intelligent Systems Science and Engineering, Jinan University, Zhuhai, China"],"affiliations":[{"raw_affiliation_string":"School of Intelligent Systems Science and Engineering, Jinan University, Zhuhai, China","institution_ids":["https://openalex.org/I159948400"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5120740188"],"corresponding_institution_ids":["https://openalex.org/I159948400"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.48827655,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"278","last_page":"286"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.2150000035762787,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.2150000035762787,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.20800000429153442,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10763","display_name":"Digital Transformation in Industry","score":0.11089999973773956,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/adaptability","display_name":"Adaptability","score":0.7225000262260437},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.5835000276565552},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.5663999915122986},{"id":"https://openalex.org/keywords/trajectory","display_name":"Trajectory","score":0.5303999781608582},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.4763000011444092},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.4675000011920929},{"id":"https://openalex.org/keywords/interface","display_name":"Interface (matter)","score":0.42879998683929443},{"id":"https://openalex.org/keywords/motion-planning","display_name":"Motion planning","score":0.40950000286102295}],"concepts":[{"id":"https://openalex.org/C177606310","wikidata":"https://www.wikidata.org/wiki/Q5674297","display_name":"Adaptability","level":2,"score":0.7225000262260437},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5875999927520752},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.5835000276565552},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.5663999915122986},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.5303999781608582},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.4763000011444092},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.4675000011920929},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.4440000057220459},{"id":"https://openalex.org/C113843644","wikidata":"https://www.wikidata.org/wiki/Q901882","display_name":"Interface (matter)","level":4,"score":0.42879998683929443},{"id":"https://openalex.org/C81074085","wikidata":"https://www.wikidata.org/wiki/Q366872","display_name":"Motion planning","level":3,"score":0.40950000286102295},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.39969998598098755},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.38670000433921814},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.3781000077724457},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.36410000920295715},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.3637000024318695},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.33160001039505005},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.3303999900817871},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.30250000953674316},{"id":"https://openalex.org/C2776608160","wikidata":"https://www.wikidata.org/wiki/Q4785462","display_name":"Natural (archaeology)","level":2,"score":0.2946999967098236},{"id":"https://openalex.org/C2779439875","wikidata":"https://www.wikidata.org/wiki/Q1078276","display_name":"Natural language understanding","level":3,"score":0.29409998655319214},{"id":"https://openalex.org/C502989409","wikidata":"https://www.wikidata.org/wiki/Q11425","display_name":"Animation","level":2,"score":0.287200003862381},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.26409998536109924},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.2614000141620636},{"id":"https://openalex.org/C89505385","wikidata":"https://www.wikidata.org/wiki/Q47146","display_name":"User interface","level":2,"score":0.25440001487731934},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.2540999948978424}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3761668.3761711","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3761668.3761711","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 17th International Conference on Computer Modeling and Simulation","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3761668.3761711","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3761668.3761711","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 17th International Conference on Computer Modeling and Simulation","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":9,"referenced_works":["https://openalex.org/W2043536379","https://openalex.org/W2418222507","https://openalex.org/W2555671188","https://openalex.org/W2885146195","https://openalex.org/W2933531560","https://openalex.org/W2955189310","https://openalex.org/W3131771889","https://openalex.org/W3200915045","https://openalex.org/W4379054524"],"related_works":[],"abstract_inverted_index":{"While":[0],"Industry":[1],"4.0":[2],"drives":[3],"demand":[4],"for":[5,94],"adaptive":[6],"human-robot":[7,44],"collaboration,":[8],"challenges":[9],"persist":[10],"in":[11],"robotic":[12],"intelligence,":[13],"computational":[14],"efficiency,":[15],"and":[16,27,66,76,91],"unstructured-environment":[17],"adaptability.":[18],"This":[19,80],"study":[20],"proposes":[21],"integrating":[22],"Large":[23],"Language":[24],"Models":[25,29],"(LLMs)":[26],"Vision-Language":[28],"(VLMs)":[30],"to":[31,51,88],"enhance":[32],"collaborative":[33],"assembly":[34],"systems.":[35],"LLMs":[36],"translate":[37],"natural":[38],"language":[39],"into":[40],"machine-executable":[41],"commands,":[42],"simplifying":[43],"interaction.":[45],"VLMs":[46],"process":[47],"camera-captured":[48],"color/depth":[49],"data":[50],"construct":[52],"perceptual":[53],"spaces,":[54],"improving":[55],"environmental":[56],"awareness":[57],"with":[58],"minimal":[59],"training":[60],"data.":[61],"By":[62],"combining":[63],"LLM-generated":[64],"instructions":[65],"VLM-derived":[67],"spatial":[68],"insights,":[69],"the":[70],"system":[71],"enables":[72],"autonomous":[73],"trajectory":[74],"planning":[75],"optimized":[77],"motion":[78],"control.":[79],"dual-model":[81],"framework":[82],"reduces":[83],"operational":[84],"complexity,":[85],"enhances":[86],"adaptability":[87],"unstructured":[89],"scenarios,":[90],"improves":[92],"generalization":[93],"modern":[95],"manufacturing's":[96],"evolving":[97],"demands.":[98]},"counts_by_year":[],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-12-10T00:00:00"}
