{"id":"https://openalex.org/W7127149834","doi":"https://doi.org/10.1109/tase.2026.3660080","title":"Cooperative Control Framework for Dual-Arm Robot Enhanced by Vision Language Model and Reinforcement Learning","display_name":"Cooperative Control Framework for Dual-Arm Robot Enhanced by Vision Language Model and Reinforcement Learning","publication_year":2026,"publication_date":"2026-01-01","ids":{"openalex":"https://openalex.org/W7127149834","doi":"https://doi.org/10.1109/tase.2026.3660080"},"language":null,"primary_location":{"id":"doi:10.1109/tase.2026.3660080","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tase.2026.3660080","pdf_url":null,"source":{"id":"https://openalex.org/S34881539","display_name":"IEEE Transactions on Automation Science and Engineering","issn_l":"1545-5955","issn":["1545-5955","1558-3783"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Automation Science and Engineering","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5064090676","display_name":"Chen Guangrong","orcid":"https://orcid.org/0000-0003-1903-8597"},"institutions":[{"id":"https://openalex.org/I21193070","display_name":"Beijing Jiaotong University","ror":"https://ror.org/01yj56c84","country_code":"CN","type":"education","lineage":["https://openalex.org/I21193070"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Guangrong Chen","raw_affiliation_strings":["Robotics Research Center, Beijing Jiaotong University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Robotics Research Center, Beijing Jiaotong University, Beijing, China","institution_ids":["https://openalex.org/I21193070"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124810203","display_name":"Qizhe Yang","orcid":null},"institutions":[{"id":"https://openalex.org/I21193070","display_name":"Beijing Jiaotong University","ror":"https://ror.org/01yj56c84","country_code":"CN","type":"education","lineage":["https://openalex.org/I21193070"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qizhe Yang","raw_affiliation_strings":["Robotics Research Center, Beijing Jiaotong University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Robotics Research Center, Beijing Jiaotong University, Beijing, China","institution_ids":["https://openalex.org/I21193070"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124842451","display_name":"Jiehao Li","orcid":null},"institutions":[{"id":"https://openalex.org/I101479585","display_name":"South China Agricultural University","ror":"https://ror.org/05v9jqt67","country_code":"CN","type":"education","lineage":["https://openalex.org/I101479585"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiehao Li","raw_affiliation_strings":["National Key Laboratory of Agricultural Equipment Technology, South China Agricultural University, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"National Key Laboratory of Agricultural Equipment Technology, South China Agricultural University, Guangzhou, China","institution_ids":["https://openalex.org/I101479585"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124751010","display_name":"C. L. Philip Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I90610280","display_name":"South China University of Technology","ror":"https://ror.org/0530pts50","country_code":"CN","type":"education","lineage":["https://openalex.org/I90610280"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"C. L. Philip Chen","raw_affiliation_strings":["School of Computer Science and Engineering, South China University of Technology, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, South China University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I90610280"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5124760997","display_name":"Chenguang Yang","orcid":null},"institutions":[{"id":"https://openalex.org/I146655781","display_name":"University of Liverpool","ror":"https://ror.org/04xs57h96","country_code":"GB","type":"education","lineage":["https://openalex.org/I146655781"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Chenguang Yang","raw_affiliation_strings":["School of Computer Science and Informatics, University of Liverpool, Liverpool, U.K"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Informatics, University of Liverpool, Liverpool, U.K","institution_ids":["https://openalex.org/I146655781"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5064090676"],"corresponding_institution_ids":["https://openalex.org/I21193070"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.54161082,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"23","issue":null,"first_page":"4314","last_page":"4328"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.95660001039505,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.95660001039505,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.006200000178068876,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10709","display_name":"Social Robot Interaction and HRI","score":0.006200000178068876,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7688999772071838},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6420000195503235},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.6194000244140625},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.5641000270843506},{"id":"https://openalex.org/keywords/adaptability","display_name":"Adaptability","score":0.5335000157356262},{"id":"https://openalex.org/keywords/grasp","display_name":"GRASP","score":0.5317000150680542},{"id":"https://openalex.org/keywords/task-analysis","display_name":"Task analysis","score":0.4675999879837036},{"id":"https://openalex.org/keywords/trajectory","display_name":"Trajectory","score":0.4641999900341034},{"id":"https://openalex.org/keywords/visual-servoing","display_name":"Visual servoing","score":0.43549999594688416},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.4023999869823456}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7688999772071838},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6495000123977661},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6420000195503235},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.6194000244140625},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.5641000270843506},{"id":"https://openalex.org/C177606310","wikidata":"https://www.wikidata.org/wiki/Q5674297","display_name":"Adaptability","level":2,"score":0.5335000157356262},{"id":"https://openalex.org/C171268870","wikidata":"https://www.wikidata.org/wiki/Q1486676","display_name":"GRASP","level":2,"score":0.5317000150680542},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5218999981880188},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.4675999879837036},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.4641999900341034},{"id":"https://openalex.org/C10912380","wikidata":"https://www.wikidata.org/wiki/Q527952","display_name":"Visual servoing","level":3,"score":0.43549999594688416},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.4023999869823456},{"id":"https://openalex.org/C65401140","wikidata":"https://www.wikidata.org/wiki/Q7353385","display_name":"Robot control","level":4,"score":0.391400009393692},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.3831999897956848},{"id":"https://openalex.org/C107464732","wikidata":"https://www.wikidata.org/wiki/Q235781","display_name":"Adaptive control","level":3,"score":0.37049999833106995},{"id":"https://openalex.org/C2777984285","wikidata":"https://www.wikidata.org/wiki/Q17098134","display_name":"Impedance control","level":3,"score":0.362199991941452},{"id":"https://openalex.org/C2775960376","wikidata":"https://www.wikidata.org/wiki/Q1435859","display_name":"Grippers","level":2,"score":0.34279999136924744},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.3346000015735626},{"id":"https://openalex.org/C188888258","wikidata":"https://www.wikidata.org/wiki/Q7353390","display_name":"Robot learning","level":4,"score":0.33149999380111694},{"id":"https://openalex.org/C74222875","wikidata":"https://www.wikidata.org/wiki/Q16000312","display_name":"Robot kinematics","level":4,"score":0.32190001010894775},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.32010000944137573},{"id":"https://openalex.org/C19768560","wikidata":"https://www.wikidata.org/wiki/Q320727","display_name":"Dependency (UML)","level":2,"score":0.3172000050544739},{"id":"https://openalex.org/C2776126113","wikidata":"https://www.wikidata.org/wiki/Q1128980","display_name":"Industrial robot","level":3,"score":0.31049999594688416},{"id":"https://openalex.org/C17500928","wikidata":"https://www.wikidata.org/wiki/Q959968","display_name":"Control system","level":2,"score":0.290800005197525},{"id":"https://openalex.org/C203479927","wikidata":"https://www.wikidata.org/wiki/Q5165939","display_name":"Controller (irrigation)","level":2,"score":0.28540000319480896},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.2777000069618225},{"id":"https://openalex.org/C6683253","wikidata":"https://www.wikidata.org/wiki/Q7075535","display_name":"Obstacle avoidance","level":4,"score":0.27570000290870667},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.27320000529289246},{"id":"https://openalex.org/C2779439875","wikidata":"https://www.wikidata.org/wiki/Q1078276","display_name":"Natural language understanding","level":3,"score":0.2727999985218048},{"id":"https://openalex.org/C81074085","wikidata":"https://www.wikidata.org/wiki/Q366872","display_name":"Motion planning","level":3,"score":0.257099986076355},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.2524000108242035},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.25110000371932983},{"id":"https://openalex.org/C145460709","wikidata":"https://www.wikidata.org/wiki/Q859951","display_name":"Human\u2013robot interaction","level":3,"score":0.250900000333786},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.25040000677108765}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tase.2026.3660080","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tase.2026.3660080","pdf_url":null,"source":{"id":"https://openalex.org/S34881539","display_name":"IEEE Transactions on Automation Science and Engineering","issn_l":"1545-5955","issn":["1545-5955","1558-3783"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Automation Science and Engineering","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":27,"referenced_works":["https://openalex.org/W2119717200","https://openalex.org/W2910474428","https://openalex.org/W3004014436","https://openalex.org/W3081176596","https://openalex.org/W4220668453","https://openalex.org/W4289690297","https://openalex.org/W4305057154","https://openalex.org/W4318580237","https://openalex.org/W4366386348","https://openalex.org/W4367663367","https://openalex.org/W4384300270","https://openalex.org/W4386001306","https://openalex.org/W4390968395","https://openalex.org/W4392853795","https://openalex.org/W4401109918","https://openalex.org/W4405787412","https://openalex.org/W4406613045","https://openalex.org/W4406692054","https://openalex.org/W4407025919","https://openalex.org/W4407432879","https://openalex.org/W4407956841","https://openalex.org/W4412735855","https://openalex.org/W4413104923","https://openalex.org/W4413144615","https://openalex.org/W4413362511","https://openalex.org/W4413817082","https://openalex.org/W4413822376"],"related_works":[],"abstract_inverted_index":{"This":[0],"paper":[1],"presents":[2],"a":[3,33,184],"cooperative":[4,139],"control":[5,77],"framework":[6,31,175],"for":[7,187],"dual-arm":[8,134],"robots":[9],"that":[10,172],"integrates":[11],"vision-language":[12],"models":[13],"(VLMs)":[14],"with":[15,163,180],"online":[16,58,164],"reinforcement":[17],"learning":[18,166],"(RL)":[19],"to":[20,49,96,103,116,161],"enhance":[21],"autonomy":[22],"and":[23,46,64,71,82,87,109,123,148,167,195],"adaptability":[24],"in":[25,154,190],"complex":[26],"manipulation":[27,62],"tasks.":[28],"The":[29,133],"proposed":[30,131,174],"adopts":[32],"hierarchical":[34],"architecture:":[35],"at":[36,53,72],"the":[37,40,54,73,91,98,105,127,130,155,173],"top":[38],"level,":[39,56,75],"VLM":[41],"interprets":[42],"natural":[43],"language":[44],"instructions":[45],"visual":[47],"image":[48],"generate":[50],"task":[51,119,156],"plans;":[52],"middle":[55],"an":[57,152],"RL":[59],"module":[60],"refines":[61],"policies":[63],"ensures":[65],"adaptive":[66,165],"decision-making":[67],"under":[68],"environmental":[69],"uncertainty;":[70],"bottom":[74],"compliant":[76],"based":[78],"on":[79],"trajectory":[80],"planning":[81],"impedance":[83],"regulation":[84],"enables":[85],"safe":[86],"robust":[88],"execution.":[89],"In":[90],"feedback,":[92],"YOLOv5":[93],"is":[94,101,114,120],"used":[95,102,115],"detect":[97],"object,":[99],"GraspNet":[100],"obtain":[104],"optimal":[106],"grasp":[107],"pose,":[108],"CLIP":[110],"(Contrastive":[111],"Language-Image":[112],"Pre-Training)":[113],"judge":[117],"whether":[118],"completed.":[121],"Simulations":[122],"real-world":[124],"experiments":[125],"validate":[126],"effectiveness":[128],"of":[129],"method.":[132],"robot":[135],"successfully":[136],"performed":[137],"various":[138],"tasks":[140],"such":[141],"as":[142],"grasping,":[143],"bottle-cap":[144],"unscrewing,":[145],"water":[146],"pouring,":[147],"box":[149],"carrying,":[150],"achieving":[151],"increase":[153],"success":[157],"rate":[158],"from":[159],"43%":[160],"100%":[162],"training.":[168],"These":[169],"results":[170],"demonstrate":[171],"effectively":[176],"bridges":[177],"high-level":[178],"reasoning":[179],"low-level":[181],"control,":[182],"providing":[183],"scalable":[185],"solution":[186],"future":[188],"applications":[189],"service":[191],"robotics,":[192],"industrial":[193],"automation,":[194],"human-robot":[196],"collaboration.":[197]},"counts_by_year":[],"updated_date":"2026-02-13T13:36:01.753593","created_date":"2026-02-03T00:00:00"}
