{"id":"https://openalex.org/W4413945178","doi":"https://doi.org/10.1109/icra55743.2025.11128658","title":"SYNERGAI: Perception Alignment for Human-Robot Collaboration","display_name":"SYNERGAI: Perception Alignment for Human-Robot Collaboration","publication_year":2025,"publication_date":"2025-05-19","ids":{"openalex":"https://openalex.org/W4413945178","doi":"https://doi.org/10.1109/icra55743.2025.11128658"},"language":"en","primary_location":{"id":"doi:10.1109/icra55743.2025.11128658","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra55743.2025.11128658","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100393448","display_name":"Yixin Chen","orcid":"https://orcid.org/0000-0002-8176-0241"},"institutions":[{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]},{"id":"https://openalex.org/I4392738278","display_name":"Beijing Institute for General Artificial Intelligence","ror":"https://ror.org/02kw1ws04","country_code":null,"type":"facility","lineage":["https://openalex.org/I4392738278"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yixin Chen","raw_affiliation_strings":["Beijing Institute for General Artificial Intelligence (BIGAI),State Key Laboratory of General Artificial Intelligence"],"affiliations":[{"raw_affiliation_string":"Beijing Institute for General Artificial Intelligence (BIGAI),State Key Laboratory of General Artificial Intelligence","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I4392738278"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072114355","display_name":"Icy Zhang","orcid":"https://orcid.org/0000-0003-3423-6794"},"institutions":[{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]},{"id":"https://openalex.org/I4392738278","display_name":"Beijing Institute for General Artificial Intelligence","ror":"https://ror.org/02kw1ws04","country_code":null,"type":"facility","lineage":["https://openalex.org/I4392738278"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"I Guoxi Zhang","raw_affiliation_strings":["Beijing Institute for General Artificial Intelligence (BIGAI),State Key Laboratory of General Artificial Intelligence"],"affiliations":[{"raw_affiliation_string":"Beijing Institute for General Artificial Intelligence (BIGAI),State Key Laboratory of General Artificial Intelligence","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I4392738278"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057634765","display_name":"Yaowei Zhang","orcid":"https://orcid.org/0000-0001-7756-6756"},"institutions":[{"id":"https://openalex.org/I4392738278","display_name":"Beijing Institute for General Artificial Intelligence","ror":"https://ror.org/02kw1ws04","country_code":null,"type":"facility","lineage":["https://openalex.org/I4392738278"]},{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yaowei Zhang","raw_affiliation_strings":["Beijing Institute for General Artificial Intelligence (BIGAI),State Key Laboratory of General Artificial Intelligence"],"affiliations":[{"raw_affiliation_string":"Beijing Institute for General Artificial Intelligence (BIGAI),State Key Laboratory of General Artificial Intelligence","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I4392738278"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101554514","display_name":"Hongming Xu","orcid":"https://orcid.org/0009-0009-6255-263X"},"institutions":[{"id":"https://openalex.org/I4392738278","display_name":"Beijing Institute for General Artificial Intelligence","ror":"https://ror.org/02kw1ws04","country_code":null,"type":"facility","lineage":["https://openalex.org/I4392738278"]},{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hongming Xu","raw_affiliation_strings":["Beijing Institute for General Artificial Intelligence (BIGAI),State Key Laboratory of General Artificial Intelligence"],"affiliations":[{"raw_affiliation_string":"Beijing Institute for General Artificial Intelligence (BIGAI),State Key Laboratory of General Artificial Intelligence","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I4392738278"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087547525","display_name":"Peiyuan Zhi","orcid":null},"institutions":[{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]},{"id":"https://openalex.org/I4392738278","display_name":"Beijing Institute for General Artificial Intelligence","ror":"https://ror.org/02kw1ws04","country_code":null,"type":"facility","lineage":["https://openalex.org/I4392738278"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Peiyuan Zhi","raw_affiliation_strings":["Beijing Institute for General Artificial Intelligence (BIGAI),State Key Laboratory of General Artificial Intelligence"],"affiliations":[{"raw_affiliation_string":"Beijing Institute for General Artificial Intelligence (BIGAI),State Key Laboratory of General Artificial Intelligence","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I4392738278"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076353062","display_name":"Qing Li","orcid":"https://orcid.org/0009-0008-8404-3695"},"institutions":[{"id":"https://openalex.org/I4392738278","display_name":"Beijing Institute for General Artificial Intelligence","ror":"https://ror.org/02kw1ws04","country_code":null,"type":"facility","lineage":["https://openalex.org/I4392738278"]},{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qing Li","raw_affiliation_strings":["Beijing Institute for General Artificial Intelligence (BIGAI),State Key Laboratory of General Artificial Intelligence"],"affiliations":[{"raw_affiliation_string":"Beijing Institute for General Artificial Intelligence (BIGAI),State Key Laboratory of General Artificial Intelligence","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I4392738278"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5067080265","display_name":"Siyuan Huang","orcid":"https://orcid.org/0000-0003-1524-7148"},"institutions":[{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]},{"id":"https://openalex.org/I4392738278","display_name":"Beijing Institute for General Artificial Intelligence","ror":"https://ror.org/02kw1ws04","country_code":null,"type":"facility","lineage":["https://openalex.org/I4392738278"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Siyuan Huang","raw_affiliation_strings":["Beijing Institute for General Artificial Intelligence (BIGAI),State Key Laboratory of General Artificial Intelligence"],"affiliations":[{"raw_affiliation_string":"Beijing Institute for General Artificial Intelligence (BIGAI),State Key Laboratory of General Artificial Intelligence","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I4392738278"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5100393448"],"corresponding_institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I4392738278"],"apc_list":null,"apc_paid":null,"fwci":1.2604,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.83867813,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"3095","last_page":"3102"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9555000066757202,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9555000066757202,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13382","display_name":"Robotics and Automated Systems","score":0.9096999764442444,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/human\u2013robot-interaction","display_name":"Human\u2013robot interaction","score":0.6818378567695618},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6611291170120239},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.6039596796035767},{"id":"https://openalex.org/keywords/perception","display_name":"Perception","score":0.6006109714508057},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.49997782707214355},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4187481999397278},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.36569246649742126},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.13655990362167358}],"concepts":[{"id":"https://openalex.org/C145460709","wikidata":"https://www.wikidata.org/wiki/Q859951","display_name":"Human\u2013robot interaction","level":3,"score":0.6818378567695618},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6611291170120239},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.6039596796035767},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.6006109714508057},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.49997782707214355},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4187481999397278},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.36569246649742126},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.13655990362167358},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icra55743.2025.11128658","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra55743.2025.11128658","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320322392","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":31,"referenced_works":["https://openalex.org/W2012201897","https://openalex.org/W2175286647","https://openalex.org/W2293700449","https://openalex.org/W2594519801","https://openalex.org/W2970340522","https://openalex.org/W2990129662","https://openalex.org/W3010276570","https://openalex.org/W3035154952","https://openalex.org/W3095974555","https://openalex.org/W3107521863","https://openalex.org/W3172675210","https://openalex.org/W3182910454","https://openalex.org/W3192660112","https://openalex.org/W3197501724","https://openalex.org/W3203663566","https://openalex.org/W3207711849","https://openalex.org/W4206504561","https://openalex.org/W4221167937","https://openalex.org/W4225675121","https://openalex.org/W4226236972","https://openalex.org/W4226376247","https://openalex.org/W4233857083","https://openalex.org/W4283332944","https://openalex.org/W4383097638","https://openalex.org/W4386251907","https://openalex.org/W4390872495","https://openalex.org/W4390874280","https://openalex.org/W4401414715","https://openalex.org/W4401991200","https://openalex.org/W4402961736","https://openalex.org/W4403600470"],"related_works":["https://openalex.org/W4392646554","https://openalex.org/W2978665606","https://openalex.org/W3205513966","https://openalex.org/W3120459843","https://openalex.org/W4366547574","https://openalex.org/W189465620","https://openalex.org/W4366818884","https://openalex.org/W2248308732","https://openalex.org/W4392651289","https://openalex.org/W3042490037"],"abstract_inverted_index":{"Recently,":[0],"large":[1],"language":[2],"models":[3,130],"(LLMs)":[4],"have":[5],"shown":[6],"strong":[7],"potential":[8],"in":[9,87,131,133,148,161],"facilitating":[10],"human-robotic":[11],"interaction":[12],"and":[13,25,33,53,68,83],"collaboration.":[14,55],"However,":[15],"existing":[16],"LLM-based":[17],"systems":[18],"often":[19],"overlook":[20],"the":[21,73,95,128,168,181],"misalignment":[22,112],"between":[23],"human":[24],"robot":[26,35],"perceptions,":[27],"which":[28],"hinders":[29],"their":[30],"effective":[31],"communication":[32],"real-world":[34,142],"deployment.":[36],"To":[37],"address":[38],"this":[39],"issue,":[40],"we":[41],"introduce":[42],"SYNERGAI,":[43],"a":[44,134,155],"unified":[45],"system":[46,74],"designed":[47],"to":[48,75,78,90,173],"achieve":[49],"both":[50],"perceptual":[51,111],"alignment":[52,162],"human-robot":[54],"At":[56],"its":[57,66,98,118,146],"core,":[58],"SYNERGAI":[59,104,123,144],"employs":[60],"3D":[61],"Scene":[62],"Graph":[63],"(3DSG)":[64],"as":[65],"explicit":[67],"innate":[69],"representation.":[70],"This":[71],"enables":[72,110],"leverage":[76],"LLM":[77],"break":[79],"down":[80],"complex":[81],"tasks":[82,178],"allocate":[84],"appropriate":[85],"tools":[86],"intermediate":[88],"steps":[89],"extract":[91],"relevant":[92],"information":[93],"from":[94,171],"3DSG,":[96],"modify":[97],"structure,":[99],"or":[100],"generate":[101],"responses.":[102],"Importantly,":[103],"incorporates":[105],"an":[106],"automatic":[107],"mechanism":[108],"that":[109],"correction":[113],"with":[114,120,127,152],"users":[115],"by":[116,179],"updating":[117],"3DSG":[119],"online":[121],"interaction.":[122],"achieves":[124],"comparable":[125],"performance":[126],"data-driven":[129],"ScanQA":[132],"zero-shot":[135],"manner.":[136],"Through":[137],"comprehensive":[138],"experiments":[139],"across":[140],"10":[141],"scenes,":[143],"demonstrates":[145],"effectiveness":[147],"establishing":[149],"common":[150],"ground":[151],"humans,":[153],"realizing":[154],"success":[156,169],"rate":[157,170],"of":[158],"61.9":[159],"%":[160,175],"tasks.":[163],"It":[164],"also":[165],"significantly":[166],"improves":[167],"3.7%":[172],"45.68":[174],"on":[176],"novel":[177],"transferring":[180],"knowledge":[182],"acquired":[183],"during":[184],"alignment.":[185]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
