{"id":"https://openalex.org/W4313060564","doi":"https://doi.org/10.1109/iros47612.2022.9981669","title":"Deep Reinforcement Learning Based on Local GNN for Goal-Conditioned Deformable Object Rearranging","display_name":"Deep Reinforcement Learning Based on Local GNN for Goal-Conditioned Deformable Object Rearranging","publication_year":2022,"publication_date":"2022-10-23","ids":{"openalex":"https://openalex.org/W4313060564","doi":"https://doi.org/10.1109/iros47612.2022.9981669"},"language":"en","primary_location":{"id":"doi:10.1109/iros47612.2022.9981669","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros47612.2022.9981669","pdf_url":null,"source":{"id":"https://openalex.org/S4363607704","display_name":"2022 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2302.10446","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5052849786","display_name":"Yuhong Deng","orcid":null},"institutions":[{"id":"https://openalex.org/I4210114105","display_name":"Tsinghua\u2013Berkeley Shenzhen Institute","ror":"https://ror.org/02hhwwz98","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210114105","https://openalex.org/I95457486","https://openalex.org/I99065089"]},{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yuhong Deng","raw_affiliation_strings":["Tencent Robotics X Lab,Shenzhen,China","Tencent Robotics X Lab, Shenzhen, China","The Center for Intelligent Control and Telescience, Tsinghua Shenzhen International Graduate School, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Tencent Robotics X Lab,Shenzhen,China","institution_ids":["https://openalex.org/I2250653659"]},{"raw_affiliation_string":"Tencent Robotics X Lab, Shenzhen, China","institution_ids":["https://openalex.org/I2250653659"]},{"raw_affiliation_string":"The Center for Intelligent Control and Telescience, Tsinghua Shenzhen International Graduate School, Shenzhen, China","institution_ids":["https://openalex.org/I4210114105"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014423743","display_name":"Chongkun Xia","orcid":"https://orcid.org/0000-0001-5396-7643"},"institutions":[{"id":"https://openalex.org/I4210114105","display_name":"Tsinghua\u2013Berkeley Shenzhen Institute","ror":"https://ror.org/02hhwwz98","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210114105","https://openalex.org/I95457486","https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chongkun Xia","raw_affiliation_strings":["Tsinghua Shenzhen International Graduate School,The Center for Intelligent Control and Telescience,Shenzhen,China","The Center for Intelligent Control and Telescience, Tsinghua Shenzhen International Graduate School, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua Shenzhen International Graduate School,The Center for Intelligent Control and Telescience,Shenzhen,China","institution_ids":[]},{"raw_affiliation_string":"The Center for Intelligent Control and Telescience, Tsinghua Shenzhen International Graduate School, Shenzhen, China","institution_ids":["https://openalex.org/I4210114105"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100737125","display_name":"Xueqian Wang","orcid":"https://orcid.org/0000-0003-3542-0593"},"institutions":[{"id":"https://openalex.org/I4210114105","display_name":"Tsinghua\u2013Berkeley Shenzhen Institute","ror":"https://ror.org/02hhwwz98","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210114105","https://openalex.org/I95457486","https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xueqian Wang","raw_affiliation_strings":["Tsinghua Shenzhen International Graduate School,The Center for Intelligent Control and Telescience,Shenzhen,China","The Center for Intelligent Control and Telescience, Tsinghua Shenzhen International Graduate School, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua Shenzhen International Graduate School,The Center for Intelligent Control and Telescience,Shenzhen,China","institution_ids":[]},{"raw_affiliation_string":"The Center for Intelligent Control and Telescience, Tsinghua Shenzhen International Graduate School, Shenzhen, China","institution_ids":["https://openalex.org/I4210114105"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5102898812","display_name":"Lipeng Chen","orcid":"https://orcid.org/0000-0003-2169-2766"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lipeng Chen","raw_affiliation_strings":["Tencent Robotics X Lab,Shenzhen,China","Tencent Robotics X Lab, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Tencent Robotics X Lab,Shenzhen,China","institution_ids":["https://openalex.org/I2250653659"]},{"raw_affiliation_string":"Tencent Robotics X Lab, Shenzhen, China","institution_ids":["https://openalex.org/I2250653659"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5052849786"],"corresponding_institution_ids":["https://openalex.org/I2250653659","https://openalex.org/I4210114105"],"apc_list":null,"apc_paid":null,"fwci":4.5953,"has_fulltext":true,"cited_by_count":14,"citation_normalized_percentile":{"value":0.97036665,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1131","last_page":"1138"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9775000214576721,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8209258317947388},{"id":"https://openalex.org/keywords/rope","display_name":"Rope","score":0.7860342860221863},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.773802638053894},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.5616708397865295},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5576742887496948},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.5127090215682983},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.5048280358314514},{"id":"https://openalex.org/keywords/encode","display_name":"ENCODE","score":0.4719126522541046},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.4664936065673828},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.46062153577804565},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.45096710324287415},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.3735503852367401},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.1449020504951477},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.0804615318775177}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8209258317947388},{"id":"https://openalex.org/C162269090","wikidata":"https://www.wikidata.org/wiki/Q1156047","display_name":"Rope","level":2,"score":0.7860342860221863},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.773802638053894},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.5616708397865295},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5576742887496948},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.5127090215682983},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.5048280358314514},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.4719126522541046},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.4664936065673828},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.46062153577804565},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.45096710324287415},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.3735503852367401},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.1449020504951477},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0804615318775177},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/iros47612.2022.9981669","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros47612.2022.9981669","pdf_url":null,"source":{"id":"https://openalex.org/S4363607704","display_name":"2022 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2302.10446","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2302.10446","pdf_url":"https://arxiv.org/pdf/2302.10446","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2302.10446","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2302.10446","pdf_url":"https://arxiv.org/pdf/2302.10446","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4313060564.pdf"},"referenced_works_count":33,"referenced_works":["https://openalex.org/W2083331227","https://openalex.org/W2418720700","https://openalex.org/W2953406320","https://openalex.org/W2955368974","https://openalex.org/W2962871243","https://openalex.org/W2963092423","https://openalex.org/W2966271811","https://openalex.org/W3003169307","https://openalex.org/W3004091482","https://openalex.org/W3012514211","https://openalex.org/W3035880432","https://openalex.org/W3040477237","https://openalex.org/W3104901003","https://openalex.org/W3130633756","https://openalex.org/W3159681073","https://openalex.org/W3164946289","https://openalex.org/W3200958309","https://openalex.org/W3203511201","https://openalex.org/W3207181464","https://openalex.org/W3210071715","https://openalex.org/W3210940825","https://openalex.org/W4297686387","https://openalex.org/W4385245566","https://openalex.org/W6739901393","https://openalex.org/W6752818329","https://openalex.org/W6765456200","https://openalex.org/W6774733536","https://openalex.org/W6785308759","https://openalex.org/W6785459237","https://openalex.org/W6787812375","https://openalex.org/W6794857441","https://openalex.org/W6801810553","https://openalex.org/W6801890467"],"related_works":["https://openalex.org/W2468279273","https://openalex.org/W2382190654","https://openalex.org/W2354198838","https://openalex.org/W1989130879","https://openalex.org/W2103419012","https://openalex.org/W2041034200","https://openalex.org/W2373129217","https://openalex.org/W1924903628","https://openalex.org/W2375717371","https://openalex.org/W4390286213"],"abstract_inverted_index":{"Object":[0],"rearranging":[1,66,153],"is":[2,81,119,126,142],"one":[3],"of":[4,70,87],"the":[5,12,42,85,88],"most":[6],"common":[7],"deformable":[8,18,65],"manipulation":[9,62,130],"tasks,":[10,67],"where":[11],"robot":[13,165],"needs":[14],"to":[15,53,58,79,84,112,137,162],"rearrange":[16],"a":[17,21,55,98,163,168],"object":[19],"into":[20],"goal":[22],"configuration.":[23],"Previous":[24],"studies":[25],"focus":[26],"on":[27],"designing":[28],"an":[29],"expert":[30],"system":[31],"for":[32,64,121,128],"each":[33],"specific":[34],"task":[35],"by":[36,166],"model-based":[37],"or":[38],"data-driven":[39],"approaches":[40],"and":[41,124,150,157],"application":[43],"scenarios":[44],"are":[45],"therefore":[46],"limited.":[47],"Some":[48],"research":[49],"has":[50],"been":[51,135],"attempting":[52],"design":[54,97],"general":[56],"framework":[57,141],"obtain":[59],"more":[60],"advanced":[61],"capabilities":[63],"with":[68],"lots":[69],"progress":[71],"achieved":[72],"in":[73,144,155],"simulation.":[74],"However,":[75],"transferring":[76],"from":[77,116],"simulation":[78,156],"reality":[80],"difficult":[82],"due":[83],"limitation":[86],"end-to-end":[89],"CNN":[90],"architecture.":[91],"To":[92],"address":[93],"these":[94],"challenges,":[95],"we":[96],"local":[99],"GNN":[100],"(Graph":[101],"Neural":[102],"Network)":[103],"based":[104],"learning":[105],"method,":[106],"which":[107],"utilizes":[108],"two":[109],"representation":[110],"graphs":[111],"encode":[113],"keypoints":[114],"detected":[115],"images.":[117],"Self-attention":[118],"applied":[120,127],"graph":[122],"updating":[123],"cross-attention":[125],"generating":[129],"actions.":[131],"Extensive":[132],"experiments":[133],"have":[134],"conducted":[136],"demonstrate":[138],"that":[139],"our":[140],"effective":[143],"multiple":[145],"1-D":[146],"(rope,":[147],"rope":[148],"ring)":[149],"2-D":[151],"(cloth)":[152],"tasks":[154],"can":[158],"be":[159],"easily":[160],"transferred":[161],"real":[164],"fine-tuning":[167],"keypoint":[169],"detector.":[170]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":6},{"year":2024,"cited_by_count":6},{"year":2023,"cited_by_count":1}],"updated_date":"2026-03-22T08:09:32.410652","created_date":"2025-10-10T00:00:00"}
