{"id":"https://openalex.org/W3176770340","doi":"https://doi.org/10.1109/lra.2021.3092640","title":"Efficient Learning of Goal-Oriented Push-Grasping Synergy in Clutter","display_name":"Efficient Learning of Goal-Oriented Push-Grasping Synergy in Clutter","publication_year":2021,"publication_date":"2021-06-28","ids":{"openalex":"https://openalex.org/W3176770340","doi":"https://doi.org/10.1109/lra.2021.3092640","mag":"3176770340"},"language":"en","primary_location":{"id":"doi:10.1109/lra.2021.3092640","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2021.3092640","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5062930488","display_name":"Kechun Xu","orcid":"https://orcid.org/0000-0002-3632-917X"},"institutions":[{"id":"https://openalex.org/I4391767838","display_name":"State Key Laboratory of Industrial Control Technology","ror":"https://ror.org/03a33a786","country_code":null,"type":"facility","lineage":["https://openalex.org/I4391767838","https://openalex.org/I76130692"]},{"id":"https://openalex.org/I55712492","display_name":"Zhejiang University of Technology","ror":"https://ror.org/02djqfd08","country_code":"CN","type":"education","lineage":["https://openalex.org/I55712492"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Kechun Xu","raw_affiliation_strings":["State Key Laboratory of Industrial Control Technology, and Institute of Cyber-Systems and Control, Zhejiang University, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Industrial Control Technology, and Institute of Cyber-Systems and Control, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I55712492","https://openalex.org/I4391767838"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046531091","display_name":"Hongxiang Yu","orcid":"https://orcid.org/0000-0003-1417-0476"},"institutions":[{"id":"https://openalex.org/I4391767838","display_name":"State Key Laboratory of Industrial Control Technology","ror":"https://ror.org/03a33a786","country_code":null,"type":"facility","lineage":["https://openalex.org/I4391767838","https://openalex.org/I76130692"]},{"id":"https://openalex.org/I55712492","display_name":"Zhejiang University of Technology","ror":"https://ror.org/02djqfd08","country_code":"CN","type":"education","lineage":["https://openalex.org/I55712492"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hongxiang Yu","raw_affiliation_strings":["State Key Laboratory of Industrial Control Technology, and Institute of Cyber-Systems and Control, Zhejiang University, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Industrial Control Technology, and Institute of Cyber-Systems and Control, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I55712492","https://openalex.org/I4391767838"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081752951","display_name":"Qianen Lai","orcid":null},"institutions":[{"id":"https://openalex.org/I4391767838","display_name":"State Key Laboratory of Industrial Control Technology","ror":"https://ror.org/03a33a786","country_code":null,"type":"facility","lineage":["https://openalex.org/I4391767838","https://openalex.org/I76130692"]},{"id":"https://openalex.org/I55712492","display_name":"Zhejiang University of Technology","ror":"https://ror.org/02djqfd08","country_code":"CN","type":"education","lineage":["https://openalex.org/I55712492"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qianen Lai","raw_affiliation_strings":["State Key Laboratory of Industrial Control Technology, and Institute of Cyber-Systems and Control, Zhejiang University, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Industrial Control Technology, and Institute of Cyber-Systems and Control, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I55712492","https://openalex.org/I4391767838"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100371992","display_name":"Yue Wang","orcid":"https://orcid.org/0000-0002-0981-935X"},"institutions":[{"id":"https://openalex.org/I4391767838","display_name":"State Key Laboratory of Industrial Control Technology","ror":"https://ror.org/03a33a786","country_code":null,"type":"facility","lineage":["https://openalex.org/I4391767838","https://openalex.org/I76130692"]},{"id":"https://openalex.org/I55712492","display_name":"Zhejiang University of Technology","ror":"https://ror.org/02djqfd08","country_code":"CN","type":"education","lineage":["https://openalex.org/I55712492"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yue Wang","raw_affiliation_strings":["State Key Laboratory of Industrial Control Technology, and Institute of Cyber-Systems and Control, Zhejiang University, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Industrial Control Technology, and Institute of Cyber-Systems and Control, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I55712492","https://openalex.org/I4391767838"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5019081110","display_name":"Rong Xiong","orcid":"https://orcid.org/0000-0001-9318-9014"},"institutions":[{"id":"https://openalex.org/I4391767838","display_name":"State Key Laboratory of Industrial Control Technology","ror":"https://ror.org/03a33a786","country_code":null,"type":"facility","lineage":["https://openalex.org/I4391767838","https://openalex.org/I76130692"]},{"id":"https://openalex.org/I55712492","display_name":"Zhejiang University of Technology","ror":"https://ror.org/02djqfd08","country_code":"CN","type":"education","lineage":["https://openalex.org/I55712492"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Rong Xiong","raw_affiliation_strings":["State Key Laboratory of Industrial Control Technology, and Institute of Cyber-Systems and Control, Zhejiang University, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Industrial Control Technology, and Institute of Cyber-Systems and Control, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I55712492","https://openalex.org/I4391767838"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5062930488"],"corresponding_institution_ids":["https://openalex.org/I4391767838","https://openalex.org/I55712492"],"apc_list":null,"apc_paid":null,"fwci":8.8502,"has_fulltext":false,"cited_by_count":84,"citation_normalized_percentile":{"value":0.98414327,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":95,"max":100},"biblio":{"volume":"6","issue":"4","first_page":"6337","last_page":"6344"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9887999892234802,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10784","display_name":"Muscle activation and electromyography studies","score":0.9840999841690063,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/grasp","display_name":"GRASP","score":0.8539076447486877},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.7350739240646362},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.705964982509613},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5971080660820007},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.5877816081047058},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.5762557983398438},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.551243245601654},{"id":"https://openalex.org/keywords/clutter","display_name":"Clutter","score":0.5512264966964722},{"id":"https://openalex.org/keywords/discriminator","display_name":"Discriminator","score":0.530666172504425},{"id":"https://openalex.org/keywords/generator","display_name":"Generator (circuit theory)","score":0.5201961994171143},{"id":"https://openalex.org/keywords/sample","display_name":"Sample (material)","score":0.4934769868850708},{"id":"https://openalex.org/keywords/inefficiency","display_name":"Inefficiency","score":0.43328163027763367},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.365805983543396},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.35155758261680603},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.18663707375526428},{"id":"https://openalex.org/keywords/power","display_name":"Power (physics)","score":0.1052527129650116}],"concepts":[{"id":"https://openalex.org/C171268870","wikidata":"https://www.wikidata.org/wiki/Q1486676","display_name":"GRASP","level":2,"score":0.8539076447486877},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.7350739240646362},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.705964982509613},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5971080660820007},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.5877816081047058},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.5762557983398438},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.551243245601654},{"id":"https://openalex.org/C132094186","wikidata":"https://www.wikidata.org/wiki/Q641585","display_name":"Clutter","level":3,"score":0.5512264966964722},{"id":"https://openalex.org/C2779803651","wikidata":"https://www.wikidata.org/wiki/Q5282088","display_name":"Discriminator","level":3,"score":0.530666172504425},{"id":"https://openalex.org/C2780992000","wikidata":"https://www.wikidata.org/wiki/Q17016113","display_name":"Generator (circuit theory)","level":3,"score":0.5201961994171143},{"id":"https://openalex.org/C198531522","wikidata":"https://www.wikidata.org/wiki/Q485146","display_name":"Sample (material)","level":2,"score":0.4934769868850708},{"id":"https://openalex.org/C2778869765","wikidata":"https://www.wikidata.org/wiki/Q6028363","display_name":"Inefficiency","level":2,"score":0.43328163027763367},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.365805983543396},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.35155758261680603},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.18663707375526428},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.1052527129650116},{"id":"https://openalex.org/C554190296","wikidata":"https://www.wikidata.org/wiki/Q47528","display_name":"Radar","level":2,"score":0.0},{"id":"https://openalex.org/C175444787","wikidata":"https://www.wikidata.org/wiki/Q39072","display_name":"Microeconomics","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C94915269","wikidata":"https://www.wikidata.org/wiki/Q1834857","display_name":"Detector","level":2,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C43617362","wikidata":"https://www.wikidata.org/wiki/Q170050","display_name":"Chromatography","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/lra.2021.3092640","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2021.3092640","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.699999988079071,"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":45,"referenced_works":["https://openalex.org/W1665214252","https://openalex.org/W1836465849","https://openalex.org/W1903029394","https://openalex.org/W1981667747","https://openalex.org/W2005824379","https://openalex.org/W2036637075","https://openalex.org/W2082511574","https://openalex.org/W2108598243","https://openalex.org/W2201912979","https://openalex.org/W2296360731","https://openalex.org/W2405660904","https://openalex.org/W2600030077","https://openalex.org/W2736534894","https://openalex.org/W2773721443","https://openalex.org/W2789805345","https://openalex.org/W2889969363","https://openalex.org/W2904207885","https://openalex.org/W2962793652","https://openalex.org/W2962889474","https://openalex.org/W2963446712","https://openalex.org/W2963646405","https://openalex.org/W2964001908","https://openalex.org/W2967068439","https://openalex.org/W2969014098","https://openalex.org/W3004047800","https://openalex.org/W3004091482","https://openalex.org/W3021544315","https://openalex.org/W3089580269","https://openalex.org/W3089949728","https://openalex.org/W3090679498","https://openalex.org/W3097484130","https://openalex.org/W3112422759","https://openalex.org/W3132114951","https://openalex.org/W3205918749","https://openalex.org/W4211241511","https://openalex.org/W4300799055","https://openalex.org/W6637242042","https://openalex.org/W6638667902","https://openalex.org/W6714057483","https://openalex.org/W6740801417","https://openalex.org/W6741140343","https://openalex.org/W6746713385","https://openalex.org/W6781789155","https://openalex.org/W6784840303","https://openalex.org/W6786218831"],"related_works":["https://openalex.org/W4293202849","https://openalex.org/W1980965563","https://openalex.org/W1489300767","https://openalex.org/W4380714744","https://openalex.org/W2387995142","https://openalex.org/W4319453655","https://openalex.org/W2057775761","https://openalex.org/W2964074194","https://openalex.org/W2089959425","https://openalex.org/W2163296013"],"abstract_inverted_index":{"We":[0],"focus":[1],"on":[2],"the":[3,38,49,58,62,125,129,144,152,162,252],"task":[4,216],"of":[5,64,151,164,172,190,227],"goal-oriented":[6],"grasping,":[7],"in":[8,20,35,74,102,186,194,215],"which":[9],"a":[10,16,71,80,94,99,117,138,141],"robot":[11,39],"is":[12,90,109,147,179,260],"supposed":[13],"to":[14,30,92,123,181,238,251],"grasp":[15,221],"pre-assigned":[17],"goal":[18,50,121,220],"object":[19,101],"clutter":[21],"and":[22,55,131,140,143,184,196,208,211,219],"needs":[23],"some":[24],"pre-grasp":[25],"actions":[26],"such":[27],"as":[28,137],"pushes":[29],"enable":[31],"stable":[32],"grasps.":[33],"However,":[34],"this":[36,75,78],"task,":[37],"gets":[40],"positive":[41],"rewards":[42],"from":[43],"environment":[44],"only":[45],"when":[46],"successfully":[47],"grasping":[48,56,98,132,153,185,209],"object.":[51],"Besides,":[52],"joint":[53],"pushing":[54,130,145,157,183,207],"elongates":[57],"action":[59],"sequence,":[60],"compounding":[61],"problem":[63,163],"reward":[65],"delay.":[66],"Thus,":[67],"sample":[68,88,107],"inefficiency":[69],"remains":[70],"main":[72],"challenge":[73],"task.":[76],"In":[77,104],"letter,":[79],"goal-conditioned":[81,118],"hierarchical":[82],"reinforcement":[83],"learning":[84],"formulation":[85],"with":[86,149,161,241],"high":[87],"efficiency":[89,108],"proposed":[91],"learn":[93,182,205],"push-grasping":[95],"policy":[96,146],"for":[97],"specific":[100],"clutter.":[103],"our":[105,201,233,246],"work,":[106],"improved":[110],"by":[111,120,168,224],"two":[112,173],"means.":[113],"First,":[114],"we":[115,230],"use":[116],"mechanism":[119],"relabeling":[122],"enrich":[124],"replay":[126],"buffer.":[127],"Second,":[128],"policies":[133,210],"are":[134],"respectively":[135],"regarded":[136],"generator":[139],"discriminator":[142],"trained":[148],"supervision":[150],"discriminator,":[154],"thus":[155],"densifying":[156],"rewards.":[158],"To":[159],"deal":[160],"distribution":[165],"mismatch":[166],"caused":[167],"different":[169],"training":[170,177],"settings":[171],"policies,":[174],"an":[175],"alternating":[176],"stage":[178],"added":[180],"turn.":[187],"A":[188],"series":[189],"experiments":[191],"carried":[192],"out":[193],"simulation":[195],"real":[197,253],"world":[198,254],"indicate":[199],"that":[200,232,245],"method":[202],"can":[203,235,248],"quickly":[204],"effective":[206],"outperforms":[212],"existing":[213],"methods":[214],"completion":[217],"rate":[218,223],"success":[222],"less":[225],"times":[226],"motion.":[228],"Furthermore,":[229],"validate":[231],"system":[234,247],"also":[236],"adapt":[237],"goal-agnostic":[239],"conditions":[240],"better":[242],"performance.":[243],"Note":[244],"be":[249],"transferred":[250],"without":[255],"any":[256],"fine-tuning.":[257],"Our":[258],"code":[259],"available":[261],"at":[262],"https://github.com/xukechun/Efficient_goal-oriented_push-grasping_synergy":[263]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":18},{"year":2024,"cited_by_count":32},{"year":2023,"cited_by_count":19},{"year":2022,"cited_by_count":10},{"year":2021,"cited_by_count":3}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
