{"id":"https://openalex.org/W3089580269","doi":"https://doi.org/10.1109/ijcnn48605.2020.9207153","title":"Combining Reinforcement Learning and Rule-based Method to Manipulate Objects in Clutter","display_name":"Combining Reinforcement Learning and Rule-based Method to Manipulate Objects in Clutter","publication_year":2020,"publication_date":"2020-07-01","ids":{"openalex":"https://openalex.org/W3089580269","doi":"https://doi.org/10.1109/ijcnn48605.2020.9207153","mag":"3089580269"},"language":"en","primary_location":{"id":"doi:10.1109/ijcnn48605.2020.9207153","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn48605.2020.9207153","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://researchportal.port.ac.uk/portal/en/publications/combining-reinforcement-learning-and-rulebased-method-to-manipulate-objects-in-clutter(3f739f08-c245-44f6-bdd3-6a73567cdbc7).html","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100439332","display_name":"Yiwen Chen","orcid":"https://orcid.org/0009-0008-8053-2272"},"institutions":[{"id":"https://openalex.org/I90610280","display_name":"South China University of Technology","ror":"https://ror.org/0530pts50","country_code":"CN","type":"education","lineage":["https://openalex.org/I90610280"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yiwen Chen","raw_affiliation_strings":["School of Automation Science and Engineering, South China University of Technology, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"School of Automation Science and Engineering, South China University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I90610280"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056287221","display_name":"Zhaojie Ju","orcid":"https://orcid.org/0000-0002-9524-7609"},"institutions":[{"id":"https://openalex.org/I63072094","display_name":"University of Portsmouth","ror":"https://ror.org/03ykbk197","country_code":"GB","type":"education","lineage":["https://openalex.org/I63072094"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Zhaojie Ju","raw_affiliation_strings":["School of Computing, University of Portsmouth, Portsmouth, UK"],"affiliations":[{"raw_affiliation_string":"School of Computing, University of Portsmouth, Portsmouth, UK","institution_ids":["https://openalex.org/I63072094"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5019906827","display_name":"Chenguang Yang","orcid":"https://orcid.org/0000-0001-5255-5559"},"institutions":[{"id":"https://openalex.org/I178535277","display_name":"University of the West of England","ror":"https://ror.org/02nwg5t34","country_code":"GB","type":"education","lineage":["https://openalex.org/I178535277"]},{"id":"https://openalex.org/I4210161128","display_name":"Bristol Robotics Laboratory","ror":"https://ror.org/056sbyc67","country_code":"GB","type":"facility","lineage":["https://openalex.org/I4210161128"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Chenguang Yang","raw_affiliation_strings":["Bristol Robotics Laboratory, University of the West of England, Bristol, UK"],"affiliations":[{"raw_affiliation_string":"Bristol Robotics Laboratory, University of the West of England, Bristol, UK","institution_ids":["https://openalex.org/I4210161128","https://openalex.org/I178535277"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5100439332"],"corresponding_institution_ids":["https://openalex.org/I90610280"],"apc_list":null,"apc_paid":null,"fwci":1.785,"has_fulltext":true,"cited_by_count":21,"citation_normalized_percentile":{"value":0.84975451,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12784","display_name":"Modular Robots and Swarm Intelligence","score":0.9775000214576721,"subfield":{"id":"https://openalex.org/subfields/2210","display_name":"Mechanical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/grasp","display_name":"GRASP","score":0.924674391746521},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8129388093948364},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7568738460540771},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7056220173835754},{"id":"https://openalex.org/keywords/clutter","display_name":"Clutter","score":0.692718505859375},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.6486230492591858},{"id":"https://openalex.org/keywords/robot-learning","display_name":"Robot learning","score":0.5259830355644226},{"id":"https://openalex.org/keywords/programming-by-demonstration","display_name":"Programming by demonstration","score":0.5100584626197815},{"id":"https://openalex.org/keywords/table","display_name":"Table (database)","score":0.48004138469696045},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.45085495710372925},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.449117511510849},{"id":"https://openalex.org/keywords/point","display_name":"Point (geometry)","score":0.44176262617111206},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.33236733078956604},{"id":"https://openalex.org/keywords/mobile-robot","display_name":"Mobile robot","score":0.18231049180030823},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.12276354432106018},{"id":"https://openalex.org/keywords/radar","display_name":"Radar","score":0.09943485260009766},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.07844102382659912},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.07625752687454224}],"concepts":[{"id":"https://openalex.org/C171268870","wikidata":"https://www.wikidata.org/wiki/Q1486676","display_name":"GRASP","level":2,"score":0.924674391746521},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8129388093948364},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7568738460540771},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7056220173835754},{"id":"https://openalex.org/C132094186","wikidata":"https://www.wikidata.org/wiki/Q641585","display_name":"Clutter","level":3,"score":0.692718505859375},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.6486230492591858},{"id":"https://openalex.org/C188888258","wikidata":"https://www.wikidata.org/wiki/Q7353390","display_name":"Robot learning","level":4,"score":0.5259830355644226},{"id":"https://openalex.org/C2779038628","wikidata":"https://www.wikidata.org/wiki/Q7248497","display_name":"Programming by demonstration","level":3,"score":0.5100584626197815},{"id":"https://openalex.org/C45235069","wikidata":"https://www.wikidata.org/wiki/Q278425","display_name":"Table (database)","level":2,"score":0.48004138469696045},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.45085495710372925},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.449117511510849},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.44176262617111206},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.33236733078956604},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.18231049180030823},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.12276354432106018},{"id":"https://openalex.org/C554190296","wikidata":"https://www.wikidata.org/wiki/Q47528","display_name":"Radar","level":2,"score":0.09943485260009766},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.07844102382659912},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.07625752687454224},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/ijcnn48605.2020.9207153","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn48605.2020.9207153","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"},{"id":"pmh:oai:researchportal.port.ac.uk:publications/3f739f08-c245-44f6-bdd3-6a73567cdbc7","is_oa":true,"landing_page_url":null,"pdf_url":"https://researchportal.port.ac.uk/portal/en/publications/combining-reinforcement-learning-and-rulebased-method-to-manipulate-objects-in-clutter(3f739f08-c245-44f6-bdd3-6a73567cdbc7).html","source":{"id":"https://openalex.org/S4306401774","display_name":"Portsmouth Research Portal (University of Portsmouth)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I63072094","host_organization_name":"University of Portsmouth","host_organization_lineage":["https://openalex.org/I63072094"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":""}],"best_oa_location":{"id":"pmh:oai:researchportal.port.ac.uk:publications/3f739f08-c245-44f6-bdd3-6a73567cdbc7","is_oa":true,"landing_page_url":null,"pdf_url":"https://researchportal.port.ac.uk/portal/en/publications/combining-reinforcement-learning-and-rulebased-method-to-manipulate-objects-in-clutter(3f739f08-c245-44f6-bdd3-6a73567cdbc7).html","source":{"id":"https://openalex.org/S4306401774","display_name":"Portsmouth Research Portal (University of Portsmouth)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I63072094","host_organization_name":"University of Portsmouth","host_organization_lineage":["https://openalex.org/I63072094"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":""},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1934935867","display_name":null,"funder_award_id":"Engineering and Physical Sciences R","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G5842171993","display_name":null,"funder_award_id":"P/S001913","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G915687489","display_name":null,"funder_award_id":"EP/S001913","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"}],"funders":[{"id":"https://openalex.org/F4320334627","display_name":"Engineering and Physical Sciences Research Council","ror":"https://ror.org/0439y7842"}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W3089580269.pdf"},"referenced_works_count":22,"referenced_works":["https://openalex.org/W1999156278","https://openalex.org/W2145339207","https://openalex.org/W2173248099","https://openalex.org/W2257979135","https://openalex.org/W2600030077","https://openalex.org/W2778092082","https://openalex.org/W2781726626","https://openalex.org/W2787938642","https://openalex.org/W2808844346","https://openalex.org/W2810785043","https://openalex.org/W2824754393","https://openalex.org/W2899508538","https://openalex.org/W2916933307","https://openalex.org/W2953431737","https://openalex.org/W2962736495","https://openalex.org/W2962759351","https://openalex.org/W2962793652","https://openalex.org/W2963033241","https://openalex.org/W2968095426","https://openalex.org/W2979421998","https://openalex.org/W2989940186","https://openalex.org/W3004003541"],"related_works":["https://openalex.org/W2577369411","https://openalex.org/W2147505856","https://openalex.org/W2930863966","https://openalex.org/W2126211886","https://openalex.org/W3153786280","https://openalex.org/W3127551068","https://openalex.org/W2944639335","https://openalex.org/W2643884694","https://openalex.org/W2165180011","https://openalex.org/W27526006"],"abstract_inverted_index":{"Picking":[0],"up":[1,43],"the":[2,30,44,60,67,78,83,100,109,126,130],"clustered":[3],"objects":[4,45,61],"is":[5,74,86,89,119],"always":[6],"a":[7,37,104,120,136,149],"challenging":[8],"task":[9],"in":[10,46],"robot":[11,18,68],"research":[12],"field.":[13],"And":[14],"reinforcement":[15,53,79],"learning":[16,54,80],"enables":[17],"to":[19,21,41],"adapt":[20],"different":[22],"tasks":[23],"through":[24],"plenty":[25],"of":[26,32,128],"attempts.":[27],"To":[28,58],"reduce":[29],"complexity":[31],"strategy":[33],"learning,":[34],"we":[35,64],"propose":[36],"framework":[38,146],"for":[39,108,138],"robots":[40],"pick":[42],"clutter":[47,161],"on":[48,51,62,125],"table":[49],"based":[50],"deep":[52],"and":[55],"rule-based":[56],"method.":[57],"manipulate":[59],"table,":[63],"mainly":[65],"divide":[66],"actions":[69],"into":[70],"two":[71],"categories:":[72],"one":[73,85],"pushing":[75,96,139],"that":[76,88],"uses":[77],"method,":[81],"while":[82],"other":[84],"grasping":[87],"inferred":[90],"by":[91],"image":[92],"morphological":[93],"processing.":[94],"The":[95,112],"action":[97],"can":[98,147],"separate":[99],"stacking":[101],"objects,":[102],"create":[103],"robust":[105],"grasp":[106,113,122,131,151],"point":[107],"following":[110],"grasp.":[111],"detect":[114,132],"algorithm":[115,133],"determines":[116],"if":[117],"there":[118],"suitable":[121],"point.":[123],"Judging":[124],"result":[127],"pushing,":[129],"will":[134],"return":[135],"reward":[137],"learning.":[140],"Taking":[141],"images":[142],"as":[143],"input,":[144],"our":[145],"keep":[148],"high":[150],"rate":[152],"with":[153],"low":[154],"computational":[155],"complexity,":[156],"which":[157],"makes":[158],"it":[159],"achieve":[160],"clearing":[162],"quickly.":[163]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":6},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":7},{"year":2021,"cited_by_count":3}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
