{"id":"https://openalex.org/W3205734604","doi":"https://doi.org/10.1007/978-3-030-89098-8_14","title":"Learning Robot Grasping from a Random Pile with Deep Q-Learning","display_name":"Learning Robot Grasping from a Random Pile with Deep Q-Learning","publication_year":2021,"publication_date":"2021-01-01","ids":{"openalex":"https://openalex.org/W3205734604","doi":"https://doi.org/10.1007/978-3-030-89098-8_14","mag":"3205734604"},"language":"en","primary_location":{"id":"doi:10.1007/978-3-030-89098-8_14","is_oa":false,"landing_page_url":"https://doi.org/10.1007/978-3-030-89098-8_14","pdf_url":null,"source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100427335","display_name":"Bin Chen","orcid":"https://orcid.org/0000-0002-3979-021X"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]},{"id":"https://openalex.org/I4210094879","display_name":"Shandong Institute of Automation","ror":"https://ror.org/00qdtba35","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210094879","https://openalex.org/I4210142748"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Bin Chen","raw_affiliation_strings":["State Key Lab. of Management and Control for Complex Systems, Institute of Automation, Chinese Academy of Science, Beijing, People's Republic of China","University of Chinese Academy of Sciences, Beijing, People's Republic of China"],"affiliations":[{"raw_affiliation_string":"State Key Lab. of Management and Control for Complex Systems, Institute of Automation, Chinese Academy of Science, Beijing, People's Republic of China","institution_ids":["https://openalex.org/I4210094879"]},{"raw_affiliation_string":"University of Chinese Academy of Sciences, Beijing, People's Republic of China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112188599","display_name":"Jianhua Su","orcid":"https://orcid.org/0000-0002-3865-0493"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]},{"id":"https://openalex.org/I4210094879","display_name":"Shandong Institute of Automation","ror":"https://ror.org/00qdtba35","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210094879","https://openalex.org/I4210142748"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jianhua Su","raw_affiliation_strings":["University of Chinese Academy of Sciences, Beijing, People's Republic of China","State Key Lab. of Management and Control for Complex Systems, Institute of Automation, Chinese Academy of Science, Beijing, People's Republic of China"],"affiliations":[{"raw_affiliation_string":"University of Chinese Academy of Sciences, Beijing, People's Republic of China","institution_ids":["https://openalex.org/I4210165038"]},{"raw_affiliation_string":"State Key Lab. of Management and Control for Complex Systems, Institute of Automation, Chinese Academy of Science, Beijing, People's Republic of China","institution_ids":["https://openalex.org/I4210094879"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051585653","display_name":"Lili Wang","orcid":"https://orcid.org/0000-0002-0422-4277"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]},{"id":"https://openalex.org/I4210094879","display_name":"Shandong Institute of Automation","ror":"https://ror.org/00qdtba35","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210094879","https://openalex.org/I4210142748"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lili Wang","raw_affiliation_strings":["State Key Lab. of Management and Control for Complex Systems, Institute of Automation, Chinese Academy of Science, Beijing, People's Republic of China","University of Chinese Academy of Sciences, Beijing, People's Republic of China"],"affiliations":[{"raw_affiliation_string":"State Key Lab. of Management and Control for Complex Systems, Institute of Automation, Chinese Academy of Science, Beijing, People's Republic of China","institution_ids":["https://openalex.org/I4210094879"]},{"raw_affiliation_string":"University of Chinese Academy of Sciences, Beijing, People's Republic of China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5017003276","display_name":"Qipeng Gu","orcid":"https://orcid.org/0000-0002-3151-6486"},"institutions":[{"id":"https://openalex.org/I4210094879","display_name":"Shandong Institute of Automation","ror":"https://ror.org/00qdtba35","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210094879","https://openalex.org/I4210142748"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qipeng Gu","raw_affiliation_strings":["University of Chinese Academy of Sciences, Beijing, People's Republic of China","State Key Lab. of Management and Control for Complex Systems, Institute of Automation, Chinese Academy of Science, Beijing, People's Republic of China"],"affiliations":[{"raw_affiliation_string":"University of Chinese Academy of Sciences, Beijing, People's Republic of China","institution_ids":["https://openalex.org/I4210165038"]},{"raw_affiliation_string":"State Key Lab. of Management and Control for Complex Systems, Institute of Automation, Chinese Academy of Science, Beijing, People's Republic of China","institution_ids":["https://openalex.org/I4210094879"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5100427335"],"corresponding_institution_ids":["https://openalex.org/I4210094879","https://openalex.org/I4210165038"],"apc_list":{"value":5000,"currency":"EUR","value_usd":5392},"apc_paid":null,"fwci":1.8521,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.85524546,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"142","last_page":"152"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":1.0,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":1.0,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9958000183105469,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10868","display_name":"Soft Robotics and Applications","score":0.9828000068664551,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7804477214813232},{"id":"https://openalex.org/keywords/q-learning","display_name":"Q-learning","score":0.7739880084991455},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.743703305721283},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7324531674385071},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.638039231300354},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.6094210743904114},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.5524406433105469},{"id":"https://openalex.org/keywords/pile","display_name":"Pile","score":0.5268213748931885},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.49721482396125793},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.48391109704971313},{"id":"https://openalex.org/keywords/convolution","display_name":"Convolution (computer science)","score":0.4700794517993927},{"id":"https://openalex.org/keywords/position","display_name":"Position (finance)","score":0.4193386137485504},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.4135507047176361},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.34299522638320923},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.16820093989372253}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7804477214813232},{"id":"https://openalex.org/C188116033","wikidata":"https://www.wikidata.org/wiki/Q2664563","display_name":"Q-learning","level":3,"score":0.7739880084991455},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.743703305721283},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7324531674385071},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.638039231300354},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.6094210743904114},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.5524406433105469},{"id":"https://openalex.org/C119560385","wikidata":"https://www.wikidata.org/wiki/Q7193850","display_name":"Pile","level":2,"score":0.5268213748931885},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.49721482396125793},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.48391109704971313},{"id":"https://openalex.org/C45347329","wikidata":"https://www.wikidata.org/wiki/Q5166604","display_name":"Convolution (computer science)","level":3,"score":0.4700794517993927},{"id":"https://openalex.org/C198082294","wikidata":"https://www.wikidata.org/wiki/Q3399648","display_name":"Position (finance)","level":2,"score":0.4193386137485504},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.4135507047176361},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.34299522638320923},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.16820093989372253},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C10138342","wikidata":"https://www.wikidata.org/wiki/Q43015","display_name":"Finance","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/978-3-030-89098-8_14","is_oa":false,"landing_page_url":"https://doi.org/10.1007/978-3-030-89098-8_14","pdf_url":null,"source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":24,"referenced_works":["https://openalex.org/W169931978","https://openalex.org/W2006833873","https://openalex.org/W2036637075","https://openalex.org/W2041376653","https://openalex.org/W2108598243","https://openalex.org/W2145339207","https://openalex.org/W2151584099","https://openalex.org/W2159290603","https://openalex.org/W2194775991","https://openalex.org/W2201912979","https://openalex.org/W2257979135","https://openalex.org/W2575705757","https://openalex.org/W2775954438","https://openalex.org/W2910474428","https://openalex.org/W2914656440","https://openalex.org/W2962736495","https://openalex.org/W2962793652","https://openalex.org/W2963276406","https://openalex.org/W2963390419","https://openalex.org/W2964198579","https://openalex.org/W2993843460","https://openalex.org/W3112422759","https://openalex.org/W6603326339","https://openalex.org/W6824051750"],"related_works":["https://openalex.org/W2742483371","https://openalex.org/W3096874164","https://openalex.org/W2166117066","https://openalex.org/W3087814763","https://openalex.org/W2357975469","https://openalex.org/W2136202932","https://openalex.org/W4376605461","https://openalex.org/W4400868993","https://openalex.org/W2361647908","https://openalex.org/W2952356279"],"abstract_inverted_index":null,"counts_by_year":[{"year":2023,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
