{"id":"https://openalex.org/W2766702649","doi":"https://doi.org/10.1007/978-3-319-70139-4_44","title":"A Linear Online Guided Policy Search Algorithm","display_name":"A Linear Online Guided Policy Search Algorithm","publication_year":2017,"publication_date":"2017-01-01","ids":{"openalex":"https://openalex.org/W2766702649","doi":"https://doi.org/10.1007/978-3-319-70139-4_44","mag":"2766702649"},"language":"en","primary_location":{"id":"doi:10.1007/978-3-319-70139-4_44","is_oa":false,"landing_page_url":"https://doi.org/10.1007/978-3-319-70139-4_44","pdf_url":null,"source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101979437","display_name":"Biao Sun","orcid":"https://orcid.org/0000-0001-6677-8673"},"institutions":[{"id":"https://openalex.org/I4210094879","display_name":"Shandong Institute of Automation","ror":"https://ror.org/00qdtba35","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210094879","https://openalex.org/I4210142748"]},{"id":"https://openalex.org/I92403157","display_name":"University of Science and Technology Beijing","ror":"https://ror.org/02egmk993","country_code":"CN","type":"education","lineage":["https://openalex.org/I92403157"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Biao Sun","raw_affiliation_strings":["The State Key Lab of Management and Control for Complex Systems, Institute of Automation, Chinese Academy of Science, Beijing, 100190, China","University of Science and Technology Beijing, Beijing, 100083, China"],"affiliations":[{"raw_affiliation_string":"The State Key Lab of Management and Control for Complex Systems, Institute of Automation, Chinese Academy of Science, Beijing, 100190, China","institution_ids":["https://openalex.org/I4210094879"]},{"raw_affiliation_string":"University of Science and Technology Beijing, Beijing, 100083, China","institution_ids":["https://openalex.org/I92403157"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056039500","display_name":"Fangzhou Xiong","orcid":"https://orcid.org/0000-0002-2592-4096"},"institutions":[{"id":"https://openalex.org/I4210094879","display_name":"Shandong Institute of Automation","ror":"https://ror.org/00qdtba35","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210094879","https://openalex.org/I4210142748"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Fangzhou Xiong","raw_affiliation_strings":["School of Computer and Control, University of Chinese Academy of Sciences (UCAS), Beijing, 100049, China","The State Key Lab of Management and Control for Complex Systems, Institute of Automation, Chinese Academy of Science, Beijing, 100190, China"],"affiliations":[{"raw_affiliation_string":"School of Computer and Control, University of Chinese Academy of Sciences (UCAS), Beijing, 100049, China","institution_ids":["https://openalex.org/I4210165038"]},{"raw_affiliation_string":"The State Key Lab of Management and Control for Complex Systems, Institute of Automation, Chinese Academy of Science, Beijing, 100190, China","institution_ids":["https://openalex.org/I4210094879"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100434504","display_name":"Zhiyong Liu","orcid":"https://orcid.org/0000-0003-2148-1846"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]},{"id":"https://openalex.org/I4210094879","display_name":"Shandong Institute of Automation","ror":"https://ror.org/00qdtba35","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210094879","https://openalex.org/I4210142748"]},{"id":"https://openalex.org/I4210144487","display_name":"Cloud Computing Center","ror":"https://ror.org/04aa0zm65","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210144487"]},{"id":"https://openalex.org/I4210097554","display_name":"Center for Excellence in Brain Science and Intelligence Technology","ror":"https://ror.org/00vpwhm04","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210097554"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhiyong Liu","raw_affiliation_strings":["CAS Centre for Excellence in Brain Science and Intelligence Technology (CEBSIT), Shanghai, 200031, China","Cloud Computing Center, Chinese Academy of Sciences, DongGuan, 523808, Guandong, China","School of Computer and Control, University of Chinese Academy of Sciences (UCAS), Beijing, 100049, China","The State Key Lab of Management and Control for Complex Systems, Institute of Automation, Chinese Academy of Science, Beijing, 100190, China"],"affiliations":[{"raw_affiliation_string":"CAS Centre for Excellence in Brain Science and Intelligence Technology (CEBSIT), Shanghai, 200031, China","institution_ids":["https://openalex.org/I4210097554"]},{"raw_affiliation_string":"Cloud Computing Center, Chinese Academy of Sciences, DongGuan, 523808, Guandong, China","institution_ids":["https://openalex.org/I4210144487"]},{"raw_affiliation_string":"School of Computer and Control, University of Chinese Academy of Sciences (UCAS), Beijing, 100049, China","institution_ids":["https://openalex.org/I4210165038"]},{"raw_affiliation_string":"The State Key Lab of Management and Control for Complex Systems, Institute of Automation, Chinese Academy of Science, Beijing, 100190, China","institution_ids":["https://openalex.org/I4210094879"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007963696","display_name":"Xu Yang","orcid":"https://orcid.org/0000-0003-0553-4581"},"institutions":[{"id":"https://openalex.org/I4210094879","display_name":"Shandong Institute of Automation","ror":"https://ror.org/00qdtba35","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210094879","https://openalex.org/I4210142748"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xu Yang","raw_affiliation_strings":["The State Key Lab of Management and Control for Complex Systems, Institute of Automation, Chinese Academy of Science, Beijing, 100190, China"],"affiliations":[{"raw_affiliation_string":"The State Key Lab of Management and Control for Complex Systems, Institute of Automation, Chinese Academy of Science, Beijing, 100190, China","institution_ids":["https://openalex.org/I4210094879"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5026688050","display_name":"Hong Qiao","orcid":"https://orcid.org/0000-0001-6384-3687"},"institutions":[{"id":"https://openalex.org/I92403157","display_name":"University of Science and Technology Beijing","ror":"https://ror.org/02egmk993","country_code":"CN","type":"education","lineage":["https://openalex.org/I92403157"]},{"id":"https://openalex.org/I4210094879","display_name":"Shandong Institute of Automation","ror":"https://ror.org/00qdtba35","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210094879","https://openalex.org/I4210142748"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]},{"id":"https://openalex.org/I4210097554","display_name":"Center for Excellence in Brain Science and Intelligence Technology","ror":"https://ror.org/00vpwhm04","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210097554"]},{"id":"https://openalex.org/I4210144487","display_name":"Cloud Computing Center","ror":"https://ror.org/04aa0zm65","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210144487"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hong Qiao","raw_affiliation_strings":["CAS Centre for Excellence in Brain Science and Intelligence Technology (CEBSIT), Shanghai, 200031, China","Cloud Computing Center, Chinese Academy of Sciences, DongGuan, 523808, Guandong, China","School of Computer and Control, University of Chinese Academy of Sciences (UCAS), Beijing, 100049, China","The State Key Lab of Management and Control for Complex Systems, Institute of Automation, Chinese Academy of Science, Beijing, 100190, China","University of Science and Technology Beijing, Beijing, 100083, China"],"affiliations":[{"raw_affiliation_string":"CAS Centre for Excellence in Brain Science and Intelligence Technology (CEBSIT), Shanghai, 200031, China","institution_ids":["https://openalex.org/I4210097554"]},{"raw_affiliation_string":"Cloud Computing Center, Chinese Academy of Sciences, DongGuan, 523808, Guandong, China","institution_ids":["https://openalex.org/I4210144487"]},{"raw_affiliation_string":"School of Computer and Control, University of Chinese Academy of Sciences (UCAS), Beijing, 100049, China","institution_ids":["https://openalex.org/I4210165038"]},{"raw_affiliation_string":"The State Key Lab of Management and Control for Complex Systems, Institute of Automation, Chinese Academy of Science, Beijing, 100190, China","institution_ids":["https://openalex.org/I4210094879"]},{"raw_affiliation_string":"University of Science and Technology Beijing, Beijing, 100083, China","institution_ids":["https://openalex.org/I92403157"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5101979437"],"corresponding_institution_ids":["https://openalex.org/I4210094879","https://openalex.org/I92403157"],"apc_list":{"value":5000,"currency":"EUR","value_usd":5392},"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.16841766,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":93,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"434","last_page":"441"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9961000084877014,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.791185736656189},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7562538385391235},{"id":"https://openalex.org/keywords/witness","display_name":"Witness","score":0.6540415287017822},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6471377611160278},{"id":"https://openalex.org/keywords/convergence","display_name":"Convergence (economics)","score":0.6318738460540771},{"id":"https://openalex.org/keywords/encode","display_name":"ENCODE","score":0.5879796147346497},{"id":"https://openalex.org/keywords/global-positioning-system","display_name":"Global Positioning System","score":0.5674146413803101},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.4449272155761719},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4286215305328369},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.35751235485076904},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.35655850172042847},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.3264387547969818},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.10917890071868896}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.791185736656189},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7562538385391235},{"id":"https://openalex.org/C2776900844","wikidata":"https://www.wikidata.org/wiki/Q8028383","display_name":"Witness","level":2,"score":0.6540415287017822},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6471377611160278},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.6318738460540771},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.5879796147346497},{"id":"https://openalex.org/C60229501","wikidata":"https://www.wikidata.org/wiki/Q18822","display_name":"Global Positioning System","level":2,"score":0.5674146413803101},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4449272155761719},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4286215305328369},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.35751235485076904},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.35655850172042847},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3264387547969818},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.10917890071868896},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C50522688","wikidata":"https://www.wikidata.org/wiki/Q189833","display_name":"Economic growth","level":1,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/978-3-319-70139-4_44","is_oa":false,"landing_page_url":"https://doi.org/10.1007/978-3-319-70139-4_44","pdf_url":null,"source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.5099999904632568,"id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":15,"referenced_works":["https://openalex.org/W1519626139","https://openalex.org/W1731081199","https://openalex.org/W2012587148","https://openalex.org/W2051620263","https://openalex.org/W2098284983","https://openalex.org/W2100235553","https://openalex.org/W2104733512","https://openalex.org/W2121103318","https://openalex.org/W2152740345","https://openalex.org/W2163533082","https://openalex.org/W2529601334","https://openalex.org/W2963630259","https://openalex.org/W2964161785","https://openalex.org/W3146846077","https://openalex.org/W6653548176"],"related_works":["https://openalex.org/W2890518300","https://openalex.org/W2366687089","https://openalex.org/W2468279273","https://openalex.org/W588843504","https://openalex.org/W2382947717","https://openalex.org/W4302574074","https://openalex.org/W2354198838","https://openalex.org/W2360970878","https://openalex.org/W2382362122","https://openalex.org/W2390813549"],"abstract_inverted_index":null,"counts_by_year":[{"year":2021,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
