{"id":"https://openalex.org/W4388451010","doi":"https://doi.org/10.1109/access.2023.3330782","title":"Sim-to-Real Transfer Reinforcement Learning for Position Control of Pneumatic Continuum Manipulator","display_name":"Sim-to-Real Transfer Reinforcement Learning for Position Control of Pneumatic Continuum Manipulator","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W4388451010","doi":"https://doi.org/10.1109/access.2023.3330782"},"language":"en","primary_location":{"id":"doi:10.1109/access.2023.3330782","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2023.3330782","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/10310215.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/10310215.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100767867","display_name":"Qiang Cheng","orcid":"https://orcid.org/0000-0002-0024-3438"},"institutions":[{"id":"https://openalex.org/I9224756","display_name":"Northeastern University","ror":"https://ror.org/03awzbc87","country_code":"CN","type":"education","lineage":["https://openalex.org/I9224756"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Qiang Cheng","raw_affiliation_strings":["School of Mechanical Engineering and Automation, Northeastern University, Shenyang, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Mechanical Engineering and Automation, Northeastern University, Shenyang, China","institution_ids":["https://openalex.org/I9224756"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077459922","display_name":"Hongshuai Liu","orcid":"https://orcid.org/0000-0003-2515-0059"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hongshuai Liu","raw_affiliation_strings":["Suzhou Automotive Research Institute (Xiangcheng), Tsinghua University, Suzhou, China"],"raw_orcid":"https://orcid.org/0000-0003-2515-0059","affiliations":[{"raw_affiliation_string":"Suzhou Automotive Research Institute (Xiangcheng), Tsinghua University, Suzhou, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030425830","display_name":"Xifeng Gao","orcid":"https://orcid.org/0000-0002-0580-6893"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]},{"id":"https://openalex.org/I890469752","display_name":"Ministry of Industry and Information Technology","ror":"https://ror.org/0385nmy68","country_code":"CN","type":"government","lineage":["https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xifeng Gao","raw_affiliation_strings":["Center of Ultra-Precision Optoelectronic Instrumentation Engineering, Harbin Institute of Technology, Harbin, China","Key Lab of Ultra-Precision Intelligent Instrumentation, Ministry of Industry Information Technology, Harbin, China"],"raw_orcid":"https://orcid.org/0000-0002-0580-6893","affiliations":[{"raw_affiliation_string":"Center of Ultra-Precision Optoelectronic Instrumentation Engineering, Harbin Institute of Technology, Harbin, China","institution_ids":["https://openalex.org/I204983213"]},{"raw_affiliation_string":"Key Lab of Ultra-Precision Intelligent Instrumentation, Ministry of Industry Information Technology, Harbin, China","institution_ids":["https://openalex.org/I890469752"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100386114","display_name":"Ying Zhang","orcid":"https://orcid.org/0000-0002-3091-3973"},"institutions":[{"id":"https://openalex.org/I9224756","display_name":"Northeastern University","ror":"https://ror.org/03awzbc87","country_code":"CN","type":"education","lineage":["https://openalex.org/I9224756"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ying Zhang","raw_affiliation_strings":["School of Mechanical Engineering and Automation, Northeastern University, Shenyang, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Mechanical Engineering and Automation, Northeastern University, Shenyang, China","institution_ids":["https://openalex.org/I9224756"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5067701874","display_name":"Lina Hao","orcid":"https://orcid.org/0000-0001-8791-2253"},"institutions":[{"id":"https://openalex.org/I9224756","display_name":"Northeastern University","ror":"https://ror.org/03awzbc87","country_code":"CN","type":"education","lineage":["https://openalex.org/I9224756"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lina Hao","raw_affiliation_strings":["School of Mechanical Engineering and Automation, Northeastern University, Shenyang, China"],"raw_orcid":"https://orcid.org/0000-0001-8791-2253","affiliations":[{"raw_affiliation_string":"School of Mechanical Engineering and Automation, Northeastern University, Shenyang, China","institution_ids":["https://openalex.org/I9224756"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5100767867"],"corresponding_institution_ids":["https://openalex.org/I9224756"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":0.1062,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.41818248,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"11","issue":null,"first_page":"126110","last_page":"126118"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10868","display_name":"Soft Robotics and Applications","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10868","display_name":"Soft Robotics and Applications","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11372","display_name":"Hydraulic and Pneumatic Systems","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/2210","display_name":"Mechanical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6757041811943054},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.5670607089996338},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5637164115905762},{"id":"https://openalex.org/keywords/position","display_name":"Position (finance)","score":0.4865947961807251},{"id":"https://openalex.org/keywords/pneumatic-actuator","display_name":"Pneumatic actuator","score":0.4304426312446594},{"id":"https://openalex.org/keywords/control-engineering","display_name":"Control engineering","score":0.3708408772945404},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.34676122665405273},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.3354567289352417},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.1929502785205841},{"id":"https://openalex.org/keywords/actuator","display_name":"Actuator","score":0.15210846066474915}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6757041811943054},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.5670607089996338},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5637164115905762},{"id":"https://openalex.org/C198082294","wikidata":"https://www.wikidata.org/wiki/Q3399648","display_name":"Position (finance)","level":2,"score":0.4865947961807251},{"id":"https://openalex.org/C170401851","wikidata":"https://www.wikidata.org/wiki/Q1965061","display_name":"Pneumatic actuator","level":3,"score":0.4304426312446594},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.3708408772945404},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.34676122665405273},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.3354567289352417},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.1929502785205841},{"id":"https://openalex.org/C172707124","wikidata":"https://www.wikidata.org/wiki/Q423488","display_name":"Actuator","level":2,"score":0.15210846066474915},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C10138342","wikidata":"https://www.wikidata.org/wiki/Q43015","display_name":"Finance","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2023.3330782","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2023.3330782","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/10310215.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:b906ccfacafe4dfea399ab4070acd8c9","is_oa":true,"landing_page_url":"https://doaj.org/article/b906ccfacafe4dfea399ab4070acd8c9","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 11, Pp 126110-126118 (2023)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2023.3330782","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2023.3330782","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/10310215.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1759495156","display_name":null,"funder_award_id":"52305569","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2768436946","display_name":null,"funder_award_id":"62103090","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4476734651","display_name":null,"funder_award_id":"62073063","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4388451010.pdf","grobid_xml":"https://content.openalex.org/works/W4388451010.grobid-xml"},"referenced_works_count":25,"referenced_works":["https://openalex.org/W1515749184","https://openalex.org/W1891615552","https://openalex.org/W2095462685","https://openalex.org/W2096645690","https://openalex.org/W2101667962","https://openalex.org/W2145339207","https://openalex.org/W2179284380","https://openalex.org/W2530944449","https://openalex.org/W2605102758","https://openalex.org/W2775361682","https://openalex.org/W2901112449","https://openalex.org/W2910273746","https://openalex.org/W2963864421","https://openalex.org/W2967429195","https://openalex.org/W3008009191","https://openalex.org/W3012402823","https://openalex.org/W3033227671","https://openalex.org/W3035790680","https://openalex.org/W3127125587","https://openalex.org/W4224831007","https://openalex.org/W4286893196","https://openalex.org/W6684921986","https://openalex.org/W6728367041","https://openalex.org/W6774495894","https://openalex.org/W6803128367"],"related_works":["https://openalex.org/W4306904969","https://openalex.org/W2138720691","https://openalex.org/W4362501864","https://openalex.org/W4380318855","https://openalex.org/W3084456289","https://openalex.org/W2024136090","https://openalex.org/W4391331176","https://openalex.org/W2031695474","https://openalex.org/W2617064325","https://openalex.org/W2277095232"],"abstract_inverted_index":{"Reinforcement":[0],"learning(RL)":[1],"is":[2,30,61,94,102,117,144,165],"attempted":[3],"to":[4,7,37,63,119,126,158,171],"be":[5,57,156],"applied":[6,157],"the":[8,15,24,27,38,41,44,47,50,54,64,79,91,97,121,128,131,136,148,150,159,173,176],"control":[9,28,81,122],"of":[10,14,20,49,82,90,100,130,175],"continuum":[11,84],"robots.":[12],"Because":[13],"inefficiency":[16],"and":[17,43,73,112],"high":[18],"cost":[19],"collecting":[21],"samples":[22],"in":[23,33,53,134,153],"real":[25,45,65,160],"world,":[26,46],"strategy":[29,51,71,132,142,151],"usually":[31],"learned":[32,52,133,152],"simulation.":[34],"However,":[35],"due":[36],"gap":[39],"between":[40],"simulation":[42,55,98,154],"performance":[48],"will":[56],"reduced":[58],"when":[59],"it":[60],"transferred":[62],"world.":[66,161],"This":[67],"paper":[68],"proposes":[69],"a":[70,169],"learning":[72,113],"Simulation-to-Real":[74],"(Sim-to-Real)":[75],"transfer":[76,138],"framework":[77],"for":[78,114],"position":[80],"pneumatic":[83],"manipulator":[85],"(PCM).":[86],"The":[87,109],"dynamics":[88],"model":[89],"PCM,":[92],"which":[93],"used":[95,118],"as":[96],"environment":[99],"RL,":[101],"represented":[103],"by":[104],"long":[105],"short-term":[106],"memory":[107],"(LSTM).":[108],"probabilistic":[110],"inference":[111],"control(PILCO":[115],")":[116],"train":[120],"strategy.":[123],"In":[124],"order":[125],"utilize":[127],"information":[129],"simulation,":[135],"Sim-to-Real":[137],"method":[139],"based":[140],"on":[141,168],"fine-tuning":[143,147],"proposed.":[145],"By":[146],"strategy,":[149],"can":[155],"Finally,":[162],"an":[163],"experiment":[164],"carried":[166],"out":[167],"PCM":[170],"verify":[172],"effectiveness":[174],"proposed":[177],"framework.":[178]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-05-06T08:25:59.206177","created_date":"2025-10-10T00:00:00"}
