{"id":"https://openalex.org/W4288061557","doi":"https://doi.org/10.1109/access.2022.3176608","title":"M-A3C: A Mean-Asynchronous Advantage Actor-Critic Reinforcement Learning Method for Real-Time Gait Planning of Biped Robot","display_name":"M-A3C: A Mean-Asynchronous Advantage Actor-Critic Reinforcement Learning Method for Real-Time Gait Planning of Biped Robot","publication_year":2022,"publication_date":"2022-01-01","ids":{"openalex":"https://openalex.org/W4288061557","doi":"https://doi.org/10.1109/access.2022.3176608"},"language":"en","primary_location":{"id":"doi:10.1109/access.2022.3176608","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2022.3176608","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/9668973/09779214.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://ieeexplore.ieee.org/ielx7/6287639/9668973/09779214.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5059650259","display_name":"Jie Leng","orcid":"https://orcid.org/0000-0002-0927-2200"},"institutions":[{"id":"https://openalex.org/I148128674","display_name":"University of Shanghai for Science and Technology","ror":"https://ror.org/00ay9v204","country_code":"CN","type":"education","lineage":["https://openalex.org/I148128674"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jie Leng","raw_affiliation_strings":["Institute of Machine Intelligence, University of Shanghai for Science and Technology, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Institute of Machine Intelligence, University of Shanghai for Science and Technology, Shanghai, China","institution_ids":["https://openalex.org/I148128674"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060584388","display_name":"Suozhong Fan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Suozhong Fan","raw_affiliation_strings":["Origin Dynamic Intelligent Robot Company Ltd., Zhengzhou, China"],"affiliations":[{"raw_affiliation_string":"Origin Dynamic Intelligent Robot Company Ltd., Zhengzhou, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101681259","display_name":"Jun Tang","orcid":"https://orcid.org/0000-0001-8925-2367"},"institutions":[{"id":"https://openalex.org/I148128674","display_name":"University of Shanghai for Science and Technology","ror":"https://ror.org/00ay9v204","country_code":"CN","type":"education","lineage":["https://openalex.org/I148128674"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jun Tang","raw_affiliation_strings":["Institute of Machine Intelligence, University of Shanghai for Science and Technology, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Institute of Machine Intelligence, University of Shanghai for Science and Technology, Shanghai, China","institution_ids":["https://openalex.org/I148128674"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048016214","display_name":"Haiming Mou","orcid":"https://orcid.org/0000-0001-9754-1214"},"institutions":[{"id":"https://openalex.org/I148128674","display_name":"University of Shanghai for Science and Technology","ror":"https://ror.org/00ay9v204","country_code":"CN","type":"education","lineage":["https://openalex.org/I148128674"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haiming Mou","raw_affiliation_strings":["Institute of Machine Intelligence, University of Shanghai for Science and Technology, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Institute of Machine Intelligence, University of Shanghai for Science and Technology, Shanghai, China","institution_ids":["https://openalex.org/I148128674"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051556369","display_name":"Junxiao Xue","orcid":"https://orcid.org/0000-0003-1569-5362"},"institutions":[{"id":"https://openalex.org/I38877650","display_name":"Zhengzhou University","ror":"https://ror.org/04ypx8c21","country_code":"CN","type":"education","lineage":["https://openalex.org/I38877650"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Junxiao Xue","raw_affiliation_strings":["School of Cyber Science and Engineering, Zhengzhou University, Zhengzhou, China"],"affiliations":[{"raw_affiliation_string":"School of Cyber Science and Engineering, Zhengzhou University, Zhengzhou, China","institution_ids":["https://openalex.org/I38877650"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5021667837","display_name":"Qingdu Li","orcid":"https://orcid.org/0000-0001-9928-7272"},"institutions":[{"id":"https://openalex.org/I148128674","display_name":"University of Shanghai for Science and Technology","ror":"https://ror.org/00ay9v204","country_code":"CN","type":"education","lineage":["https://openalex.org/I148128674"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qingdu Li","raw_affiliation_strings":["Institute of Machine Intelligence, University of Shanghai for Science and Technology, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Institute of Machine Intelligence, University of Shanghai for Science and Technology, Shanghai, China","institution_ids":["https://openalex.org/I148128674"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5059650259"],"corresponding_institution_ids":["https://openalex.org/I148128674"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":0.9777,"has_fulltext":true,"cited_by_count":12,"citation_normalized_percentile":{"value":0.71442226,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":"10","issue":null,"first_page":"76523","last_page":"76536"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9922999739646912,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11023","display_name":"Prosthetics and Rehabilitation Robotics","score":0.9919000267982483,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7890194654464722},{"id":"https://openalex.org/keywords/asynchronous-communication","display_name":"Asynchronous communication","score":0.779904842376709},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7281762957572937},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.5268387198448181},{"id":"https://openalex.org/keywords/gait","display_name":"Gait","score":0.5230777859687805},{"id":"https://openalex.org/keywords/q-learning","display_name":"Q-learning","score":0.4524865448474884},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3858301639556885},{"id":"https://openalex.org/keywords/simulation","display_name":"Simulation","score":0.3813811242580414},{"id":"https://openalex.org/keywords/real-time-computing","display_name":"Real-time computing","score":0.3808259963989258},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.13006219267845154},{"id":"https://openalex.org/keywords/physical-medicine-and-rehabilitation","display_name":"Physical medicine and rehabilitation","score":0.10870739817619324}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7890194654464722},{"id":"https://openalex.org/C151319957","wikidata":"https://www.wikidata.org/wiki/Q752739","display_name":"Asynchronous communication","level":2,"score":0.779904842376709},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7281762957572937},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.5268387198448181},{"id":"https://openalex.org/C151800584","wikidata":"https://www.wikidata.org/wiki/Q2370000","display_name":"Gait","level":2,"score":0.5230777859687805},{"id":"https://openalex.org/C188116033","wikidata":"https://www.wikidata.org/wiki/Q2664563","display_name":"Q-learning","level":3,"score":0.4524865448474884},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3858301639556885},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.3813811242580414},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.3808259963989258},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.13006219267845154},{"id":"https://openalex.org/C99508421","wikidata":"https://www.wikidata.org/wiki/Q2678675","display_name":"Physical medicine and rehabilitation","level":1,"score":0.10870739817619324},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2022.3176608","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2022.3176608","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/9668973/09779214.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:172dfccdfd474603aca3146893330558","is_oa":true,"landing_page_url":"https://doaj.org/article/172dfccdfd474603aca3146893330558","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 10, Pp 76523-76536 (2022)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2022.3176608","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2022.3176608","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/9668973/09779214.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/11","score":0.6499999761581421,"display_name":"Sustainable cities and communities"}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4288061557.pdf","grobid_xml":"https://content.openalex.org/works/W4288061557.grobid-xml"},"referenced_works_count":42,"referenced_works":["https://openalex.org/W50292030","https://openalex.org/W1581909396","https://openalex.org/W1967204107","https://openalex.org/W1977655452","https://openalex.org/W2016102421","https://openalex.org/W2025121834","https://openalex.org/W2029058516","https://openalex.org/W2047174209","https://openalex.org/W2079995373","https://openalex.org/W2085978624","https://openalex.org/W2107726111","https://openalex.org/W2128131727","https://openalex.org/W2137300190","https://openalex.org/W2137547873","https://openalex.org/W2140764512","https://openalex.org/W2158013389","https://openalex.org/W2159443645","https://openalex.org/W2163668399","https://openalex.org/W2402164873","https://openalex.org/W2527645785","https://openalex.org/W2531377421","https://openalex.org/W2563122880","https://openalex.org/W2580909119","https://openalex.org/W2610901891","https://openalex.org/W2766447205","https://openalex.org/W2911087563","https://openalex.org/W3035118532","https://openalex.org/W3090041831","https://openalex.org/W3091282566","https://openalex.org/W3094888885","https://openalex.org/W3112952026","https://openalex.org/W3136437429","https://openalex.org/W3138010110","https://openalex.org/W3174748019","https://openalex.org/W3195824924","https://openalex.org/W3205983103","https://openalex.org/W3214016039","https://openalex.org/W4214717370","https://openalex.org/W6602037555","https://openalex.org/W6637967152","https://openalex.org/W6674304311","https://openalex.org/W6692846177"],"related_works":["https://openalex.org/W2742483371","https://openalex.org/W3096874164","https://openalex.org/W2166117066","https://openalex.org/W3087814763","https://openalex.org/W2357975469","https://openalex.org/W2136202932","https://openalex.org/W4376605461","https://openalex.org/W4400868993","https://openalex.org/W2361647908","https://openalex.org/W2952356279"],"abstract_inverted_index":{"Bipedal":[0],"walking":[1,30,51,122],"is":[2,67,154],"a":[3,14,32,151],"challenging":[4],"task":[5],"for":[6,19],"humanoid":[7],"robots.":[8],"In":[9],"this":[10],"study,":[11],"we":[12,115],"develop":[13],"lightweight":[15],"reinforcement":[16,64],"learning":[17,65],"method":[18,172],"real-time":[20],"gait":[21,83,181],"planning":[22],"of":[23,46,84,96,124,132,146,162],"the":[24,36,41,44,50,56,71,81,85,89,106,110,117,121,125,130,135,139,144,147,160,163,170,175],"biped":[25,152,176],"robot.":[26],"We":[27,92],"regard":[28],"bipedal":[29],"as":[31],"process":[33],"in":[34,109],"which":[35],"robot":[37,86,127,153],"constantly":[38],"interacts":[39],"with":[40],"environment,":[42],"judges":[43],"quality":[45],"control":[47,57,123],"action":[48,76],"through":[49],"state,":[52],"and":[53,75,78,142,156,179],"then":[54],"adjusts":[55],"strategy.":[58],"A":[59],"mean-asynchronous":[60],"advantage":[61],"actor-critic":[62],"(M-A3C)":[63],"algorithm":[66,98],"proposed":[68,164,171],"to":[69,99,120,128,158],"obtain":[70,80],"continuous":[72,178],"state":[73],"space":[74],"space,":[77],"directly":[79],"final":[82,148],"without":[87],"introducing":[88],"reference":[90],"gait.":[91,149],"use":[93],"multiple":[94,101],"sub-agents":[95],"M-A3C":[97],"train":[100],"virtual":[102],"robots":[103],"independently":[104],"at":[105],"same":[107],"time":[108],"physical":[111],"simulation":[112],"platform.":[113],"Then":[114],"transfer":[116],"trained":[118],"model":[119],"actual":[126,136],"reduce":[129],"number":[131],"training":[133,140],"on":[134],"robot,":[137],"improve":[138],"speed,":[141],"ensure":[143],"acquisition":[145],"Finally,":[150],"designed":[155],"fabricated":[157],"verify":[159],"effectiveness":[161],"method.":[165],"Various":[166],"experiments":[167],"show":[168],"that":[169],"can":[173],"achieve":[174],"robot&#x2019;s":[177],"stable":[180],"planning.":[182]},"counts_by_year":[{"year":2025,"cited_by_count":5},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":4},{"year":2022,"cited_by_count":1}],"updated_date":"2026-03-10T16:38:18.471706","created_date":"2025-10-10T00:00:00"}
