{"id":"https://openalex.org/W3094602391","doi":"https://doi.org/10.1162/neco_a_01333","title":"Efficient Actor-Critic Reinforcement Learning With Embodiment of Muscle Tone for Posture Stabilization of the Human Arm","display_name":"Efficient Actor-Critic Reinforcement Learning With Embodiment of Muscle Tone for Posture Stabilization of the Human Arm","publication_year":2020,"publication_date":"2020-10-20","ids":{"openalex":"https://openalex.org/W3094602391","doi":"https://doi.org/10.1162/neco_a_01333","mag":"3094602391","pmid":"https://pubmed.ncbi.nlm.nih.gov/33080164"},"language":"en","primary_location":{"id":"doi:10.1162/neco_a_01333","is_oa":false,"landing_page_url":"https://doi.org/10.1162/neco_a_01333","pdf_url":null,"source":{"id":"https://openalex.org/S207023548","display_name":"Neural Computation","issn_l":"0899-7667","issn":["0899-7667","1530-888X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310315718","host_organization_name":"The MIT Press","host_organization_lineage":["https://openalex.org/P4310315718"],"host_organization_lineage_names":["The MIT Press"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Neural Computation","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103087763","display_name":"Masami Iwamoto","orcid":"https://orcid.org/0000-0002-0738-521X"},"institutions":[{"id":"https://openalex.org/I4210165351","display_name":"Toyota Central Research and Development Laboratories (Japan)","ror":"https://ror.org/05mjgqe69","country_code":"JP","type":"company","lineage":["https://openalex.org/I4210125472","https://openalex.org/I4210165351"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Masami Iwamoto","raw_affiliation_strings":["Toyota Central R&D Labs., Aichi 480-1192 Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Toyota Central R&D Labs., Aichi 480-1192 Japan","institution_ids":["https://openalex.org/I4210165351"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5103860365","display_name":"Daichi Kato","orcid":null},"institutions":[{"id":"https://openalex.org/I4210165351","display_name":"Toyota Central Research and Development Laboratories (Japan)","ror":"https://ror.org/05mjgqe69","country_code":"JP","type":"company","lineage":["https://openalex.org/I4210125472","https://openalex.org/I4210165351"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Daichi Kato","raw_affiliation_strings":["Toyota Central R&D Labs., Aichi 480-1192 Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Toyota Central R&D Labs., Aichi 480-1192 Japan","institution_ids":["https://openalex.org/I4210165351"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5103087763","https://openalex.org/A5103860365"],"corresponding_institution_ids":["https://openalex.org/I4210165351"],"apc_list":null,"apc_paid":null,"fwci":0.1742,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.47717133,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":"33","issue":"1","first_page":"129","last_page":"156"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10784","display_name":"Muscle activation and electromyography studies","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10784","display_name":"Muscle activation and electromyography studies","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10982","display_name":"Motor Control and Adaptation","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10114","display_name":"Balance, Gait, and Falls Prevention","score":0.9955999851226807,"subfield":{"id":"https://openalex.org/subfields/3612","display_name":"Physical Therapy, Sports Therapy and Rehabilitation"},"field":{"id":"https://openalex.org/fields/36","display_name":"Health Professions"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/muscle-tone","display_name":"Muscle tone","score":0.6370581388473511},{"id":"https://openalex.org/keywords/midbrain","display_name":"Midbrain","score":0.6204513907432556},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6052374839782715},{"id":"https://openalex.org/keywords/neuroscience","display_name":"Neuroscience","score":0.5587142705917358},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5493629574775696},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.48566973209381104},{"id":"https://openalex.org/keywords/tone","display_name":"Tone (literature)","score":0.4831194579601288},{"id":"https://openalex.org/keywords/motor-control","display_name":"Motor control","score":0.4509139657020569},{"id":"https://openalex.org/keywords/neurophysiology","display_name":"Neurophysiology","score":0.438780277967453},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.42812037467956543},{"id":"https://openalex.org/keywords/muscle-tension","display_name":"Muscle tension","score":0.42276179790496826},{"id":"https://openalex.org/keywords/muscle-contraction","display_name":"Muscle contraction","score":0.4114339351654053},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.40842652320861816},{"id":"https://openalex.org/keywords/anatomy","display_name":"Anatomy","score":0.23220130801200867},{"id":"https://openalex.org/keywords/physical-medicine-and-rehabilitation","display_name":"Physical medicine and rehabilitation","score":0.21884164214134216},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.20659437775611877},{"id":"https://openalex.org/keywords/medicine","display_name":"Medicine","score":0.1587815284729004},{"id":"https://openalex.org/keywords/central-nervous-system","display_name":"Central nervous system","score":0.13816264271736145}],"concepts":[{"id":"https://openalex.org/C2781375409","wikidata":"https://www.wikidata.org/wiki/Q1147377","display_name":"Muscle tone","level":2,"score":0.6370581388473511},{"id":"https://openalex.org/C552161191","wikidata":"https://www.wikidata.org/wiki/Q185080","display_name":"Midbrain","level":3,"score":0.6204513907432556},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6052374839782715},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.5587142705917358},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5493629574775696},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.48566973209381104},{"id":"https://openalex.org/C2780583480","wikidata":"https://www.wikidata.org/wiki/Q1366327","display_name":"Tone (literature)","level":2,"score":0.4831194579601288},{"id":"https://openalex.org/C137813230","wikidata":"https://www.wikidata.org/wiki/Q2996165","display_name":"Motor control","level":2,"score":0.4509139657020569},{"id":"https://openalex.org/C152478114","wikidata":"https://www.wikidata.org/wiki/Q660910","display_name":"Neurophysiology","level":2,"score":0.438780277967453},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.42812037467956543},{"id":"https://openalex.org/C3018112276","wikidata":"https://www.wikidata.org/wiki/Q1147377","display_name":"Muscle tension","level":2,"score":0.42276179790496826},{"id":"https://openalex.org/C2776050358","wikidata":"https://www.wikidata.org/wiki/Q127006","display_name":"Muscle contraction","level":2,"score":0.4114339351654053},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.40842652320861816},{"id":"https://openalex.org/C105702510","wikidata":"https://www.wikidata.org/wiki/Q514","display_name":"Anatomy","level":1,"score":0.23220130801200867},{"id":"https://openalex.org/C99508421","wikidata":"https://www.wikidata.org/wiki/Q2678675","display_name":"Physical medicine and rehabilitation","level":1,"score":0.21884164214134216},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.20659437775611877},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.1587815284729004},{"id":"https://openalex.org/C529278444","wikidata":"https://www.wikidata.org/wiki/Q47273","display_name":"Central nervous system","level":2,"score":0.13816264271736145},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0},{"id":"https://openalex.org/C124952713","wikidata":"https://www.wikidata.org/wiki/Q8242","display_name":"Literature","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[{"descriptor_ui":"D001132","descriptor_name":"Arm","qualifier_ui":"Q000294","qualifier_name":"innervation","is_major_topic":true},{"descriptor_ui":"D001132","descriptor_name":"Arm","qualifier_ui":"Q000294","qualifier_name":"innervation","is_major_topic":true},{"descriptor_ui":"D001132","descriptor_name":"Arm","qualifier_ui":"Q000294","qualifier_name":"innervation","is_major_topic":true},{"descriptor_ui":"D001132","descriptor_name":"Arm","qualifier_ui":"Q000502","qualifier_name":"physiology","is_major_topic":true},{"descriptor_ui":"D001132","descriptor_name":"Arm","qualifier_ui":"Q000502","qualifier_name":"physiology","is_major_topic":true},{"descriptor_ui":"D001132","descriptor_name":"Arm","qualifier_ui":"Q000502","qualifier_name":"physiology","is_major_topic":true},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D007858","descriptor_name":"Learning","qualifier_ui":"Q000502","qualifier_name":"physiology","is_major_topic":true},{"descriptor_ui":"D007858","descriptor_name":"Learning","qualifier_ui":"Q000502","qualifier_name":"physiology","is_major_topic":true},{"descriptor_ui":"D007858","descriptor_name":"Learning","qualifier_ui":"Q000502","qualifier_name":"physiology","is_major_topic":true},{"descriptor_ui":"D008297","descriptor_name":"Male","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D008297","descriptor_name":"Male","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D008297","descriptor_name":"Male","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D008954","descriptor_name":"Models, Biological","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D008954","descriptor_name":"Models, Biological","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D008954","descriptor_name":"Models, Biological","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D009129","descriptor_name":"Muscle Tonus","qualifier_ui":"Q000502","qualifier_name":"physiology","is_major_topic":true},{"descriptor_ui":"D009129","descriptor_name":"Muscle Tonus","qualifier_ui":"Q000502","qualifier_name":"physiology","is_major_topic":true},{"descriptor_ui":"D009129","descriptor_name":"Muscle Tonus","qualifier_ui":"Q000502","qualifier_name":"physiology","is_major_topic":true},{"descriptor_ui":"D011187","descriptor_name":"Posture","qualifier_ui":"Q000502","qualifier_name":"physiology","is_major_topic":true},{"descriptor_ui":"D011187","descriptor_name":"Posture","qualifier_ui":"Q000502","qualifier_name":"physiology","is_major_topic":true},{"descriptor_ui":"D011187","descriptor_name":"Posture","qualifier_ui":"Q000502","qualifier_name":"physiology","is_major_topic":true},{"descriptor_ui":"D012054","descriptor_name":"Reinforcement, Psychology","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D012054","descriptor_name":"Reinforcement, Psychology","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D012054","descriptor_name":"Reinforcement, Psychology","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true}],"locations_count":2,"locations":[{"id":"doi:10.1162/neco_a_01333","is_oa":false,"landing_page_url":"https://doi.org/10.1162/neco_a_01333","pdf_url":null,"source":{"id":"https://openalex.org/S207023548","display_name":"Neural Computation","issn_l":"0899-7667","issn":["0899-7667","1530-888X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310315718","host_organization_name":"The MIT Press","host_organization_lineage":["https://openalex.org/P4310315718"],"host_organization_lineage_names":["The MIT Press"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Neural Computation","raw_type":"journal-article"},{"id":"pmid:33080164","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/33080164","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Neural computation","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":31,"referenced_works":["https://openalex.org/W39204140","https://openalex.org/W618252706","https://openalex.org/W1549114171","https://openalex.org/W1553636676","https://openalex.org/W1583837637","https://openalex.org/W1585565342","https://openalex.org/W1607052939","https://openalex.org/W1985358067","https://openalex.org/W1999668087","https://openalex.org/W2007487015","https://openalex.org/W2024793907","https://openalex.org/W2030092661","https://openalex.org/W2058841421","https://openalex.org/W2060052647","https://openalex.org/W2066133489","https://openalex.org/W2083027767","https://openalex.org/W2090252028","https://openalex.org/W2103756351","https://openalex.org/W2105078254","https://openalex.org/W2113501460","https://openalex.org/W2119578126","https://openalex.org/W2137352160","https://openalex.org/W2143200554","https://openalex.org/W2151906934","https://openalex.org/W2158782408","https://openalex.org/W2160485507","https://openalex.org/W2170793212","https://openalex.org/W2288407417","https://openalex.org/W2577370916","https://openalex.org/W2791988095","https://openalex.org/W4392663065"],"related_works":["https://openalex.org/W2014878821","https://openalex.org/W2970161502","https://openalex.org/W2046958837","https://openalex.org/W4240453644","https://openalex.org/W2888156133","https://openalex.org/W2349945758","https://openalex.org/W2224906852","https://openalex.org/W2038464227","https://openalex.org/W2364759712","https://openalex.org/W2177751330"],"abstract_inverted_index":{"This":[0],"letter":[1],"proposes":[2],"a":[3,20,58,140,247],"new":[4],"idea":[5],"to":[6,37,56,76,90,153,208],"improve":[7],"learning":[8,12,262,265,286],"efficiency":[9,287],"in":[10,41,81,139,223,238,253,288],"reinforcement":[11],"(RL)":[13],"with":[14,226],"the":[15,27,91,104,114,127,149,154,161,171,203,206,210,218,221,229,243,264,277],"actor-critic":[16],"method":[17],"used":[18,34],"as":[19,135],"muscle":[21,46,60,110,120,167,215,232,282],"controller":[22],"for":[23,35,63,185,199],"posture":[24,39,236,289],"stabilization":[25,237,290],"of":[26,84,93,130,174,177,195,213,220,231,242,246,261,279,281,292],"human":[28,248],"arm.":[29],"Actor-critic":[30],"RL":[31],"(ACRL)":[32],"is":[33,74],"simulations":[36],"realize":[38],"controls":[40,80],"humans":[42,293],"or":[43,87,102,294],"robots":[44],"using":[45,100,181],"tension":[47],"control.":[48],"However,":[49],"it":[50],"requires":[51],"very":[52],"high":[53],"computational":[54],"costs":[55],"acquire":[57],"better":[59],"control":[61,95,144,166],"policy":[62],"desirable":[64],"postures.":[65],"For":[66],"efficient":[67,79],"ACRL,":[68],"we":[69,158,189],"focused":[70],"on":[71,217],"embodiment":[72,230,280],"that":[73,160,169,276],"supposed":[75],"potentially":[77],"achieve":[78],"research":[82],"fields":[83],"artificial":[85],"intelligence":[86],"robotics.":[88],"According":[89],"neurophysiology":[92],"motion":[94],"obtained":[96,271],"from":[97,148,272],"experimental":[98],"studies":[99],"animals":[101],"humans,":[103],"pedunculopontine":[105],"tegmental":[106],"nucleus":[107],"(PPTn)":[108],"induces":[109,119],"tone":[111,121,233,283],"suppression,":[112],"and":[113,124,137,163,197],"midbrain":[115],"locomotor":[116],"region":[117],"(MLR)":[118],"promotion.":[122],"PPTn":[123,162,196],"MLR":[125,164,198],"modulate":[126],"activation":[128,175,211],"levels":[129,176],"mutually":[131,178],"antagonizing":[132,179],"muscles":[133,180],"such":[134],"flexors":[136],"extensors":[138],"process":[141,207],"through":[142],"which":[143],"signals":[145],"are":[146],"translated":[147],"substantia":[150],"nigra":[151],"reticulata":[152],"brain":[155],"stem.":[156],"Therefore,":[157],"hypothesized":[159],"could":[165],"tone,":[168],"is,":[170],"maximum":[172],"values":[173],"different":[182],"sigmoidal":[183],"functions":[184],"each":[186,214],"muscle;":[187],"then":[188],"introduced":[190],"antagonism":[191],"function":[192],"models":[193],"(AFMs)":[194],"individual":[200],"muscles,":[201],"incorporating":[202],"hypothesis":[204],"into":[205],"determine":[209],"level":[212],"based":[216],"output":[219],"actor":[222],"ACRL.":[224],"ACRL":[225],"AFMs":[227],"representing":[228],"successfully":[234],"achieved":[235],"five":[239],"joint":[240],"motions":[241],"right":[244],"arm":[245],"adult":[249],"male":[250],"under":[251],"gravity":[252],"predetermined":[254],"target":[255],"angles":[256],"at":[257],"an":[258],"earlier":[259],"period":[260],"than":[263],"methods":[266],"without":[267],"AFMs.":[268],"The":[269],"results":[270],"this":[273],"study":[274],"suggest":[275],"introduction":[278],"can":[284],"enhance":[285],"disorders":[291],"humanoid":[295],"robots.":[296]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1}],"updated_date":"2026-05-21T06:26:12.895304","created_date":"2025-10-10T00:00:00"}
