{"id":"https://openalex.org/W4409102059","doi":"https://doi.org/10.1109/jiot.2025.3557007","title":"Optimized Impedance Control for Biped Robots in IUA Using Reinforcement Learning and Quadratic Programming","display_name":"Optimized Impedance Control for Biped Robots in IUA Using Reinforcement Learning and Quadratic Programming","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4409102059","doi":"https://doi.org/10.1109/jiot.2025.3557007"},"language":"en","primary_location":{"id":"doi:10.1109/jiot.2025.3557007","is_oa":false,"landing_page_url":"https://doi.org/10.1109/jiot.2025.3557007","pdf_url":null,"source":{"id":"https://openalex.org/S2480266640","display_name":"IEEE Internet of Things Journal","issn_l":"2327-4662","issn":["2327-4662","2372-2541"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Internet of Things Journal","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5037626649","display_name":"Yunfeng Hou","orcid":"https://orcid.org/0000-0001-9531-902X"},"institutions":[{"id":"https://openalex.org/I148128674","display_name":"University of Shanghai for Science and Technology","ror":"https://ror.org/00ay9v204","country_code":"CN","type":"education","lineage":["https://openalex.org/I148128674"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yunfeng Hou","raw_affiliation_strings":["Institute of Machine Intelligence, University of Shanghai for Science and Technology, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Institute of Machine Intelligence, University of Shanghai for Science and Technology, Shanghai, China","institution_ids":["https://openalex.org/I148128674"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071921583","display_name":"Jun Tang","orcid":"https://orcid.org/0000-0002-5819-7083"},"institutions":[{"id":"https://openalex.org/I148128674","display_name":"University of Shanghai for Science and Technology","ror":"https://ror.org/00ay9v204","country_code":"CN","type":"education","lineage":["https://openalex.org/I148128674"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jun Tang","raw_affiliation_strings":["Institute of Machine Intelligence, University of Shanghai for Science and Technology, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Institute of Machine Intelligence, University of Shanghai for Science and Technology, Shanghai, China","institution_ids":["https://openalex.org/I148128674"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100622932","display_name":"Zhiyuan Ma","orcid":"https://orcid.org/0000-0003-2153-5824"},"institutions":[{"id":"https://openalex.org/I148128674","display_name":"University of Shanghai for Science and Technology","ror":"https://ror.org/00ay9v204","country_code":"CN","type":"education","lineage":["https://openalex.org/I148128674"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhiyuan Ma","raw_affiliation_strings":["Institute of Machine Intelligence, University of Shanghai for Science and Technology, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Institute of Machine Intelligence, University of Shanghai for Science and Technology, Shanghai, China","institution_ids":["https://openalex.org/I148128674"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5104473592","display_name":"Jialong Li","orcid":"https://orcid.org/0000-0003-4327-1807"},"institutions":[{"id":"https://openalex.org/I148128674","display_name":"University of Shanghai for Science and Technology","ror":"https://ror.org/00ay9v204","country_code":"CN","type":"education","lineage":["https://openalex.org/I148128674"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jialong Li","raw_affiliation_strings":["Institute of Machine Intelligence, University of Shanghai for Science and Technology, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Institute of Machine Intelligence, University of Shanghai for Science and Technology, Shanghai, China","institution_ids":["https://openalex.org/I148128674"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100318147","display_name":"Wei Li","orcid":"https://orcid.org/0000-0002-2621-1821"},"institutions":[{"id":"https://openalex.org/I146613903","display_name":"Shanghai Lixin University of Accounting and Finance","ror":"https://ror.org/02g81yf77","country_code":"CN","type":"education","lineage":["https://openalex.org/I146613903"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Li","raw_affiliation_strings":["School of Finance, Shanghai Lixin University of Accounting and Finance, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"School of Finance, Shanghai Lixin University of Accounting and Finance, Shanghai, China","institution_ids":["https://openalex.org/I146613903"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5037626649"],"corresponding_institution_ids":["https://openalex.org/I148128674"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.06139129,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"1"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12810","display_name":"Real-time simulation and control systems","score":0.9815000295639038,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12784","display_name":"Modular Robots and Swarm Intelligence","score":0.9279000163078308,"subfield":{"id":"https://openalex.org/subfields/2210","display_name":"Mechanical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7632416486740112},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7600294351577759},{"id":"https://openalex.org/keywords/quadratic-programming","display_name":"Quadratic programming","score":0.6161811947822571},{"id":"https://openalex.org/keywords/electrical-impedance","display_name":"Electrical impedance","score":0.47392258048057556},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.47161605954170227},{"id":"https://openalex.org/keywords/impedance-control","display_name":"Impedance control","score":0.4600415825843811},{"id":"https://openalex.org/keywords/quadratic-equation","display_name":"Quadratic equation","score":0.45877963304519653},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.4191013276576996},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.3811982274055481},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.3213489353656769},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2718116044998169},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.11752080917358398},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.11074572801589966},{"id":"https://openalex.org/keywords/electrical-engineering","display_name":"Electrical engineering","score":0.07488396763801575}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7632416486740112},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7600294351577759},{"id":"https://openalex.org/C81845259","wikidata":"https://www.wikidata.org/wiki/Q290117","display_name":"Quadratic programming","level":2,"score":0.6161811947822571},{"id":"https://openalex.org/C17829176","wikidata":"https://www.wikidata.org/wiki/Q179043","display_name":"Electrical impedance","level":2,"score":0.47392258048057556},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.47161605954170227},{"id":"https://openalex.org/C2777984285","wikidata":"https://www.wikidata.org/wiki/Q17098134","display_name":"Impedance control","level":3,"score":0.4600415825843811},{"id":"https://openalex.org/C129844170","wikidata":"https://www.wikidata.org/wiki/Q41299","display_name":"Quadratic equation","level":2,"score":0.45877963304519653},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.4191013276576996},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.3811982274055481},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.3213489353656769},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2718116044998169},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.11752080917358398},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.11074572801589966},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.07488396763801575},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/jiot.2025.3557007","is_oa":false,"landing_page_url":"https://doi.org/10.1109/jiot.2025.3557007","pdf_url":null,"source":{"id":"https://openalex.org/S2480266640","display_name":"IEEE Internet of Things Journal","issn_l":"2327-4662","issn":["2327-4662","2372-2541"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Internet of Things Journal","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3732979887","display_name":null,"funder_award_id":"62403323","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":28,"referenced_works":["https://openalex.org/W1496975397","https://openalex.org/W1957820804","https://openalex.org/W1991087840","https://openalex.org/W2059721481","https://openalex.org/W2074042377","https://openalex.org/W2081128650","https://openalex.org/W2106863585","https://openalex.org/W2162207896","https://openalex.org/W2295584263","https://openalex.org/W2345598630","https://openalex.org/W2920964950","https://openalex.org/W2940807311","https://openalex.org/W2966463142","https://openalex.org/W3028314871","https://openalex.org/W3035078642","https://openalex.org/W3094267028","https://openalex.org/W3122470770","https://openalex.org/W3134349630","https://openalex.org/W3217144149","https://openalex.org/W4285212922","https://openalex.org/W4285307873","https://openalex.org/W4309669389","https://openalex.org/W4312707215","https://openalex.org/W4321195885","https://openalex.org/W4321484266","https://openalex.org/W4386280880","https://openalex.org/W4388270223","https://openalex.org/W4391785548"],"related_works":["https://openalex.org/W1548357495","https://openalex.org/W2314048082","https://openalex.org/W1968487248","https://openalex.org/W2097006611","https://openalex.org/W4295916778","https://openalex.org/W3036464408","https://openalex.org/W2020990755","https://openalex.org/W2112995122","https://openalex.org/W2377851227","https://openalex.org/W2165087119"],"abstract_inverted_index":{"In":[0],"the":[1,4,42,55,97,115,125,150,161],"field":[2],"of":[3,6,44,58,100],"Internet":[5],"Unmanned":[7],"Agents":[8],"(IUA),":[9],"autonomous":[10],"devices":[11],"often":[12],"struggle":[13],"to":[14,34,66,87],"maintain":[15],"stability,":[16],"adaptability,":[17],"and":[18,40,70,91,107,119,145,153],"coordination":[19,43,154],"in":[20,60,122,155,167],"dynamic":[21],"environments.":[22],"Current":[23],"control":[24,72,138],"strategies":[25],"are":[26],"hindered":[27],"by":[28],"difficulties":[29],"such":[30],"as":[31],"real-time":[32],"adaptation":[33],"environmental":[35],"changes,":[36],"handling":[37],"sensor":[38],"noise,":[39],"managing":[41],"multiple":[45,143],"agents":[46],"under":[47],"complex,":[48],"variable":[49],"task":[50],"constraints.":[51,146],"These":[52],"challenges":[53],"limit":[54],"practical":[56],"deployment":[57],"robots":[59],"IUA":[61,168],"systems,":[62],"making":[63],"it":[64],"crucial":[65],"develop":[67],"more":[68],"robust":[69],"efficient":[71],"methods.":[73],"To":[74],"address":[75],"these":[76],"issues,":[77],"we":[78],"propose":[79],"a":[80],"reinforcement":[81,104],"learning-based":[82],"impedance":[83,95],"coefficient":[84],"optimization":[85],"approach":[86,112],"improve":[88],"robots\u2019":[89,151],"stability":[90],"responsiveness.":[92],"By":[93],"integrating":[94],"control,":[96],"Divergent":[98],"Component":[99],"Motion":[101],"(DCM)":[102],"model,":[103],"learning":[105],"(RL),":[106],"quadratic":[108],"programming":[109],"(QP),":[110],"this":[111],"dynamically":[113],"adjusts":[114],"robot\u2019s":[116],"stiffness,":[117],"damping,":[118],"inertia":[120],"coefficients":[121],"real-time.":[123],"Specifically,":[124],"Soft":[126],"Actor-Critic":[127],"(SAC)":[128],"algorithm":[129],"is":[130],"used":[131],"for":[132],"optimization,":[133],"while":[134],"QP":[135],"ensures":[136],"that":[137],"forces":[139],"remain":[140],"feasible":[141],"across":[142],"tasks":[144],"This":[147],"strategy":[148],"enhances":[149],"adaptability":[152],"complex":[156],"IUA.":[157],"Experimental":[158],"results":[159],"validate":[160],"approach,":[162],"significantly":[163],"improving":[164],"robot":[165],"performance":[166],"systems.":[169]},"counts_by_year":[],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
