{"id":"https://openalex.org/W7128298045","doi":"https://doi.org/10.1007/s00500-025-10997-y","title":"A hierarchical deep reinforcement learning method for dragging and adjusting objects with dual-arm robot","display_name":"A hierarchical deep reinforcement learning method for dragging and adjusting objects with dual-arm robot","publication_year":2026,"publication_date":"2026-02-07","ids":{"openalex":"https://openalex.org/W7128298045","doi":"https://doi.org/10.1007/s00500-025-10997-y"},"language":"en","primary_location":{"id":"doi:10.1007/s00500-025-10997-y","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s00500-025-10997-y","pdf_url":"https://link.springer.com/content/pdf/10.1007/s00500-025-10997-y.pdf","source":{"id":"https://openalex.org/S65753830","display_name":"Soft Computing","issn_l":"1432-7643","issn":["1432-7643","1433-7479"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Soft Computing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/s00500-025-10997-y.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5013737563","display_name":"Saeed Saeedvand","orcid":"https://orcid.org/0000-0002-8294-8625"},"institutions":[{"id":"https://openalex.org/I134161618","display_name":"National Taiwan Normal University","ror":"https://ror.org/059dkdx38","country_code":"TW","type":"education","lineage":["https://openalex.org/I134161618"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Saeed Saeedvand","raw_affiliation_strings":["Department of Electrical Engineering, National Taiwan Normal University, Taipei, Taiwan"],"raw_orcid":"https://orcid.org/0000-0002-8294-8625","affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, National Taiwan Normal University, Taipei, Taiwan","institution_ids":["https://openalex.org/I134161618"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029102089","display_name":"Hanjaya Mandala","orcid":"https://orcid.org/0000-0002-8051-4057"},"institutions":[{"id":"https://openalex.org/I134161618","display_name":"National Taiwan Normal University","ror":"https://ror.org/059dkdx38","country_code":"TW","type":"education","lineage":["https://openalex.org/I134161618"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Hanjaya Mandala","raw_affiliation_strings":["Department of Electrical Engineering, National Taiwan Normal University, Taipei, Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, National Taiwan Normal University, Taipei, Taiwan","institution_ids":["https://openalex.org/I134161618"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007304954","display_name":"Hadi S. Aghdasi","orcid":"https://orcid.org/0000-0003-1613-7370"},"institutions":[{"id":"https://openalex.org/I41832843","display_name":"University of Tabriz","ror":"https://ror.org/01papkj44","country_code":"IR","type":"education","lineage":["https://openalex.org/I41832843"]}],"countries":["IR"],"is_corresponding":false,"raw_author_name":"Hadi S. Aghdasi","raw_affiliation_strings":["Faculty of Electrical and Computer Engineering, University of Tabriz, Tabriz, Iran"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Faculty of Electrical and Computer Engineering, University of Tabriz, Tabriz, Iran","institution_ids":["https://openalex.org/I41832843"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5083823417","display_name":"Jacky Baltes","orcid":"https://orcid.org/0000-0003-3360-1892"},"institutions":[{"id":"https://openalex.org/I134161618","display_name":"National Taiwan Normal University","ror":"https://ror.org/059dkdx38","country_code":"TW","type":"education","lineage":["https://openalex.org/I134161618"]}],"countries":["TW"],"is_corresponding":true,"raw_author_name":"Jacky Baltes","raw_affiliation_strings":["Department of Electrical Engineering, National Taiwan Normal University, Taipei, Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, National Taiwan Normal University, Taipei, Taiwan","institution_ids":["https://openalex.org/I134161618"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5083823417"],"corresponding_institution_ids":["https://openalex.org/I134161618"],"apc_list":{"value":2390,"currency":"EUR","value_usd":2990},"apc_paid":{"value":2390,"currency":"EUR","value_usd":2990},"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.24736077,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"30","issue":"4","first_page":"2303","last_page":"2319"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.8646000027656555,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.8646000027656555,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.05299999937415123,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.020800000056624413,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/slipping","display_name":"Slipping","score":0.8062999844551086},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.6525999903678894},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6110000014305115},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.5943999886512756},{"id":"https://openalex.org/keywords/position","display_name":"Position (finance)","score":0.5533000230789185},{"id":"https://openalex.org/keywords/humanoid-robot","display_name":"Humanoid robot","score":0.5386000275611877},{"id":"https://openalex.org/keywords/controller","display_name":"Controller (irrigation)","score":0.5360999703407288},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.4964999854564667}],"concepts":[{"id":"https://openalex.org/C2777045574","wikidata":"https://www.wikidata.org/wiki/Q196100","display_name":"Slipping","level":2,"score":0.8062999844551086},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7150999903678894},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.6525999903678894},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6272000074386597},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6110000014305115},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.5943999886512756},{"id":"https://openalex.org/C198082294","wikidata":"https://www.wikidata.org/wiki/Q3399648","display_name":"Position (finance)","level":2,"score":0.5533000230789185},{"id":"https://openalex.org/C60692881","wikidata":"https://www.wikidata.org/wiki/Q584529","display_name":"Humanoid robot","level":3,"score":0.5386000275611877},{"id":"https://openalex.org/C203479927","wikidata":"https://www.wikidata.org/wiki/Q5165939","display_name":"Controller (irrigation)","level":2,"score":0.5360999703407288},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5228999853134155},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.4964999854564667},{"id":"https://openalex.org/C16345878","wikidata":"https://www.wikidata.org/wiki/Q107472979","display_name":"Orientation (vector space)","level":2,"score":0.48429998755455017},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.48249998688697815},{"id":"https://openalex.org/C2775960376","wikidata":"https://www.wikidata.org/wiki/Q1435859","display_name":"Grippers","level":2,"score":0.3727000057697296},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.36230000853538513},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.35589998960494995},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.335999995470047},{"id":"https://openalex.org/C74222875","wikidata":"https://www.wikidata.org/wiki/Q16000312","display_name":"Robot kinematics","level":4,"score":0.29989999532699585},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.2962999939918518},{"id":"https://openalex.org/C65401140","wikidata":"https://www.wikidata.org/wiki/Q7353385","display_name":"Robot control","level":4,"score":0.29490000009536743},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.2775000035762787},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.26989999413490295},{"id":"https://openalex.org/C2776799497","wikidata":"https://www.wikidata.org/wiki/Q484298","display_name":"Surface (topology)","level":2,"score":0.2639000117778778},{"id":"https://openalex.org/C5339829","wikidata":"https://www.wikidata.org/wiki/Q1425977","display_name":"Machine vision","level":2,"score":0.2529999911785126}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/s00500-025-10997-y","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s00500-025-10997-y","pdf_url":"https://link.springer.com/content/pdf/10.1007/s00500-025-10997-y.pdf","source":{"id":"https://openalex.org/S65753830","display_name":"Soft Computing","issn_l":"1432-7643","issn":["1432-7643","1433-7479"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Soft Computing","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1007/s00500-025-10997-y","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s00500-025-10997-y","pdf_url":"https://link.springer.com/content/pdf/10.1007/s00500-025-10997-y.pdf","source":{"id":"https://openalex.org/S65753830","display_name":"Soft Computing","issn_l":"1432-7643","issn":["1432-7643","1433-7479"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Soft Computing","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.4440504312515259,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[{"id":"https://openalex.org/G2693593002","display_name":null,"funder_award_id":"MOST 108-2634-F-003-004","funder_id":"https://openalex.org/F4320322795","funder_display_name":"Ministry of Science and Technology, Taiwan"},{"id":"https://openalex.org/G2817843060","display_name":null,"funder_award_id":"MOST 107-2811-E-003-503","funder_id":"https://openalex.org/F4320322795","funder_display_name":"Ministry of Science and Technology, Taiwan"},{"id":"https://openalex.org/G3386439950","display_name":null,"funder_award_id":"MOST 108-2634-F-003-002","funder_id":"https://openalex.org/F4320323837","funder_display_name":"National Taiwan Normal University"},{"id":"https://openalex.org/G3739910215","display_name":null,"funder_award_id":"MOST 108-2634-F-003-003","funder_id":"https://openalex.org/F4320322795","funder_display_name":"Ministry of Science and Technology, Taiwan"},{"id":"https://openalex.org/G4162621379","display_name":null,"funder_award_id":"MOST 107","funder_id":"https://openalex.org/F4320322795","funder_display_name":"Ministry of Science and Technology, Taiwan"},{"id":"https://openalex.org/G4202958531","display_name":null,"funder_award_id":"MOST 107-","funder_id":"https://openalex.org/F4320322795","funder_display_name":"Ministry of Science and Technology, Taiwan"},{"id":"https://openalex.org/G5504915185","display_name":null,"funder_award_id":"MOST 108-2634-F-003-003","funder_id":"https://openalex.org/F4320323837","funder_display_name":"National Taiwan Normal University"},{"id":"https://openalex.org/G737106015","display_name":null,"funder_award_id":"MOST 108-","funder_id":"https://openalex.org/F4320322795","funder_display_name":"Ministry of Science and Technology, Taiwan"},{"id":"https://openalex.org/G7892752440","display_name":null,"funder_award_id":"MOST 108-2634-F-003-004","funder_id":"https://openalex.org/F4320323837","funder_display_name":"National Taiwan Normal University"},{"id":"https://openalex.org/G8116753102","display_name":null,"funder_award_id":"MOST 107-2811-E-003-503","funder_id":"https://openalex.org/F4320323837","funder_display_name":"National Taiwan Normal University"},{"id":"https://openalex.org/G8413915558","display_name":null,"funder_award_id":"MOST 108-2634-F-003-002","funder_id":"https://openalex.org/F4320322795","funder_display_name":"Ministry of Science and Technology, Taiwan"}],"funders":[{"id":"https://openalex.org/F4320322724","display_name":"Ministry of Education, India","ror":"https://ror.org/048xjjh50"},{"id":"https://openalex.org/F4320322795","display_name":"Ministry of Science and Technology, Taiwan","ror":"https://ror.org/02kv4zf79"},{"id":"https://openalex.org/F4320323837","display_name":"National Taiwan Normal University","ror":"https://ror.org/059dkdx38"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W7128298045.pdf","grobid_xml":"https://content.openalex.org/works/W7128298045.grobid-xml"},"referenced_works_count":54,"referenced_works":["https://openalex.org/W2966661","https://openalex.org/W566530810","https://openalex.org/W1977655452","https://openalex.org/W1999156278","https://openalex.org/W2025768430","https://openalex.org/W2036637075","https://openalex.org/W2041376653","https://openalex.org/W2100495367","https://openalex.org/W2112796928","https://openalex.org/W2123435073","https://openalex.org/W2136655611","https://openalex.org/W2139427956","https://openalex.org/W2145339207","https://openalex.org/W2147168033","https://openalex.org/W2160514056","https://openalex.org/W2205340216","https://openalex.org/W2400535959","https://openalex.org/W2558580397","https://openalex.org/W2562662934","https://openalex.org/W2748271646","https://openalex.org/W2767977875","https://openalex.org/W2810603385","https://openalex.org/W2888085144","https://openalex.org/W2891746250","https://openalex.org/W2906956407","https://openalex.org/W2908012943","https://openalex.org/W2913798177","https://openalex.org/W2921240487","https://openalex.org/W2921247092","https://openalex.org/W2962736495","https://openalex.org/W2963184124","https://openalex.org/W2963634205","https://openalex.org/W2964891674","https://openalex.org/W2970710335","https://openalex.org/W2971058209","https://openalex.org/W2971287348","https://openalex.org/W2973817951","https://openalex.org/W2985713881","https://openalex.org/W2988645098","https://openalex.org/W2988916019","https://openalex.org/W2994241268","https://openalex.org/W2995227139","https://openalex.org/W3003882781","https://openalex.org/W3005451807","https://openalex.org/W3021068810","https://openalex.org/W3021493720","https://openalex.org/W3088232757","https://openalex.org/W3089793705","https://openalex.org/W3167816332","https://openalex.org/W3196896805","https://openalex.org/W4231109964","https://openalex.org/W4319996185","https://openalex.org/W4360994086","https://openalex.org/W4361029804"],"related_works":[],"abstract_inverted_index":{"In":[0,47],"spite":[1],"of":[2,70,84,112,172,181],"the":[3,38,67,71,79,85,88,110,113,120,130,137,167,173],"ease":[4],"with":[5,43,74,176,192],"which":[6],"humans":[7],"can":[8,33],"pick":[9],"up":[10],"and":[11,19,81,115,147,169,185,187],"use":[12,155],"objects,":[13,158],"object":[14,64,86,132],"manipulation":[15,55],"remains":[16],"a":[17,44,100,125,149],"popular":[18],"challenging":[20],"research":[21],"topic":[22],"even":[23],"after":[24],"many":[25],"decades.":[26],"The":[27],"object\u2019s":[28],"shape,":[29],"weight,":[30],"or":[31,59],"position":[32],"make":[34],"it":[35,42],"impossible":[36],"for":[37],"robot":[39],"to":[40,128],"manipulate":[41],"single":[45],"arm.":[46],"such":[48],"situations,":[49],"dual-arm":[50,131],"manipulators":[51],"are":[52],"needed.":[53],"Furthermore,":[54],"may":[56],"require":[57],"dragging":[58,133],"pushing":[60],"objects.":[61],"Dragging":[62],"an":[63,177],"while":[65],"considering":[66],"desired":[68],"orientation":[69],"object,":[72],"along":[73],"uncertainties":[75],"like":[76],"friction":[77],"on":[78,119,148,195],"surface":[80],"possible":[82],"slipping":[83],"in":[87,95,145,183,189],"robot\u2019s":[89],"hands,":[90],"is":[91],"very":[92],"challenging.":[93],"Therefore,":[94],"this":[96],"paper,":[97],"we":[98,140],"introduce":[99],"novel":[101],"hierarchical":[102],"deep":[103],"deterministic":[104],"policy":[105],"gradient":[106],"(HDDPG)":[107],"that":[108],"exploits":[109],"continuity":[111],"state":[114],"action":[116],"spaces":[117],"based":[118],"actor-critic,":[121],"model-free":[122],"algorithm":[123],"as":[124],"strategy":[126],"controller":[127],"solve":[129],"problem.":[134],"To":[135],"evaluate":[136],"proposed":[138,174],"algorithm,":[139,175],"conduct":[141],"extensive":[142],"experiments":[143,165],"both":[144],"simulation":[146],"real":[150,190],"adult-sized":[151],"humanoid":[152],"robot.":[153],"We":[154],"13":[156],"different":[157,197],"including":[159],"keyboards,":[160],"laptops,":[161],"boxes,":[162],"etc.":[163],"These":[164],"demonstrate":[166],"effectiveness":[168],"high":[170],"performance":[171],"average":[178],"success":[179],"rate":[180],"97.3%":[182],"simulations":[184],"93.84%":[186],"91.69%":[188],"environments,":[191],"1560":[193],"attempts":[194],"two":[196],"surfaces.":[198]},"counts_by_year":[],"updated_date":"2026-05-03T08:25:01.440150","created_date":"2026-02-08T00:00:00"}
