{"id":"https://openalex.org/W4415482115","doi":"https://doi.org/10.1109/tcst.2025.3619986","title":"Efficient Exploration in Large State-Action Space Through Structured Action Space for Learning Multirobots Motion Planning","display_name":"Efficient Exploration in Large State-Action Space Through Structured Action Space for Learning Multirobots Motion Planning","publication_year":2025,"publication_date":"2025-10-23","ids":{"openalex":"https://openalex.org/W4415482115","doi":"https://doi.org/10.1109/tcst.2025.3619986"},"language":null,"primary_location":{"id":"doi:10.1109/tcst.2025.3619986","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcst.2025.3619986","pdf_url":null,"source":{"id":"https://openalex.org/S133363738","display_name":"IEEE Transactions on Control Systems Technology","issn_l":"1063-6536","issn":["1063-6536","1558-0865","2374-0159"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Control Systems Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5057898837","display_name":"Chaoxu Mu","orcid":"https://orcid.org/0000-0003-1055-9513"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Chaoxu Mu","raw_affiliation_strings":["School of Electrical and Information Engineering, Tianjin University, Tianjin, China"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Information Engineering, Tianjin University, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018783984","display_name":"Zewu Jiang","orcid":null},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zewu Jiang","raw_affiliation_strings":["School of Electrical and Information Engineering, Tianjin University, Tianjin, China"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Information Engineering, Tianjin University, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003736415","display_name":"Jiadong Zhang","orcid":"https://orcid.org/0009-0004-1042-5421"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Junnan Zhang","raw_affiliation_strings":["School of Electrical and Information Engineering, Tianjin University, Tianjin, China"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Information Engineering, Tianjin University, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040414354","display_name":"Ke Wang","orcid":"https://orcid.org/0000-0002-8306-1663"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ke Wang","raw_affiliation_strings":["School of Electrical and Information Engineering, Tianjin University, Tianjin, China"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Information Engineering, Tianjin University, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053112608","display_name":"Xin Xu","orcid":"https://orcid.org/0000-0003-3238-745X"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xin Xu","raw_affiliation_strings":["College of Intelligence Science and Technology, National University of Defense Technology, Changsha, China"],"affiliations":[{"raw_affiliation_string":"College of Intelligence Science and Technology, National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100620233","display_name":"Jun Yi","orcid":"https://orcid.org/0000-0001-9154-6620"},"institutions":[{"id":"https://openalex.org/I168337820","display_name":"Chongqing University of Science and Technology","ror":"https://ror.org/03n3v6d52","country_code":"CN","type":"education","lineage":["https://openalex.org/I168337820"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jun Yi","raw_affiliation_strings":["College of Electronic and Information Engineering, Chongqing University of Science and Technology, Chongqing, China"],"affiliations":[{"raw_affiliation_string":"College of Electronic and Information Engineering, Chongqing University of Science and Technology, Chongqing, China","institution_ids":["https://openalex.org/I168337820"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5057898837"],"corresponding_institution_ids":["https://openalex.org/I162868743"],"apc_list":null,"apc_paid":null,"fwci":2.4362,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.91002529,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":98},"biblio":{"volume":"34","issue":"1","first_page":"304","last_page":"317"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.993399977684021,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.993399977684021,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13382","display_name":"Robotics and Automated Systems","score":0.9807000160217285,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9613999724388123,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/workspace","display_name":"Workspace","score":0.7786999940872192},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7378000020980835},{"id":"https://openalex.org/keywords/flexibility","display_name":"Flexibility (engineering)","score":0.7163000106811523},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.6371999979019165},{"id":"https://openalex.org/keywords/motion","display_name":"Motion (physics)","score":0.5981000065803528},{"id":"https://openalex.org/keywords/motion-planning","display_name":"Motion planning","score":0.5891000032424927},{"id":"https://openalex.org/keywords/space","display_name":"Space (punctuation)","score":0.5338000059127808},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.5303999781608582},{"id":"https://openalex.org/keywords/collision-avoidance","display_name":"Collision avoidance","score":0.5073000192642212}],"concepts":[{"id":"https://openalex.org/C58581272","wikidata":"https://www.wikidata.org/wiki/Q12741163","display_name":"Workspace","level":3,"score":0.7786999940872192},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7378000020980835},{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.7163000106811523},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6547999978065491},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.6371999979019165},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.5981000065803528},{"id":"https://openalex.org/C81074085","wikidata":"https://www.wikidata.org/wiki/Q366872","display_name":"Motion planning","level":3,"score":0.5891000032424927},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5608000159263611},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.5338000059127808},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.5303999781608582},{"id":"https://openalex.org/C2780864053","wikidata":"https://www.wikidata.org/wiki/Q5147495","display_name":"Collision avoidance","level":3,"score":0.5073000192642212},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.42320001125335693},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.4104999899864197},{"id":"https://openalex.org/C145565327","wikidata":"https://www.wikidata.org/wiki/Q852514","display_name":"Motion control","level":3,"score":0.39320001006126404},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.35370001196861267},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.33820000290870667},{"id":"https://openalex.org/C18762648","wikidata":"https://www.wikidata.org/wiki/Q42213","display_name":"Work (physics)","level":2,"score":0.3328000009059906},{"id":"https://openalex.org/C188116033","wikidata":"https://www.wikidata.org/wiki/Q2664563","display_name":"Q-learning","level":3,"score":0.3255000114440918},{"id":"https://openalex.org/C104060986","wikidata":"https://www.wikidata.org/wiki/Q180046","display_name":"Space exploration","level":2,"score":0.32100000977516174},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.2937000095844269},{"id":"https://openalex.org/C17500928","wikidata":"https://www.wikidata.org/wiki/Q959968","display_name":"Control system","level":2,"score":0.29109999537467957},{"id":"https://openalex.org/C65401140","wikidata":"https://www.wikidata.org/wiki/Q7353385","display_name":"Robot control","level":4,"score":0.2799000144004822},{"id":"https://openalex.org/C39920418","wikidata":"https://www.wikidata.org/wiki/Q11476","display_name":"Kinematics","level":2,"score":0.2768999934196472},{"id":"https://openalex.org/C74222875","wikidata":"https://www.wikidata.org/wiki/Q16000312","display_name":"Robot kinematics","level":4,"score":0.2694000005722046},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.2655999958515167},{"id":"https://openalex.org/C121704057","wikidata":"https://www.wikidata.org/wiki/Q352070","display_name":"Collision","level":2,"score":0.26460000872612},{"id":"https://openalex.org/C188888258","wikidata":"https://www.wikidata.org/wiki/Q7353390","display_name":"Robot learning","level":4,"score":0.25690001249313354}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcst.2025.3619986","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcst.2025.3619986","pdf_url":null,"source":{"id":"https://openalex.org/S133363738","display_name":"IEEE Transactions on Control Systems Technology","issn_l":"1063-6536","issn":["1063-6536","1558-0865","2374-0159"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Control Systems Technology","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G7181085981","display_name":null,"funder_award_id":"62503356","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":25,"referenced_works":["https://openalex.org/W1974795838","https://openalex.org/W2005354226","https://openalex.org/W2028945152","https://openalex.org/W2065883524","https://openalex.org/W2070665593","https://openalex.org/W2077758943","https://openalex.org/W2103120971","https://openalex.org/W2128990851","https://openalex.org/W2141664020","https://openalex.org/W2142431032","https://openalex.org/W2144293566","https://openalex.org/W2618530766","https://openalex.org/W2887129694","https://openalex.org/W2950069298","https://openalex.org/W2965676832","https://openalex.org/W2967969632","https://openalex.org/W3004407706","https://openalex.org/W3018036994","https://openalex.org/W3047385205","https://openalex.org/W3094490555","https://openalex.org/W3210288250","https://openalex.org/W4200438872","https://openalex.org/W4229066299","https://openalex.org/W4319165238","https://openalex.org/W4385462854"],"related_works":[],"abstract_inverted_index":{"Multirobots":[0],"tasks,":[1],"such":[2,21],"as":[3],"collaborative":[4],"motion":[5,29,60,74],"planning":[6,61,75],"or":[7],"flexible":[8],"parts":[9],"assembly,":[10],"are":[11,107],"complex":[12],"for":[13,20,96],"autonomous":[14],"robot":[15,18],"operations.":[16],"The":[17],"system":[19],"tasks":[22,56,98,189,208],"would":[23],"need":[24],"a":[25,115,158],"combination":[26,127],"of":[27,89,128,143],"multigoal":[28,97],"control":[30,63],"and":[31,46,62,85,135,170,192,194,209],"collision":[32],"avoidance":[33],"in":[34,103,174],"the":[35,93,120,126,151,206],"shared":[36],"workspace.":[37],"For":[38],"reinforcement":[39],"learning":[40],"(RL)-based":[41],"methods":[42,50],"with":[43,153,195],"enhanced":[44],"flexibility":[45],"broader":[47],"applicability,":[48],"these":[49,111],"struggle":[51],"to":[52,77,118,164],"effectively":[53],"handle":[54],"intricate":[55],"that":[57,132,140,182],"require":[58],"collision-free":[59],"across":[64],"long":[65],"time":[66,198],"horizons.":[67],"Current":[68],"RL":[69,161],"systems":[70],"cannot":[71],"achieve":[72],"efficiently":[73,191],"due":[76],"high":[78],"degrees-of-freedom":[79],"(DoF),":[80],"large-scale":[81,121],"continuous":[82,122,137],"action":[83,123,130,138,146],"space,":[84],"tightly":[86],"coupled":[87],"workspaces":[88],"multirobot":[90],"system.":[91],"Additionally,":[92],"exploration":[94,134],"efficiency":[95],"is":[99,203],"typically":[100],"low,":[101],"particularly":[102],"scenarios":[104],"where":[105],"rewards":[106],"scarce.":[108],"To":[109,149],"tackle":[110],"issues,":[112],"we":[113,156],"propose":[114],"new":[116],"method":[117],"decompose":[119],"space":[124,131,139,147],"into":[125],"discrete":[129],"enhances":[133,141],"small-scale":[136],"accuracy":[142],"structured":[144],"hybrid":[145],"(SHAS).":[148],"train":[150,165],"model":[152,184],"SHAS":[154],"efficiently,":[155],"develop":[157],"task-conditioned":[159],"hierarchical":[160],"(TC-HRL)":[162],"framework":[163],"both":[166],"high-level":[167],"(HL)":[168],"policy":[169,173],"low-level":[171],"(LL)":[172],"parallel.":[175],"Comparative":[176],"experiments":[177],"from":[178],"different":[179],"perspectives":[180],"demonstrate":[181],"our":[183,201],"can":[185],"learn":[186],"multirobots":[187],"manipulation":[188],"more":[190],"stably,":[193],"considerably":[196],"less":[197],"consumption.":[199],"Finally,":[200],"work":[202],"verified":[204],"by":[205],"pick-grasp":[207],"real":[210],"manipulators":[211],"experiments.":[212]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-23T00:00:00"}
