{"id":"https://openalex.org/W4410771875","doi":"https://doi.org/10.1109/tase.2025.3574162","title":"Explicit-Implicit Subgoal Planning for Long-Horizon Tasks With Sparse Rewards","display_name":"Explicit-Implicit Subgoal Planning for Long-Horizon Tasks With Sparse Rewards","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4410771875","doi":"https://doi.org/10.1109/tase.2025.3574162"},"language":"en","primary_location":{"id":"doi:10.1109/tase.2025.3574162","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tase.2025.3574162","pdf_url":null,"source":{"id":"https://openalex.org/S34881539","display_name":"IEEE Transactions on Automation Science and Engineering","issn_l":"1545-5955","issn":["1545-5955","1558-3783"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Automation Science and Engineering","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5088586965","display_name":"Fangyuan Wang","orcid":"https://orcid.org/0000-0002-7492-632X"},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["HK"],"is_corresponding":true,"raw_author_name":"Fangyuan Wang","raw_affiliation_strings":["Department of Mechanical Engineering, The Hong Kong Polytechnic University, Hung Hom, Hong Kong","Department of Mechanical Engineering, The Hong Kong Polytechnic University, Kowloon, Hong Kong, China"],"affiliations":[{"raw_affiliation_string":"Department of Mechanical Engineering, The Hong Kong Polytechnic University, Hung Hom, Hong Kong","institution_ids":["https://openalex.org/I14243506"]},{"raw_affiliation_string":"Department of Mechanical Engineering, The Hong Kong Polytechnic University, Kowloon, Hong Kong, China","institution_ids":["https://openalex.org/I14243506"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077958416","display_name":"Anqing Duan","orcid":"https://orcid.org/0000-0002-9666-018X"},"institutions":[{"id":"https://openalex.org/I4210113480","display_name":"Mohamed bin Zayed University of Artificial Intelligence","ror":"https://ror.org/0258gkt32","country_code":"AE","type":"education","lineage":["https://openalex.org/I4210113480"]}],"countries":["AE"],"is_corresponding":false,"raw_author_name":"Anqing Duan","raw_affiliation_strings":["Robotics Department, Mohamed Bin Zayed University of Artificial Intelligence (MBZUAI), Abu Dhabi, United Arab Emirates"],"affiliations":[{"raw_affiliation_string":"Robotics Department, Mohamed Bin Zayed University of Artificial Intelligence (MBZUAI), Abu Dhabi, United Arab Emirates","institution_ids":["https://openalex.org/I4210113480"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Peng Zhou","orcid":"https://orcid.org/0000-0002-7020-0943"},"institutions":[{"id":"https://openalex.org/I4396570619","display_name":"Great Bay University","ror":"https://ror.org/01hdgge16","country_code":null,"type":"education","lineage":["https://openalex.org/I4396570619"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Peng Zhou","raw_affiliation_strings":["School of Advanced Engineering, Great Bay University, Dongguan, China","School of Advanced Engineering, The Great Bay University, Dongguan, China"],"affiliations":[{"raw_affiliation_string":"School of Advanced Engineering, Great Bay University, Dongguan, China","institution_ids":["https://openalex.org/I4396570619"]},{"raw_affiliation_string":"School of Advanced Engineering, The Great Bay University, Dongguan, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025311829","display_name":"Shengzeng Huo","orcid":"https://orcid.org/0000-0002-7652-8958"},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Shengzeng Huo","raw_affiliation_strings":["Department of Mechanical Engineering, The Hong Kong Polytechnic University, Hung Hom, Hong Kong","Department of Mechanical Engineering, The Hong Kong Polytechnic University, Kowloon, Hong Kong, China"],"affiliations":[{"raw_affiliation_string":"Department of Mechanical Engineering, The Hong Kong Polytechnic University, Hung Hom, Hong Kong","institution_ids":["https://openalex.org/I14243506"]},{"raw_affiliation_string":"Department of Mechanical Engineering, The Hong Kong Polytechnic University, Kowloon, Hong Kong, China","institution_ids":["https://openalex.org/I14243506"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085022758","display_name":"Guodong Guo","orcid":"https://orcid.org/0000-0001-9583-0055"},"institutions":[{"id":"https://openalex.org/I4210165339","display_name":"Ningbo Institute of Industrial Technology","ror":"https://ror.org/05nqg3g04","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165339"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guodong Guo","raw_affiliation_strings":["Ningbo Institute of Digital Twin and Zhejiang Key Laboratory of Industrial Intelligence and Digital Twin, Eastern Institute of Technology (EIT), Ningbo, China","Ningbo Institute of Digital Twin and the Zhejiang Key Laboratory of Industrial Intelligence and Digital Twin, Eastern Institute of Technology (EIT), Ningbo, China"],"affiliations":[{"raw_affiliation_string":"Ningbo Institute of Digital Twin and Zhejiang Key Laboratory of Industrial Intelligence and Digital Twin, Eastern Institute of Technology (EIT), Ningbo, China","institution_ids":["https://openalex.org/I4210165339"]},{"raw_affiliation_string":"Ningbo Institute of Digital Twin and the Zhejiang Key Laboratory of Industrial Intelligence and Digital Twin, Eastern Institute of Technology (EIT), Ningbo, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019906827","display_name":"Chenguang Yang","orcid":"https://orcid.org/0000-0001-5255-5559"},"institutions":[{"id":"https://openalex.org/I146655781","display_name":"University of Liverpool","ror":"https://ror.org/04xs57h96","country_code":"GB","type":"education","lineage":["https://openalex.org/I146655781"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Chenguang Yang","raw_affiliation_strings":["Department of Computer Science, University of Liverpool, Liverpool, U.K","Department of Computer Science, University of Liverpool, Liverpool, UK"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Liverpool, Liverpool, U.K","institution_ids":["https://openalex.org/I146655781"]},{"raw_affiliation_string":"Department of Computer Science, University of Liverpool, Liverpool, UK","institution_ids":["https://openalex.org/I146655781"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5056734737","display_name":"David Navarro-Alarc\u00f3n","orcid":"https://orcid.org/0000-0002-3426-6638"},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"David Navarro-Alarcon","raw_affiliation_strings":["Department of Mechanical Engineering, The Hong Kong Polytechnic University, Hung Hom, Hong Kong","Department of Mechanical Engineering, The Hong Kong Polytechnic University, Kowloon, Hong Kong, China"],"affiliations":[{"raw_affiliation_string":"Department of Mechanical Engineering, The Hong Kong Polytechnic University, Hung Hom, Hong Kong","institution_ids":["https://openalex.org/I14243506"]},{"raw_affiliation_string":"Department of Mechanical Engineering, The Hong Kong Polytechnic University, Kowloon, Hong Kong, China","institution_ids":["https://openalex.org/I14243506"]}]}],"institutions":[],"countries_distinct_count":4,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5088586965"],"corresponding_institution_ids":["https://openalex.org/I14243506"],"apc_list":null,"apc_paid":null,"fwci":4.6468,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.94681608,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":98},"biblio":{"volume":"22","issue":null,"first_page":"16038","last_page":"16049"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10571","display_name":"Robotic Mechanisms and Dynamics","score":0.9628999829292297,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10571","display_name":"Robotic Mechanisms and Dynamics","score":0.9628999829292297,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9567000269889832,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10906","display_name":"AI-based Problem Solving and Planning","score":0.9423999786376953,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5425567626953125},{"id":"https://openalex.org/keywords/horizon","display_name":"Horizon","score":0.4182608425617218},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.412430077791214},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.3873046338558197},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.24992787837982178}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5425567626953125},{"id":"https://openalex.org/C159176650","wikidata":"https://www.wikidata.org/wiki/Q43261","display_name":"Horizon","level":2,"score":0.4182608425617218},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.412430077791214},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.3873046338558197},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.24992787837982178},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tase.2025.3574162","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tase.2025.3574162","pdf_url":null,"source":{"id":"https://openalex.org/S34881539","display_name":"IEEE Transactions on Automation Science and Engineering","issn_l":"1545-5955","issn":["1545-5955","1558-3783"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Automation Science and Engineering","raw_type":"journal-article"},{"id":"pmh:oai:ira.lib.polyu.edu.hk:10397/113802","is_oa":false,"landing_page_url":"http://hdl.handle.net/10397/113802","pdf_url":null,"source":{"id":"https://openalex.org/S4306400205","display_name":"PolyU Institutional Research Archive (Hong Kong Polytechnic University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I14243506","host_organization_name":"Hong Kong Polytechnic University","host_organization_lineage":["https://openalex.org/I14243506"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":null,"raw_type":"Journal/Magazine Article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1554606642","display_name":null,"funder_award_id":"C4042-23GF","funder_id":"https://openalex.org/F4320321592","funder_display_name":"Research Grants Council, University Grants Committee"},{"id":"https://openalex.org/G1856402315","display_name":null,"funder_award_id":"220724983","funder_id":"https://openalex.org/F4320323537","funder_display_name":"Hong Kong University of Science and Technology"},{"id":"https://openalex.org/G1976017976","display_name":null,"funder_award_id":"15231023","funder_id":"https://openalex.org/F4320321592","funder_display_name":"Research Grants Council, University Grants Committee"},{"id":"https://openalex.org/G2761890982","display_name":null,"funder_award_id":"15212721","funder_id":"https://openalex.org/F4320321592","funder_display_name":"Research Grants Council, University Grants Committee"}],"funders":[{"id":"https://openalex.org/F4320321592","display_name":"Research Grants Council, University Grants Committee","ror":"https://ror.org/00djwmt25"},{"id":"https://openalex.org/F4320323537","display_name":"Hong Kong University of Science and Technology","ror":"https://ror.org/00q4vv597"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":46,"referenced_works":["https://openalex.org/W2060914855","https://openalex.org/W2064675550","https://openalex.org/W2109910161","https://openalex.org/W2225156818","https://openalex.org/W2752796333","https://openalex.org/W2906487027","https://openalex.org/W2963099939","https://openalex.org/W3026627579","https://openalex.org/W3169676024","https://openalex.org/W3200958309","https://openalex.org/W4251436587","https://openalex.org/W4285601030","https://openalex.org/W4289716892","https://openalex.org/W4310849374","https://openalex.org/W4312282783","https://openalex.org/W4375870244","https://openalex.org/W4382465352","https://openalex.org/W4385757466","https://openalex.org/W4389667118","https://openalex.org/W4391529362","https://openalex.org/W4401414182","https://openalex.org/W4401417060","https://openalex.org/W4402753827","https://openalex.org/W6616173779","https://openalex.org/W6640963894","https://openalex.org/W6687045409","https://openalex.org/W6738543193","https://openalex.org/W6740801417","https://openalex.org/W6747473740","https://openalex.org/W6752089545","https://openalex.org/W6753060773","https://openalex.org/W6755655695","https://openalex.org/W6755934310","https://openalex.org/W6756684005","https://openalex.org/W6759871227","https://openalex.org/W6763356705","https://openalex.org/W6767649332","https://openalex.org/W6767862010","https://openalex.org/W6772623567","https://openalex.org/W6776601253","https://openalex.org/W6779780899","https://openalex.org/W6790601966","https://openalex.org/W6797805403","https://openalex.org/W6800425027","https://openalex.org/W6846871237","https://openalex.org/W6857236505"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"The":[0,79,186],"challenges":[1],"inherent":[2],"in":[3,6,18,159,179],"long-horizon":[4,41,177],"tasks":[5,42,178],"robotics":[7],"persist":[8],"due":[9],"to":[10,39,55,87,94,143,162,200],"the":[11,57,60,96,110,121,126,133,145,148,152,156,164,183,211],"typical":[12],"inefficient":[13],"exploration":[14],"and":[15,53,75,90,113,129,182,189],"sparse":[16],"rewards":[17],"traditional":[19],"reinforcement":[20,160],"learning":[21,161],"approaches.":[22],"To":[23,170],"address":[24],"these":[25],"challenges,":[26],"we":[27,174],"have":[28],"developed":[29],"a":[30,44,68,72,76],"novel":[31],"algorithm,":[32],"termed":[33],"hlexplicit-implicit":[34],"subgoal":[35,70,81,168],"planning":[36],"(EISP),":[37],"designed":[38],"tackle":[40],"through":[43],"divide-and-conquer":[45],"approach.":[46],"We":[47],"utilize":[48],"two":[49],"primary":[50],"criteria,":[51],"feasibility":[52,146],"optimality,":[54],"ensure":[56],"quality":[58],"of":[59,65,102,147],"generated":[61,149],"subgoals.":[62,131,150],"EISP":[63],"consists":[64],"three":[66],"components:":[67],"hybrid":[69,80],"generator,":[71],"hindsight":[73,134],"sampler,":[74],"value":[77,153,157],"selector.":[78],"generator":[82],"uses":[83],"an":[84,91,140],"explicit":[85],"model":[86,93],"infer":[88],"subgoals":[89,107,138,166],"implicit":[92],"predict":[95],"final":[97,114,122],"goal,":[98],"inspired":[99],"by":[100,108],"way":[101],"human":[103],"thinking":[104],"that":[105,193],"infers":[106],"using":[109],"current":[111,127],"state":[112,128],"goal":[115,123],"as":[116,118],"well":[117],"reason":[119],"about":[120],"conditioned":[124],"on":[125,210],"given":[130],"Additionally,":[132],"sampler":[135],"selects":[136],"valid":[137],"from":[139,167],"offline":[141],"dataset":[142],"enhance":[144],"While":[151],"selector":[154],"utilizes":[155],"function":[158],"filter":[163],"optimal":[165],"candidates.":[169],"validate":[171],"our":[172,194],"method,":[173],"conduct":[175],"four":[176],"both":[180],"simulation":[181],"real":[184],"world.":[185],"obtained":[187],"quantitative":[188],"qualitative":[190],"data":[191],"indicate":[192],"approach":[195],"achieves":[196],"promising":[197],"performance":[198],"compared":[199],"other":[201],"baseline":[202],"methods.":[203],"These":[204],"experimental":[205],"results":[206],"can":[207],"be":[208],"seen":[209],"website":[212],"https://sites.google.com/view/vaesi.":[213]},"counts_by_year":[{"year":2025,"cited_by_count":4}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
