{"id":"https://openalex.org/W2947369369","doi":"https://doi.org/10.1109/lra.2019.2920285","title":"Learning to Plan Hierarchically From Curriculum","display_name":"Learning to Plan Hierarchically From Curriculum","publication_year":2019,"publication_date":"2019-05-31","ids":{"openalex":"https://openalex.org/W2947369369","doi":"https://doi.org/10.1109/lra.2019.2920285","mag":"2947369369"},"language":"en","primary_location":{"id":"doi:10.1109/lra.2019.2920285","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2019.2920285","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/1906.07371","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5038103937","display_name":"Philippe Morere","orcid":"https://orcid.org/0000-0001-6035-1724"},"institutions":[{"id":"https://openalex.org/I129604602","display_name":"The University of Sydney","ror":"https://ror.org/0384j8v12","country_code":"AU","type":"education","lineage":["https://openalex.org/I129604602"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Philippe Morere","raw_affiliation_strings":["University of Sydney, Sydney, NSW, Australia"],"raw_orcid":"https://orcid.org/0000-0001-6035-1724","affiliations":[{"raw_affiliation_string":"University of Sydney, Sydney, NSW, Australia","institution_ids":["https://openalex.org/I129604602"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033725695","display_name":"Lionel Ott","orcid":"https://orcid.org/0000-0001-6554-0575"},"institutions":[{"id":"https://openalex.org/I129604602","display_name":"The University of Sydney","ror":"https://ror.org/0384j8v12","country_code":"AU","type":"education","lineage":["https://openalex.org/I129604602"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Lionel Ott","raw_affiliation_strings":["University of Sydney, Sydney, NSW, Australia"],"raw_orcid":"https://orcid.org/0000-0001-6554-0575","affiliations":[{"raw_affiliation_string":"University of Sydney, Sydney, NSW, Australia","institution_ids":["https://openalex.org/I129604602"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5062619542","display_name":"F\u00e1bio Ramos","orcid":"https://orcid.org/0000-0002-2996-2188"},"institutions":[{"id":"https://openalex.org/I129604602","display_name":"The University of Sydney","ror":"https://ror.org/0384j8v12","country_code":"AU","type":"education","lineage":["https://openalex.org/I129604602"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Fabio Ramos","raw_affiliation_strings":["University of Sydney, Sydney, NSW, Australia"],"raw_orcid":"https://orcid.org/0000-0002-2996-2188","affiliations":[{"raw_affiliation_string":"University of Sydney, Sydney, NSW, Australia","institution_ids":["https://openalex.org/I129604602"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.8676,"has_fulltext":false,"cited_by_count":9,"citation_normalized_percentile":{"value":0.80606455,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":"4","issue":"3","first_page":"2815","last_page":"2822"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10906","display_name":"AI-based Problem Solving and Planning","score":0.9945999979972839,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10906","display_name":"AI-based Problem Solving and Planning","score":0.9945999979972839,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9848999977111816,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9768999814987183,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.7277175784111023},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.713503360748291},{"id":"https://openalex.org/keywords/plan","display_name":"Plan (archaeology)","score":0.6460976600646973},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.5640501976013184},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.4960714280605316},{"id":"https://openalex.org/keywords/curriculum","display_name":"Curriculum","score":0.49192285537719727},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.48728621006011963},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.40926507115364075},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.09386658668518066}],"concepts":[{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.7277175784111023},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.713503360748291},{"id":"https://openalex.org/C2776505523","wikidata":"https://www.wikidata.org/wiki/Q4785468","display_name":"Plan (archaeology)","level":2,"score":0.6460976600646973},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.5640501976013184},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.4960714280605316},{"id":"https://openalex.org/C47177190","wikidata":"https://www.wikidata.org/wiki/Q207137","display_name":"Curriculum","level":2,"score":0.49192285537719727},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.48728621006011963},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.40926507115364075},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.09386658668518066},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C95457728","wikidata":"https://www.wikidata.org/wiki/Q309","display_name":"History","level":0,"score":0.0},{"id":"https://openalex.org/C19417346","wikidata":"https://www.wikidata.org/wiki/Q7922","display_name":"Pedagogy","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/lra.2019.2920285","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2019.2920285","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:1906.07371","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1906.07371","pdf_url":"https://arxiv.org/pdf/1906.07371","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:1906.07371","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1906.07371","pdf_url":"https://arxiv.org/pdf/1906.07371","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"display_name":"Sustainable cities and communities","score":0.4399999976158142,"id":"https://metadata.un.org/sdg/11"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":55,"referenced_works":["https://openalex.org/W32403112","https://openalex.org/W131069610","https://openalex.org/W1509999309","https://openalex.org/W1546503963","https://openalex.org/W1558068925","https://openalex.org/W1578521162","https://openalex.org/W1591434728","https://openalex.org/W1714211023","https://openalex.org/W1757796397","https://openalex.org/W1978108654","https://openalex.org/W1980035368","https://openalex.org/W1987902506","https://openalex.org/W1997477668","https://openalex.org/W2101355568","https://openalex.org/W2109910161","https://openalex.org/W2115549875","https://openalex.org/W2124125910","https://openalex.org/W2133458291","https://openalex.org/W2143435603","https://openalex.org/W2151645094","https://openalex.org/W2151693816","https://openalex.org/W2162227979","https://openalex.org/W2308567354","https://openalex.org/W2333632897","https://openalex.org/W2337392266","https://openalex.org/W2409715576","https://openalex.org/W2604626881","https://openalex.org/W2616430965","https://openalex.org/W2751258126","https://openalex.org/W2759847408","https://openalex.org/W2787066086","https://openalex.org/W2798866735","https://openalex.org/W2802184653","https://openalex.org/W2898802014","https://openalex.org/W2898963091","https://openalex.org/W2909064322","https://openalex.org/W2952011561","https://openalex.org/W2952258289","https://openalex.org/W2963184571","https://openalex.org/W2963293881","https://openalex.org/W3098184036","https://openalex.org/W4255876299","https://openalex.org/W4298857966","https://openalex.org/W6605295560","https://openalex.org/W6630573394","https://openalex.org/W6634579893","https://openalex.org/W6637967152","https://openalex.org/W6677446445","https://openalex.org/W6679518283","https://openalex.org/W6680976742","https://openalex.org/W6737937804","https://openalex.org/W6745052879","https://openalex.org/W6750506353","https://openalex.org/W6755655695","https://openalex.org/W6756065142"],"related_works":["https://openalex.org/W4306904969","https://openalex.org/W3162204513","https://openalex.org/W2138720691","https://openalex.org/W4362501864","https://openalex.org/W4380318855","https://openalex.org/W2031695474","https://openalex.org/W2024136090","https://openalex.org/W2586732548","https://openalex.org/W3049728571","https://openalex.org/W2768698792"],"abstract_inverted_index":{"We":[0,14,88,123],"present":[1],"a":[2,90,107,173,178],"framework":[3,62],"for":[4,58,93],"learning":[5,81,94,164],"to":[6,114,152,158,167],"plan":[7],"hierarchically":[8],"in":[9,22,138,145,172],"domains":[10],"with":[11,54,85,150],"unknown":[12],"dynamics.":[13],"enhance":[15,120],"planning":[16,75,157],"performance":[17],"by":[18,32,43,76],"exploiting":[19],"problem":[20],"structure":[21],"several":[23],"ways:":[24],"First,":[25],"we":[26,50],"simplify":[27],"the":[28,86,104],"search":[29],"over":[30],"plans":[31,40],"leveraging":[33],"knowledge":[34],"of":[35,106,147],"skill":[36,67],"objectives;":[37],"second,":[38],"shorter":[39],"are":[41,111],"generated":[42],"enforcing":[44],"aggressively":[45],"hierarchical":[46],"planning;":[47],"and":[48,69,119,128],"third,":[49],"learn":[51],"transition":[52,64],"dynamics":[53,65],"sparse":[55],"local":[56],"models":[57],"better":[59],"generalization.":[60],"Our":[61,141],"decomposes":[63],"into":[66],"effects":[68],"success":[70],"conditions,":[71],"which":[72],"allows":[73],"fast":[74],"reasoning":[77],"on":[78,177],"effects,":[79],"while":[80,135],"conditions":[82,127],"from":[83,102],"interactions":[84],"world.":[87],"propose":[89],"simple":[91],"method":[92,142],"new":[95],"abstract":[96,117,129],"skills,":[97],"using":[98],"successful":[99],"trajectories":[100],"stemming":[101],"completing":[103],"goals":[105],"curriculum.":[108],"Learned":[109],"skills":[110,118,130],"then":[112],"refined":[113],"leverage":[115],"other":[116],"subsequent":[121],"planning.":[122],"show":[124],"that":[125],"both":[126],"can":[131],"be":[132],"learned":[133],"simultaneously":[134],"planning,":[136],"even":[137],"stochastic":[139],"domains.":[140],"is":[143,170],"validated":[144],"experiments":[146],"increasing":[148],"complexity,":[149],"up":[151],"2100":[153],"states,":[154],"showing":[155],"superior":[156],"classic":[159],"non-hierarchical":[160],"planners":[161],"or":[162],"reinforcement":[163],"methods.":[165],"Applicability":[166],"real-world":[168],"problems":[169],"demonstrated":[171],"simulation-to-real":[174],"transfer":[175],"experiment":[176],"robotic":[179],"manipulator.":[180]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":3},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
