{"id":"https://openalex.org/W4413925307","doi":"https://doi.org/10.1109/icra55743.2025.11127927","title":"ASCENT: Autonomous Skill Learning Toward Complex Embodied Tasks With Foundation Models","display_name":"ASCENT: Autonomous Skill Learning Toward Complex Embodied Tasks With Foundation Models","publication_year":2025,"publication_date":"2025-05-19","ids":{"openalex":"https://openalex.org/W4413925307","doi":"https://doi.org/10.1109/icra55743.2025.11127927"},"language":"en","primary_location":{"id":"doi:10.1109/icra55743.2025.11127927","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra55743.2025.11127927","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5008478142","display_name":"Haolin Wu","orcid":"https://orcid.org/0009-0006-8472-8489"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haolin Wu","raw_affiliation_strings":["School of Computer Science and Engineering, Sun Yatsen University,Guangzhou,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Sun Yatsen University,Guangzhou,China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016547303","display_name":"Yuecheng Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I2250955327","display_name":"Huawei Technologies (China)","ror":"https://ror.org/00cmhce21","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250955327"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuecheng Liu","raw_affiliation_strings":["Huawei Noah&#x0027;s Ark Lab,Shenzhen,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Huawei Noah&#x0027;s Ark Lab,Shenzhen,China","institution_ids":["https://openalex.org/I2250955327"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025376117","display_name":"Junyi Dong","orcid":"https://orcid.org/0000-0001-7366-8907"},"institutions":[{"id":"https://openalex.org/I2250955327","display_name":"Huawei Technologies (China)","ror":"https://ror.org/00cmhce21","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250955327"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Junyi Dong","raw_affiliation_strings":["Embodied AI Innovation Lab, Huawei Cloud,Shenzhen,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Embodied AI Innovation Lab, Huawei Cloud,Shenzhen,China","institution_ids":["https://openalex.org/I2250955327"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076374123","display_name":"Heng Zhang","orcid":"https://orcid.org/0000-0003-0883-7318"},"institutions":[{"id":"https://openalex.org/I2250955327","display_name":"Huawei Technologies (China)","ror":"https://ror.org/00cmhce21","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250955327"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Heng Zhang","raw_affiliation_strings":["Embodied AI Innovation Lab, Huawei Cloud,Shenzhen,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Embodied AI Innovation Lab, Huawei Cloud,Shenzhen,China","institution_ids":["https://openalex.org/I2250955327"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062329742","display_name":"Sitong Mao","orcid":"https://orcid.org/0000-0003-2490-2896"},"institutions":[{"id":"https://openalex.org/I2250955327","display_name":"Huawei Technologies (China)","ror":"https://ror.org/00cmhce21","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250955327"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Sitong Mao","raw_affiliation_strings":["Embodied AI Innovation Lab, Huawei Cloud,Shenzhen,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Embodied AI Innovation Lab, Huawei Cloud,Shenzhen,China","institution_ids":["https://openalex.org/I2250955327"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5107772128","display_name":"Hesheng Wang","orcid":"https://orcid.org/0000-0002-9959-1634"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hesheng Wang","raw_affiliation_strings":["Shanghai Jiao Tong University,Department of Automation,Shanghai,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University,Department of Automation,Shanghai,China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084826798","display_name":"Weigang Wu","orcid":"https://orcid.org/0000-0002-4714-7021"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Weigang Wu","raw_affiliation_strings":["School of Computer Science and Engineering, Sun Yatsen University,Guangzhou,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Sun Yatsen University,Guangzhou,China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5042268476","display_name":"Shunbo Zhou","orcid":"https://orcid.org/0000-0002-6077-4951"},"institutions":[{"id":"https://openalex.org/I2250955327","display_name":"Huawei Technologies (China)","ror":"https://ror.org/00cmhce21","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250955327"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shunbo Zhou","raw_affiliation_strings":["Embodied AI Innovation Lab, Huawei Cloud,Shenzhen,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Embodied AI Innovation Lab, Huawei Cloud,Shenzhen,China","institution_ids":["https://openalex.org/I2250955327"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.1076788,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"16752","last_page":"16758"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11902","display_name":"Intelligent Tutoring Systems and Adaptive Learning","score":0.7199000120162964,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11902","display_name":"Intelligent Tutoring Systems and Adaptive Learning","score":0.7199000120162964,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.642799973487854,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10906","display_name":"AI-based Problem Solving and Planning","score":0.6292999982833862,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/embodied-cognition","display_name":"Embodied cognition","score":0.859897255897522},{"id":"https://openalex.org/keywords/foundation","display_name":"Foundation (evidence)","score":0.8285629153251648},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6190809011459351},{"id":"https://openalex.org/keywords/cognitive-science","display_name":"Cognitive science","score":0.46578875184059143},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.39654549956321716},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.3537447154521942},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.2342437505722046},{"id":"https://openalex.org/keywords/political-science","display_name":"Political science","score":0.09064039587974548}],"concepts":[{"id":"https://openalex.org/C100609095","wikidata":"https://www.wikidata.org/wiki/Q1335050","display_name":"Embodied cognition","level":2,"score":0.859897255897522},{"id":"https://openalex.org/C2780966255","wikidata":"https://www.wikidata.org/wiki/Q5474306","display_name":"Foundation (evidence)","level":2,"score":0.8285629153251648},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6190809011459351},{"id":"https://openalex.org/C188147891","wikidata":"https://www.wikidata.org/wiki/Q147638","display_name":"Cognitive science","level":1,"score":0.46578875184059143},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.39654549956321716},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.3537447154521942},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.2342437505722046},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.09064039587974548},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icra55743.2025.11127927","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra55743.2025.11127927","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":19,"referenced_works":["https://openalex.org/W2050755653","https://openalex.org/W2082511574","https://openalex.org/W2961368225","https://openalex.org/W3212380917","https://openalex.org/W4224004358","https://openalex.org/W4383066118","https://openalex.org/W4386065846","https://openalex.org/W4389924455","https://openalex.org/W4393191863","https://openalex.org/W4400905328","https://openalex.org/W4401413701","https://openalex.org/W4401414504","https://openalex.org/W4401416363","https://openalex.org/W4401416949","https://openalex.org/W4402029988","https://openalex.org/W4402660086","https://openalex.org/W4402667028","https://openalex.org/W4402727120","https://openalex.org/W4402753875"],"related_works":["https://openalex.org/W2380179524","https://openalex.org/W4283365723","https://openalex.org/W2963001125","https://openalex.org/W2753017648","https://openalex.org/W2513760693","https://openalex.org/W2062819913","https://openalex.org/W2149544884","https://openalex.org/W2133485962","https://openalex.org/W4246694033","https://openalex.org/W4211188312"],"abstract_inverted_index":{"Collecting":[0],"data":[1,49],"from":[2,51,127,181],"simulated":[3,52,74],"scenarios":[4,75],"for":[5,144,193],"training":[6,159,175,190],"robotic":[7],"skills":[8,126,150],"provides":[9],"a":[10,81,107],"safer":[11],"and":[12,36,67,76,101,161],"more":[13],"controllable":[14],"alternative":[15],"to":[16,72,96,132,154,170,202],"real-world":[17],"environments.":[18],"However,":[19],"it":[20],"demands":[21],"considerable":[22],"effort,":[23],"including":[24],"the":[25,31,37,46,59,120,136,155,164,173,187],"manual":[26],"construction":[27],"of":[28,34,39,48,62,189],"simulation":[29],"environments,":[30],"careful":[32],"design":[33],"tasks,":[35],"challenge":[38],"obtaining":[40],"effective":[41],"trajectories.":[42],"These":[43],"limitations":[44],"hinder":[45],"efficiency":[47],"collection":[50],"scenarios.":[53],"In":[54],"this":[55],"paper,":[56],"we":[57],"leverage":[58],"prior":[60],"knowledge":[61],"Large":[63,68],"Language":[64],"Models":[65,70],"(LLMs)":[66],"Multimodal":[69],"(LMMs)":[71],"generate":[73,102],"embodied":[77],"tasks.":[78],"We":[79],"introduce":[80],"novel":[82],"framework,":[83],"ASCENT":[84,105],"(Autonomous":[85],"Skill":[86],"learning":[87,111,194],"toward":[88],"Complex":[89],"Embodied":[90],"tasks":[91,100,196],"with":[92],"fouNdaTion":[93],"models),":[94],"designed":[95],"efficiently":[97],"accomplish":[98],"these":[99],"trajectory":[103],"data.":[104],"features":[106],"fully":[108],"autonomous":[109],"skill":[110,130,174],"mechanism":[112],"based":[113,177],"on":[114,178],"AI":[115,121,165],"agent.":[116],"During":[117],"task":[118,137],"training,":[119],"agent":[122,166],"identifies":[123],"suitable":[124],"atomic":[125,129,149],"an":[128,141,168],"library":[131],"either":[133],"directly":[134],"complete":[135],"or":[138],"serve":[139],"as":[140],"initial":[142],"policy":[143],"further":[145],"training.":[146],"Newly":[147],"acquired":[148],"are":[151],"subsequently":[152],"added":[153],"library.":[156],"To":[157],"address":[158],"failures":[160],"enhance":[162],"efficiency,":[163],"uses":[167],"LLM":[169],"automatically":[171],"optimize":[172],"process":[176],"feedback":[179],"received":[180],"simulations.":[182],"Experimental":[183],"results":[184],"indicate":[185],"that":[186],"number":[188],"steps":[191],"required":[192],"new":[195],"can":[197],"be":[198],"reduced":[199],"by":[200],"up":[201],"65.9":[203],"%.":[204]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
