{"id":"https://openalex.org/W4405786494","doi":"https://doi.org/10.1109/iros58592.2024.10801306","title":"Rocket Landing Control with Random Annealing Jump Start Reinforcement Learning","display_name":"Rocket Landing Control with Random Annealing Jump Start Reinforcement Learning","publication_year":2024,"publication_date":"2024-10-14","ids":{"openalex":"https://openalex.org/W4405786494","doi":"https://doi.org/10.1109/iros58592.2024.10801306"},"language":"en","primary_location":{"id":"doi:10.1109/iros58592.2024.10801306","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros58592.2024.10801306","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5057254330","display_name":"Yuxuan Jiang","orcid":"https://orcid.org/0000-0003-4285-0495"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yuxuan Jiang","raw_affiliation_strings":["Tsinghua University,School of Vehicle and Mobility,Beijing,China,100084"],"affiliations":[{"raw_affiliation_string":"Tsinghua University,School of Vehicle and Mobility,Beijing,China,100084","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101620888","display_name":"Yujie Yang","orcid":"https://orcid.org/0000-0001-7222-0019"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yujie Yang","raw_affiliation_strings":["Tsinghua University,School of Vehicle and Mobility,Beijing,China,100084"],"affiliations":[{"raw_affiliation_string":"Tsinghua University,School of Vehicle and Mobility,Beijing,China,100084","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083843330","display_name":"Zhiqian Lan","orcid":"https://orcid.org/0000-0003-4102-1919"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhiqian Lan","raw_affiliation_strings":["Tsinghua University,School of Vehicle and Mobility,Beijing,China,100084"],"affiliations":[{"raw_affiliation_string":"Tsinghua University,School of Vehicle and Mobility,Beijing,China,100084","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029301375","display_name":"Guojian Zhan","orcid":"https://orcid.org/0000-0002-1246-4860"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guojian Zhan","raw_affiliation_strings":["Tsinghua University,School of Vehicle and Mobility,Beijing,China,100084"],"affiliations":[{"raw_affiliation_string":"Tsinghua University,School of Vehicle and Mobility,Beijing,China,100084","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100747108","display_name":"Shengbo Eben Li","orcid":"https://orcid.org/0000-0003-4923-3633"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shengbo Eben Li","raw_affiliation_strings":["Tsinghua University,College of Artificial Intelligence,Beijing,China,100084"],"affiliations":[{"raw_affiliation_string":"Tsinghua University,College of Artificial Intelligence,Beijing,China,100084","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101697324","display_name":"Qi Sun","orcid":"https://orcid.org/0000-0002-2664-2509"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qi Sun","raw_affiliation_strings":["Tsinghua University,School of Vehicle and Mobility,Beijing,China,100084"],"affiliations":[{"raw_affiliation_string":"Tsinghua University,School of Vehicle and Mobility,Beijing,China,100084","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070820936","display_name":"Jianhua Ma","orcid":"https://orcid.org/0000-0001-9383-2559"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jian Ma","raw_affiliation_strings":["LandSpace Technology Corporation,Beijing,China,100176"],"affiliations":[{"raw_affiliation_string":"LandSpace Technology Corporation,Beijing,China,100176","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112414003","display_name":"Teng-Jen Yu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tianwen Yu","raw_affiliation_strings":["LandSpace Technology Corporation,Beijing,China,100176"],"affiliations":[{"raw_affiliation_string":"LandSpace Technology Corporation,Beijing,China,100176","institution_ids":[]}]},{"author_position":"last","author":{"id":null,"display_name":"Changwu Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Changwu Zhang","raw_affiliation_strings":["LandSpace Technology Corporation,Beijing,China,100176"],"affiliations":[{"raw_affiliation_string":"LandSpace Technology Corporation,Beijing,China,100176","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5057254330"],"corresponding_institution_ids":["https://openalex.org/I99065089"],"apc_list":null,"apc_paid":null,"fwci":2.7642,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.92942298,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"14026","last_page":"14033"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12158","display_name":"Guidance and Control Systems","score":0.9962000250816345,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12158","display_name":"Guidance and Control Systems","score":0.9962000250816345,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13855","display_name":"Aerospace Engineering and Control Systems","score":0.9957000017166138,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10040","display_name":"Adaptive Control of Nonlinear Systems","score":0.9950000047683716,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/aeronautics","display_name":"Aeronautics","score":0.5954973697662354},{"id":"https://openalex.org/keywords/jump","display_name":"Jump","score":0.5884028077125549},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.5629284381866455},{"id":"https://openalex.org/keywords/aerospace-engineering","display_name":"Aerospace engineering","score":0.5385291576385498},{"id":"https://openalex.org/keywords/rocket","display_name":"Rocket (weapon)","score":0.514758825302124},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.46797946095466614},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.34528809785842896},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.23187485337257385},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.1692863404750824}],"concepts":[{"id":"https://openalex.org/C178802073","wikidata":"https://www.wikidata.org/wiki/Q8421","display_name":"Aeronautics","level":1,"score":0.5954973697662354},{"id":"https://openalex.org/C2780695682","wikidata":"https://www.wikidata.org/wiki/Q4005959","display_name":"Jump","level":2,"score":0.5884028077125549},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.5629284381866455},{"id":"https://openalex.org/C146978453","wikidata":"https://www.wikidata.org/wiki/Q3798668","display_name":"Aerospace engineering","level":1,"score":0.5385291576385498},{"id":"https://openalex.org/C187878255","wikidata":"https://www.wikidata.org/wiki/Q2037215","display_name":"Rocket (weapon)","level":2,"score":0.514758825302124},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.46797946095466614},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.34528809785842896},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.23187485337257385},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.1692863404750824},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iros58592.2024.10801306","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros58592.2024.10801306","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320322392","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":9,"referenced_works":["https://openalex.org/W2963099939","https://openalex.org/W2963523627","https://openalex.org/W2989847975","https://openalex.org/W2990747716","https://openalex.org/W3015082424","https://openalex.org/W3127561923","https://openalex.org/W4317553716","https://openalex.org/W4362650413","https://openalex.org/W4366158867"],"related_works":["https://openalex.org/W4306904969","https://openalex.org/W2360879373","https://openalex.org/W2355187745","https://openalex.org/W2138720691","https://openalex.org/W4362501864","https://openalex.org/W3116416607","https://openalex.org/W2947562066","https://openalex.org/W4387400414","https://openalex.org/W2990912121","https://openalex.org/W4399272190"],"abstract_inverted_index":{"Rocket":[0],"recycling":[1],"is":[2,108,172,223],"a":[3,31,88,94,175],"crucial":[4],"pursuit":[5],"in":[6,16,38,129,195],"aerospace":[7],"technology,":[8],"aimed":[9],"at":[10],"reducing":[11],"costs":[12],"and":[13,126,192,206,209,217,228,236],"environmental":[14,124],"impact":[15],"space":[17],"exploration.":[18],"The":[19,169,220],"primary":[20],"focus":[21],"centers":[22],"on":[23,93,186],"rocket":[24,34,82,96],"landing":[25,83],"control,":[26],"involving":[27],"the":[28,44,54,64,73,78,134,138,141,146,162,232,239],"guidance":[29],"of":[30,46,53,66,81,238],"nonlinear":[32],"under-actuated":[33],"with":[35,87,178],"limited":[36],"fuel":[37],"real-time.":[39],"This":[40,70,155],"challenging":[41],"task":[42],"prompts":[43],"application":[45],"reinforcement":[47],"learning":[48,128],"(RL),":[49],"yet":[50],"goal-oriented":[51,112],"nature":[52],"problem":[55,163],"poses":[56],"difficulties":[57],"for":[58,72,110,140],"standard":[59],"RL":[60,167],"algorithms":[61],"due":[62],"to":[63,91,122,151,166,183],"absence":[65],"intermediate":[67],"reward":[68,205],"signals.":[69],"paper,":[71],"first":[74],"time,":[75],"significantly":[76],"elevates":[77],"success":[79],"rate":[80],"control":[84],"from":[85,174],"8%":[86],"baseline":[89],"controller":[90],"97%":[92],"high-fidelity":[95],"model":[97],"using":[98],"RL.":[99,130],"Our":[100],"approach,":[101],"called":[102],"Random":[103],"Annealing":[104],"Jump":[105],"Start":[106],"(RAJS),":[107],"tailored":[109],"real-world":[111],"problems":[113],"by":[114,145],"leveraging":[115],"prior":[116],"feedback":[117],"controllers":[118],"as":[119],"guide":[120,135,142,170],"policy":[121,127,136,148,215],"facilitate":[123],"exploration":[125,147,159],"In":[131],"each":[132],"episode,":[133],"navigates":[137],"environment":[139],"horizon,":[143],"followed":[144],"taking":[149],"charge":[150],"complete":[152],"remaining":[153],"steps.":[154],"jump-start":[156],"strategy":[157],"prunes":[158],"space,":[160],"rendering":[161],"more":[164],"tractable":[165],"algorithms.":[168],"horizon":[171],"sampled":[173],"uniform":[176],"distribution,":[177],"its":[179],"upper":[180],"bound":[181],"annealing":[182],"zero":[184],"based":[185],"performance":[187,216],"metrics,":[188],"mitigating":[189],"distribution":[190],"shift":[191],"mismatch":[193],"issues":[194],"existing":[196],"methods.":[197],"Additional":[198],"enhancements,":[199],"including":[200],"cascading":[201],"jump":[202],"start,":[203],"refined":[204],"terminal":[207],"condition,":[208],"action":[210],"smoothness":[211,237],"regulation,":[212],"further":[213],"improve":[214],"practical":[218],"applicability.":[219],"proposed":[221,240],"method":[222],"validated":[224],"through":[225],"extensive":[226],"evaluation":[227],"Hardware-in-the-Loop":[229],"testing,":[230],"affirming":[231],"effectiveness,":[233],"real-time":[234],"feasibility,":[235],"controller.":[241]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1}],"updated_date":"2026-04-17T18:11:37.981687","created_date":"2025-10-10T00:00:00"}
