{"id":"https://openalex.org/W4405785875","doi":"https://doi.org/10.1109/iros58592.2024.10801931","title":"Multi-Fidelity Reinforcement Learning for Minimum Energy Trajectory Planning","display_name":"Multi-Fidelity Reinforcement Learning for Minimum Energy Trajectory Planning","publication_year":2024,"publication_date":"2024-10-14","ids":{"openalex":"https://openalex.org/W4405785875","doi":"https://doi.org/10.1109/iros58592.2024.10801931"},"language":"en","primary_location":{"id":"doi:10.1109/iros58592.2024.10801931","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros58592.2024.10801931","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5111194469","display_name":"Luke de Castro","orcid":null},"institutions":[{"id":"https://openalex.org/I63966007","display_name":"Massachusetts Institute of Technology","ror":"https://ror.org/042nb2s44","country_code":"US","type":"education","lineage":["https://openalex.org/I63966007"]},{"id":"https://openalex.org/I4210143601","display_name":"Decision Systems (United States)","ror":"https://ror.org/0434dpa13","country_code":"US","type":"company","lineage":["https://openalex.org/I4210143601"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Luke de Castro","raw_affiliation_strings":["Laboratory for Information and Decision Systems (LIDS), Massachusetts Institute of Technology,Cambridge,Massachusetts,02139"],"affiliations":[{"raw_affiliation_string":"Laboratory for Information and Decision Systems (LIDS), Massachusetts Institute of Technology,Cambridge,Massachusetts,02139","institution_ids":["https://openalex.org/I4210143601","https://openalex.org/I63966007"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069224373","display_name":"Gilhyun Ryou","orcid":"https://orcid.org/0000-0002-6008-5881"},"institutions":[{"id":"https://openalex.org/I63966007","display_name":"Massachusetts Institute of Technology","ror":"https://ror.org/042nb2s44","country_code":"US","type":"education","lineage":["https://openalex.org/I63966007"]},{"id":"https://openalex.org/I4210143601","display_name":"Decision Systems (United States)","ror":"https://ror.org/0434dpa13","country_code":"US","type":"company","lineage":["https://openalex.org/I4210143601"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Gilhyun Ryou","raw_affiliation_strings":["Laboratory for Information and Decision Systems (LIDS), Massachusetts Institute of Technology,Cambridge,Massachusetts,02139"],"affiliations":[{"raw_affiliation_string":"Laboratory for Information and Decision Systems (LIDS), Massachusetts Institute of Technology,Cambridge,Massachusetts,02139","institution_ids":["https://openalex.org/I4210143601","https://openalex.org/I63966007"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084104604","display_name":"Hyungseuk Ohn","orcid":"https://orcid.org/0000-0001-8821-9696"},"institutions":[{"id":"https://openalex.org/I49946491","display_name":"Hyundai Motors (South Korea)","ror":"https://ror.org/016kvft77","country_code":"KR","type":"company","lineage":["https://openalex.org/I197312522","https://openalex.org/I49946491"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Hyungseuk Ohn","raw_affiliation_strings":["Hyundai Motor Company"],"affiliations":[{"raw_affiliation_string":"Hyundai Motor Company","institution_ids":["https://openalex.org/I49946491"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5081073767","display_name":"Serta\u00e7 Karaman","orcid":"https://orcid.org/0000-0002-2225-7275"},"institutions":[{"id":"https://openalex.org/I63966007","display_name":"Massachusetts Institute of Technology","ror":"https://ror.org/042nb2s44","country_code":"US","type":"education","lineage":["https://openalex.org/I63966007"]},{"id":"https://openalex.org/I4210143601","display_name":"Decision Systems (United States)","ror":"https://ror.org/0434dpa13","country_code":"US","type":"company","lineage":["https://openalex.org/I4210143601"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sertac Karaman","raw_affiliation_strings":["Laboratory for Information and Decision Systems (LIDS), Massachusetts Institute of Technology,Cambridge,Massachusetts,02139"],"affiliations":[{"raw_affiliation_string":"Laboratory for Information and Decision Systems (LIDS), Massachusetts Institute of Technology,Cambridge,Massachusetts,02139","institution_ids":["https://openalex.org/I4210143601","https://openalex.org/I63966007"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5111194469"],"corresponding_institution_ids":["https://openalex.org/I4210143601","https://openalex.org/I63966007"],"apc_list":null,"apc_paid":null,"fwci":0.2162,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.54307136,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"7710","last_page":"7717"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11942","display_name":"Transportation and Mobility Innovations","score":0.9950000047683716,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11942","display_name":"Transportation and Mobility Innovations","score":0.9950000047683716,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.9944999814033508,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10768","display_name":"Electric Vehicles and Infrastructure","score":0.9900000095367432,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8822354674339294},{"id":"https://openalex.org/keywords/trajectory","display_name":"Trajectory","score":0.7293004989624023},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7074863910675049},{"id":"https://openalex.org/keywords/fidelity","display_name":"Fidelity","score":0.6812870502471924},{"id":"https://openalex.org/keywords/motion-planning","display_name":"Motion planning","score":0.43193912506103516},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4245303273200989},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.16323089599609375}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8822354674339294},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.7293004989624023},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7074863910675049},{"id":"https://openalex.org/C2776459999","wikidata":"https://www.wikidata.org/wiki/Q2119376","display_name":"Fidelity","level":2,"score":0.6812870502471924},{"id":"https://openalex.org/C81074085","wikidata":"https://www.wikidata.org/wiki/Q366872","display_name":"Motion planning","level":3,"score":0.43193912506103516},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4245303273200989},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.16323089599609375},{"id":"https://openalex.org/C1276947","wikidata":"https://www.wikidata.org/wiki/Q333","display_name":"Astronomy","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iros58592.2024.10801931","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros58592.2024.10801931","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/7","score":0.7699999809265137,"display_name":"Affordable and clean energy"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":20,"referenced_works":["https://openalex.org/W2162991084","https://openalex.org/W2565201867","https://openalex.org/W2742561000","https://openalex.org/W2963223306","https://openalex.org/W2972099638","https://openalex.org/W3003344567","https://openalex.org/W3110257271","https://openalex.org/W3121471361","https://openalex.org/W3168186466","https://openalex.org/W3192043231","https://openalex.org/W4295856462","https://openalex.org/W4312281527","https://openalex.org/W6631732945","https://openalex.org/W6637968757","https://openalex.org/W6640963894","https://openalex.org/W6674989108","https://openalex.org/W6741002519","https://openalex.org/W6755463424","https://openalex.org/W6756351998","https://openalex.org/W6862583891"],"related_works":["https://openalex.org/W2381850946","https://openalex.org/W4380449851","https://openalex.org/W3125091513","https://openalex.org/W4318832338","https://openalex.org/W4306904969","https://openalex.org/W2138720691","https://openalex.org/W4362501864","https://openalex.org/W4323768008","https://openalex.org/W1941703695","https://openalex.org/W4380318855"],"abstract_inverted_index":{"Modeling":[0],"the":[1,79,83,120],"energy":[2,36,86,105,113,129],"consumption":[3],"of":[4],"a":[5,25,45,50,56,67,93,99,103],"quadrotor":[6],"involves":[7],"complex":[8],"electrical":[9],"and":[10],"physical":[11],"dynamics,":[12],"making":[13],"it":[14],"difficult":[15],"to":[16,77,92,102],"optimize.":[17],"To":[18],"address":[19],"this":[20,22],"challenge,":[21],"paper":[23],"presents":[24],"multi-fidelity":[26],"Gaussian":[27],"process":[28],"(MFGP)":[29],"method":[30],"that":[31,66],"efficiently":[32],"learns":[33],"an":[34,126],"accurate":[35],"prediction":[37,87],"model":[38,48,69,88],"by":[39,82,119],"combining":[40],"many":[41],"low-fidelity":[42],"samples":[43,54],"from":[44,55],"simple":[46],"motor":[47],"with":[49],"few":[51],"computationally":[52],"expensive":[53],"numerical":[57],"battery":[58],"simulation.":[59],"We":[60],"present":[61],"extensive":[62],"sample-efficiency":[63],"experiments,":[64],"demonstrating":[65],"single-fidelity":[68],"often":[70],"needs":[71],"10":[72],"times":[73],"more":[74,112],"high-fidelity":[75],"data":[76],"match":[78],"accuracy":[80],"achieved":[81],"MFGP.":[84],"The":[85,108],"is":[89],"then":[90],"applied":[91],"reinforcement":[94],"learning":[95],"(RL)":[96],"agent,":[97],"providing":[98],"reward":[100],"signal":[101],"minimum":[104,121],"planning":[106],"policy.":[107],"RL":[109],"policy":[110],"generates":[111],"efficient":[114],"trajectories":[115],"than":[116],"those":[117],"found":[118],"snap":[122],"baseline":[123],"method,":[124],"achieving":[125],"average":[127],"3.6%":[128],"reduction.":[130]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-12-27T23:08:20.325037","created_date":"2025-10-10T00:00:00"}
