{"id":"https://openalex.org/W4399391273","doi":"https://doi.org/10.1007/s10514-024-10162-8","title":"Reinforcement learning based autonomous multi-rotor landing on moving platforms","display_name":"Reinforcement learning based autonomous multi-rotor landing on moving platforms","publication_year":2024,"publication_date":"2024-06-06","ids":{"openalex":"https://openalex.org/W4399391273","doi":"https://doi.org/10.1007/s10514-024-10162-8"},"language":"en","primary_location":{"id":"doi:10.1007/s10514-024-10162-8","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10514-024-10162-8","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10514-024-10162-8.pdf","source":{"id":"https://openalex.org/S144091109","display_name":"Autonomous Robots","issn_l":"0929-5593","issn":["0929-5593","1573-7527"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Autonomous Robots","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/s10514-024-10162-8.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5068489098","display_name":"Pascal Goldschmid","orcid":"https://orcid.org/0000-0003-4854-1028"},"institutions":[{"id":"https://openalex.org/I100066346","display_name":"University of Stuttgart","ror":"https://ror.org/04vnq7t77","country_code":"DE","type":"education","lineage":["https://openalex.org/I100066346"]},{"id":"https://openalex.org/I4210135521","display_name":"Max Planck Institute for Intelligent Systems","ror":"https://ror.org/04fq9j139","country_code":"DE","type":"facility","lineage":["https://openalex.org/I149899117","https://openalex.org/I4210135521"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Pascal Goldschmid","raw_affiliation_strings":["Max Planck Institute for Intelligent Systems, 72076, T\u00fcbingen, Baden-W\u00fcrttemberg, Germany","University of Stuttgart, 70569, Stuttgart, Germany"],"affiliations":[{"raw_affiliation_string":"Max Planck Institute for Intelligent Systems, 72076, T\u00fcbingen, Baden-W\u00fcrttemberg, Germany","institution_ids":["https://openalex.org/I4210135521"]},{"raw_affiliation_string":"University of Stuttgart, 70569, Stuttgart, Germany","institution_ids":["https://openalex.org/I100066346"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5087038946","display_name":"Aamir Ahmad","orcid":"https://orcid.org/0000-0002-0727-3031"},"institutions":[{"id":"https://openalex.org/I100066346","display_name":"University of Stuttgart","ror":"https://ror.org/04vnq7t77","country_code":"DE","type":"education","lineage":["https://openalex.org/I100066346"]},{"id":"https://openalex.org/I4210135521","display_name":"Max Planck Institute for Intelligent Systems","ror":"https://ror.org/04fq9j139","country_code":"DE","type":"facility","lineage":["https://openalex.org/I149899117","https://openalex.org/I4210135521"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Aamir Ahmad","raw_affiliation_strings":["Max Planck Institute for Intelligent Systems, 72076, T\u00fcbingen, Baden-W\u00fcrttemberg, Germany","University of Stuttgart, 70569, Stuttgart, Germany"],"affiliations":[{"raw_affiliation_string":"Max Planck Institute for Intelligent Systems, 72076, T\u00fcbingen, Baden-W\u00fcrttemberg, Germany","institution_ids":["https://openalex.org/I4210135521"]},{"raw_affiliation_string":"University of Stuttgart, 70569, Stuttgart, Germany","institution_ids":["https://openalex.org/I100066346"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5068489098"],"corresponding_institution_ids":["https://openalex.org/I100066346","https://openalex.org/I4210135521"],"apc_list":{"value":2590,"currency":"EUR","value_usd":3390},"apc_paid":{"value":2590,"currency":"EUR","value_usd":3390},"fwci":0.2442,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.48336182,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":"48","issue":"4-5","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.993399977684021,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11615","display_name":"Control and Dynamics of Mobile Robots","score":0.9923999905586243,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8837636709213257},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8747700452804565},{"id":"https://openalex.org/keywords/rotor","display_name":"Rotor (electric)","score":0.5872620344161987},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.4728717505931854},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4613513946533203},{"id":"https://openalex.org/keywords/simulation","display_name":"Simulation","score":0.34278056025505066},{"id":"https://openalex.org/keywords/mechanical-engineering","display_name":"Mechanical engineering","score":0.08384910225868225}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8837636709213257},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8747700452804565},{"id":"https://openalex.org/C17281054","wikidata":"https://www.wikidata.org/wiki/Q193466","display_name":"Rotor (electric)","level":2,"score":0.5872620344161987},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.4728717505931854},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4613513946533203},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.34278056025505066},{"id":"https://openalex.org/C78519656","wikidata":"https://www.wikidata.org/wiki/Q101333","display_name":"Mechanical engineering","level":1,"score":0.08384910225868225},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/s10514-024-10162-8","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10514-024-10162-8","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10514-024-10162-8.pdf","source":{"id":"https://openalex.org/S144091109","display_name":"Autonomous Robots","issn_l":"0929-5593","issn":["0929-5593","1573-7527"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Autonomous Robots","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1007/s10514-024-10162-8","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10514-024-10162-8","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10514-024-10162-8.pdf","source":{"id":"https://openalex.org/S144091109","display_name":"Autonomous Robots","issn_l":"0929-5593","issn":["0929-5593","1573-7527"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Autonomous Robots","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320325850","display_name":"Universit\u00e4t Stuttgart","ror":"https://ror.org/04vnq7t77"}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4399391273.pdf"},"referenced_works_count":27,"referenced_works":["https://openalex.org/W1533650545","https://openalex.org/W1560368799","https://openalex.org/W1590700457","https://openalex.org/W2063468777","https://openalex.org/W2079517579","https://openalex.org/W2124338262","https://openalex.org/W2465948386","https://openalex.org/W2517829986","https://openalex.org/W2550961113","https://openalex.org/W2555341372","https://openalex.org/W2575417362","https://openalex.org/W2746974548","https://openalex.org/W2765891159","https://openalex.org/W2795566994","https://openalex.org/W2810217655","https://openalex.org/W2889677817","https://openalex.org/W2890755534","https://openalex.org/W2901402208","https://openalex.org/W2908846937","https://openalex.org/W2910655755","https://openalex.org/W2937582027","https://openalex.org/W3012544020","https://openalex.org/W3099548126","https://openalex.org/W3136542217","https://openalex.org/W6637967152","https://openalex.org/W6677067356","https://openalex.org/W6677826109"],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W2920061524","https://openalex.org/W4310083477","https://openalex.org/W2328553770","https://openalex.org/W1977959518","https://openalex.org/W2038908348","https://openalex.org/W2107890255","https://openalex.org/W2106552856","https://openalex.org/W2145821588","https://openalex.org/W2086122291"],"abstract_inverted_index":{"Abstract":[0],"Multi-rotor":[1],"UAVs":[2],"suffer":[3],"from":[4,72],"a":[5,19,67,75,116,157,188,270],"restricted":[6],"range":[7],"and":[8,29,45,51,90,150,182,277],"flight":[9],"duration":[10],"due":[11,61],"to":[12,26,62,65,84,96,174,204,255],"limited":[13,87],"battery":[14],"capacity.":[15],"Autonomous":[16],"landing":[17,113],"on":[18,42,92,166,281,291],"2D":[20],"moving":[21,172,202],"platform":[22,173,203],"offers":[23],"the":[24,34,37,49,52,112,132,143,148,151,171,178,185,197,201,210,218,226,239,244,292],"possibility":[25],"replenish":[27],"batteries":[28],"offload":[30],"data,":[31],"thus":[32],"increasing":[33],"utility":[35],"of":[36,48,118,131,170,200,217,246],"vehicle.":[38,220],"Classical":[39],"approaches":[40],"rely":[41],"accurate,":[43],"complex":[44],"difficult-to-derive":[46],"models":[47],"vehicle":[50],"environment.":[53],"Reinforcement":[54],"learning":[55,122],"(RL)":[56],"provides":[57],"an":[58],"attractive":[59],"alternative":[60],"its":[63],"ability":[64],"learn":[66],"suitable":[68],"control":[69],"policy":[70],"exclusively":[71],"data":[73],"during":[74],"training":[76,186,211,222,252],"procedure.":[77],"However,":[78],"current":[79],"methods":[80],"require":[81],"several":[82],"hours":[83],"train,":[85],"have":[86],"success":[88],"rates":[89],"depend":[91],"hyperparameters":[93,208],"that":[94,163,213,238],"need":[95],"be":[97],"tuned":[98],"by":[99,127],"trial-and-error.":[100],"We":[101],"address":[102],"all":[103,285],"these":[104],"issues":[105],"in":[106,146],"this":[107],"work.":[108],"First,":[109],"we":[110,155,195,236,275,288],"decompose":[111],"procedure":[114],"into":[115],"sequence":[117],"simpler,":[119],"but":[120],"similar":[121],"tasks.":[123],"This":[124],"is":[125,164,223,297],"enabled":[126],"applying":[128],"two":[129,262],"instances":[130],"same":[133],"RL":[134,228,258],"based":[135,165],"controller":[136],"trained":[137],"for":[138,141,209,261],"1D":[139],"motion":[140],"controlling":[142],"multi-rotor\u2019s":[144],"movement":[145],"both":[147],"longitudinal":[149],"lateral":[152],"directions.":[153],"Second,":[154],"introduce":[156],"powerful":[158],"state":[159,179],"space":[160,180],"discretization":[161],"technique":[162],"i)":[167],"kinematic":[168],"modeling":[169],"derive":[175,206],"information":[176],"about":[177],"topology":[181],"ii)":[183],"structuring":[184],"as":[187],"sequential":[189],"curriculum":[190],"using":[191,225],"transfer":[192],"learning.":[193],"Third,":[194],"leverage":[196],"kinematics":[198],"model":[199],"also":[205],"interpretable":[207],"process":[212],"ensure":[214],"sufficient":[215],"maneuverability":[216],"multi-rotor":[219],"The":[221],"performed":[224],"tabular":[227],"method":[229,241],"Double":[230],"Q-Learning":[231],".":[232,302],"Through":[233],"extensive":[234],"simulations":[235],"show":[237],"presented":[240],"significantly":[242],"increases":[243],"rate":[245],"successful":[247],"landings,":[248],"while":[249],"requiring":[250],"less":[251],"time":[253],"compared":[254],"other":[256],"deep":[257],"approaches.":[259],"Furthermore,":[260],"comparison":[263],"scenarios":[264,287],"it":[265],"achieves":[266],"comparable":[267],"performance":[268],"than":[269],"cascaded":[271],"PI":[272],"controller.":[273],"Finally,":[274],"deploy":[276],"demonstrate":[278],"our":[279],"algorithm":[280],"real":[282],"hardware.":[283],"For":[284],"evaluation":[286],"provide":[289],"statistics":[290],"agent\u2019s":[293],"performance.":[294],"Source":[295],"code":[296],"openly":[298],"available":[299],"at":[300],"https://github.com/robot-perception-group/rl_multi_rotor_landing":[301]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-04-11T08:14:18.477133","created_date":"2025-10-10T00:00:00"}
