{"id":"https://openalex.org/W4293715378","doi":"https://doi.org/10.3390/robotics11050085","title":"Controlling Fleets of Autonomous Mobile Robots with Reinforcement Learning: A Brief Survey","display_name":"Controlling Fleets of Autonomous Mobile Robots with Reinforcement Learning: A Brief Survey","publication_year":2022,"publication_date":"2022-08-30","ids":{"openalex":"https://openalex.org/W4293715378","doi":"https://doi.org/10.3390/robotics11050085"},"language":"en","primary_location":{"id":"doi:10.3390/robotics11050085","is_oa":true,"landing_page_url":"https://doi.org/10.3390/robotics11050085","pdf_url":"https://www.mdpi.com/2218-6581/11/5/85/pdf?version=1663926726","source":{"id":"https://openalex.org/S4210232487","display_name":"Robotics","issn_l":"2218-6581","issn":["2218-6581"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Robotics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.mdpi.com/2218-6581/11/5/85/pdf?version=1663926726","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5026833974","display_name":"Mike Wesselh\u00f6ft","orcid":"https://orcid.org/0000-0003-1797-6168"},"institutions":[{"id":"https://openalex.org/I159176309","display_name":"Universit\u00e4t Hamburg","ror":"https://ror.org/00g30e956","country_code":"DE","type":"education","lineage":["https://openalex.org/I159176309"]},{"id":"https://openalex.org/I884043246","display_name":"Hamburg University of Technology","ror":"https://ror.org/04bs1pb34","country_code":"DE","type":"education","lineage":["https://openalex.org/I884043246"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Mike Wesselh\u00f6ft","raw_affiliation_strings":["Institute for Technical Logistics, Hamburg University of Technology, 21079 Hamburg, Germany"],"raw_orcid":"https://orcid.org/0000-0003-1797-6168","affiliations":[{"raw_affiliation_string":"Institute for Technical Logistics, Hamburg University of Technology, 21079 Hamburg, Germany","institution_ids":["https://openalex.org/I159176309","https://openalex.org/I884043246"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032107440","display_name":"Johannes Hinckeldeyn","orcid":null},"institutions":[{"id":"https://openalex.org/I159176309","display_name":"Universit\u00e4t Hamburg","ror":"https://ror.org/00g30e956","country_code":"DE","type":"education","lineage":["https://openalex.org/I159176309"]},{"id":"https://openalex.org/I884043246","display_name":"Hamburg University of Technology","ror":"https://ror.org/04bs1pb34","country_code":"DE","type":"education","lineage":["https://openalex.org/I884043246"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Johannes Hinckeldeyn","raw_affiliation_strings":["Institute for Technical Logistics, Hamburg University of Technology, 21079 Hamburg, Germany"],"raw_orcid":"https://orcid.org/0000-0001-9823-7679","affiliations":[{"raw_affiliation_string":"Institute for Technical Logistics, Hamburg University of Technology, 21079 Hamburg, Germany","institution_ids":["https://openalex.org/I159176309","https://openalex.org/I884043246"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5031300298","display_name":"Jochen Kreutzfeldt","orcid":"https://orcid.org/0000-0003-3648-576X"},"institutions":[{"id":"https://openalex.org/I159176309","display_name":"Universit\u00e4t Hamburg","ror":"https://ror.org/00g30e956","country_code":"DE","type":"education","lineage":["https://openalex.org/I159176309"]},{"id":"https://openalex.org/I884043246","display_name":"Hamburg University of Technology","ror":"https://ror.org/04bs1pb34","country_code":"DE","type":"education","lineage":["https://openalex.org/I884043246"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Jochen Kreutzfeldt","raw_affiliation_strings":["Institute for Technical Logistics, Hamburg University of Technology, 21079 Hamburg, Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute for Technical Logistics, Hamburg University of Technology, 21079 Hamburg, Germany","institution_ids":["https://openalex.org/I159176309","https://openalex.org/I884043246"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5026833974","https://openalex.org/A5031300298","https://openalex.org/A5032107440"],"corresponding_institution_ids":["https://openalex.org/I159176309","https://openalex.org/I884043246"],"apc_list":{"value":1600,"currency":"CHF","value_usd":1732},"apc_paid":{"value":1773,"currency":"EUR","value_usd":1912},"fwci":1.3873,"has_fulltext":true,"cited_by_count":11,"citation_normalized_percentile":{"value":0.84311638,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":98},"biblio":{"volume":"11","issue":"5","first_page":"85","last_page":"85"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11942","display_name":"Transportation and Mobility Innovations","score":0.9944999814033508,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10524","display_name":"Traffic control and management","score":0.9925000071525574,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8280061483383179},{"id":"https://openalex.org/keywords/heuristics","display_name":"Heuristics","score":0.7092437744140625},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6849954128265381},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.6336816549301147},{"id":"https://openalex.org/keywords/mobile-robot","display_name":"Mobile robot","score":0.6232610940933228},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.47862520813941956},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.44242382049560547},{"id":"https://openalex.org/keywords/range","display_name":"Range (aeronautics)","score":0.4150521159172058},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.41261568665504456},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.39711228013038635},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.37635719776153564},{"id":"https://openalex.org/keywords/industrial-engineering","display_name":"Industrial engineering","score":0.369829922914505},{"id":"https://openalex.org/keywords/operations-research","display_name":"Operations research","score":0.3337708115577698},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.1684006154537201},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.10404223203659058}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8280061483383179},{"id":"https://openalex.org/C127705205","wikidata":"https://www.wikidata.org/wiki/Q5748245","display_name":"Heuristics","level":2,"score":0.7092437744140625},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6849954128265381},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.6336816549301147},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.6232610940933228},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.47862520813941956},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.44242382049560547},{"id":"https://openalex.org/C204323151","wikidata":"https://www.wikidata.org/wiki/Q905424","display_name":"Range (aeronautics)","level":2,"score":0.4150521159172058},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.41261568665504456},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.39711228013038635},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.37635719776153564},{"id":"https://openalex.org/C13736549","wikidata":"https://www.wikidata.org/wiki/Q4489420","display_name":"Industrial engineering","level":1,"score":0.369829922914505},{"id":"https://openalex.org/C42475967","wikidata":"https://www.wikidata.org/wiki/Q194292","display_name":"Operations research","level":1,"score":0.3337708115577698},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.1684006154537201},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.10404223203659058},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C146978453","wikidata":"https://www.wikidata.org/wiki/Q3798668","display_name":"Aerospace engineering","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.3390/robotics11050085","is_oa":true,"landing_page_url":"https://doi.org/10.3390/robotics11050085","pdf_url":"https://www.mdpi.com/2218-6581/11/5/85/pdf?version=1663926726","source":{"id":"https://openalex.org/S4210232487","display_name":"Robotics","issn_l":"2218-6581","issn":["2218-6581"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Robotics","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:0f8cf1fb7c8443d483c989ce810be135","is_oa":true,"landing_page_url":"https://doaj.org/article/0f8cf1fb7c8443d483c989ce810be135","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Robotics, Vol 11, Iss 5, p 85 (2022)","raw_type":"article"},{"id":"pmh:oai:mdpi.com:/2218-6581/11/5/85/","is_oa":true,"landing_page_url":"https://dx.doi.org/10.3390/robotics11050085","pdf_url":null,"source":{"id":"https://openalex.org/S4306400947","display_name":"MDPI (MDPI AG)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210097602","host_organization_name":"Multidisciplinary Digital Publishing Institute (Switzerland)","host_organization_lineage":["https://openalex.org/I4210097602"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Robotics; Volume 11; Issue 5; Pages: 85","raw_type":"Text"},{"id":"pmh:oai:null:11420/13625","is_oa":true,"landing_page_url":"http://hdl.handle.net/11420/13625","pdf_url":null,"source":{"id":"https://openalex.org/S4306401751","display_name":"tub.dok (Hamburg University of Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I884043246","host_organization_name":"Hamburg University of Technology","host_organization_lineage":["https://openalex.org/I884043246"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Journal Article"}],"best_oa_location":{"id":"doi:10.3390/robotics11050085","is_oa":true,"landing_page_url":"https://doi.org/10.3390/robotics11050085","pdf_url":"https://www.mdpi.com/2218-6581/11/5/85/pdf?version=1663926726","source":{"id":"https://openalex.org/S4210232487","display_name":"Robotics","issn_l":"2218-6581","issn":["2218-6581"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Robotics","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.5799999833106995,"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure"}],"awards":[{"id":"https://openalex.org/G4093464883","display_name":null,"funder_award_id":"491268466","funder_id":"https://openalex.org/F4320320879","funder_display_name":"Deutsche Forschungsgemeinschaft"}],"funders":[{"id":"https://openalex.org/F4320320879","display_name":"Deutsche Forschungsgemeinschaft","ror":"https://ror.org/018mejw64"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4293715378.pdf","grobid_xml":"https://content.openalex.org/works/W4293715378.grobid-xml"},"referenced_works_count":77,"referenced_works":["https://openalex.org/W1929098649","https://openalex.org/W2060914855","https://openalex.org/W2136360478","https://openalex.org/W2168359464","https://openalex.org/W2485734267","https://openalex.org/W2737529802","https://openalex.org/W2772589676","https://openalex.org/W2794034956","https://openalex.org/W2798885736","https://openalex.org/W2803208334","https://openalex.org/W2892258706","https://openalex.org/W2901645090","https://openalex.org/W2905345646","https://openalex.org/W2908261578","https://openalex.org/W2910509260","https://openalex.org/W2912063360","https://openalex.org/W2962764167","https://openalex.org/W2963809389","https://openalex.org/W2963821308","https://openalex.org/W2965996200","https://openalex.org/W2969277962","https://openalex.org/W2979712929","https://openalex.org/W2982312374","https://openalex.org/W2982316857","https://openalex.org/W2982475776","https://openalex.org/W2995249706","https://openalex.org/W3006677721","https://openalex.org/W3008944235","https://openalex.org/W3008967682","https://openalex.org/W3011810733","https://openalex.org/W3031798691","https://openalex.org/W3037478850","https://openalex.org/W3040817486","https://openalex.org/W3088197938","https://openalex.org/W3088310808","https://openalex.org/W3090027660","https://openalex.org/W3090254537","https://openalex.org/W3091872140","https://openalex.org/W3092786062","https://openalex.org/W3095315965","https://openalex.org/W3100153298","https://openalex.org/W3103635569","https://openalex.org/W3104036373","https://openalex.org/W3111582934","https://openalex.org/W3114657141","https://openalex.org/W3115476618","https://openalex.org/W3120778962","https://openalex.org/W3125505924","https://openalex.org/W3127511342","https://openalex.org/W3128055785","https://openalex.org/W3129616587","https://openalex.org/W3130088494","https://openalex.org/W3132589907","https://openalex.org/W3133734443","https://openalex.org/W3136037938","https://openalex.org/W3136908367","https://openalex.org/W3139298425","https://openalex.org/W3142049818","https://openalex.org/W3143346268","https://openalex.org/W3146487107","https://openalex.org/W3148405392","https://openalex.org/W3158253560","https://openalex.org/W3184116135","https://openalex.org/W3184217219","https://openalex.org/W3186835976","https://openalex.org/W3187410661","https://openalex.org/W3190290950","https://openalex.org/W3193052984","https://openalex.org/W3201099806","https://openalex.org/W3206082228","https://openalex.org/W4226536551","https://openalex.org/W4245916969","https://openalex.org/W4288374418","https://openalex.org/W6634544576","https://openalex.org/W6741312563","https://openalex.org/W6761443123","https://openalex.org/W6929389603"],"related_works":["https://openalex.org/W2280422768","https://openalex.org/W3143197806","https://openalex.org/W4252555497","https://openalex.org/W3121175838","https://openalex.org/W3016293053","https://openalex.org/W1690653314","https://openalex.org/W2401723157","https://openalex.org/W2065055572","https://openalex.org/W2784269775","https://openalex.org/W2952904874"],"abstract_inverted_index":{"Controlling":[0],"a":[1,9,71,83,119,135],"fleet":[2,108],"of":[3,12,61,74,89,91,96,107,110,149,159,168,173],"autonomous":[4],"mobile":[5],"robots":[6],"(AMR)":[7],"is":[8,65],"complex":[10,57],"problem":[11],"optimization.":[13],"Many":[14],"approached":[15],"have":[16],"been":[17],"conducted":[18],"for":[19,54,86],"solving":[20,55],"this":[21,62,97],"problem.":[22],"They":[23],"range":[24],"from":[25],"heuristics,":[26],"which":[27,37],"usually":[28],"do":[29],"not":[30],"find":[31],"an":[32],"optimum,":[33],"to":[34,41,77,114,133],"mathematical":[35],"models,":[36],"are":[38,102,116],"limited":[39],"due":[40],"their":[42],"high":[43],"computational":[44],"effort.":[45],"Machine":[46],"Learning":[47,68],"(ML)":[48],"methods":[49],"offer":[50],"another":[51],"potential":[52],"trajectory":[53],"such":[56],"problems.":[58],"The":[59],"focus":[60],"brief":[63],"survey":[64],"on":[66,128],"Reinforcement":[67],"(RL)":[69],"as":[70],"particular":[72],"type":[73],"ML.":[75],"Due":[76],"the":[78,87,94,105,129,142,147],"reward-based":[79],"optimization,":[80],"RL":[81,115],"offers":[82],"good":[84],"basis":[85],"control":[88,100,109],"fleets":[90,164],"AMR.":[92],"In":[93],"context":[95],"survey,":[98],"different":[99,157,166],"approaches":[101],"investigated":[103],"and":[104,170],"aspects":[106],"AMR":[111,169],"with":[112,165],"respect":[113],"evaluated.":[117],"As":[118],"result,":[120],"six":[121],"fundamental":[122],"key":[123],"problems":[124],"should":[125],"be":[126],"put":[127],"current":[130],"research":[131],"agenda":[132],"enable":[134],"broader":[136],"application":[137],"in":[138],"industry:":[139],"(1)":[140],"overcoming":[141],"\u201csim-to-real":[143],"gap\u201d,":[144],"(2)":[145],"increasing":[146],"robustness":[148],"algorithms,":[150],"(3)":[151],"improving":[152],"data":[153],"efficiency,":[154],"(4)":[155],"integrating":[156],"fields":[158],"application,":[160],"(5)":[161],"enabling":[162],"heterogeneous":[163],"types":[167],"(6)":[171],"handling":[172],"deadlocks.":[174]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":5}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2022-08-31T00:00:00"}
