{"id":"https://openalex.org/W7084145714","doi":"https://doi.org/10.1109/case58245.2025.11164102","title":"Optimal Multi-agent Reinforcement Learning for Efficient Partially Observable Multi-robot Collaboration in Warehousing","display_name":"Optimal Multi-agent Reinforcement Learning for Efficient Partially Observable Multi-robot Collaboration in Warehousing","publication_year":2025,"publication_date":"2025-08-17","ids":{"openalex":"https://openalex.org/W7084145714","doi":"https://doi.org/10.1109/case58245.2025.11164102"},"language":"en","primary_location":{"id":"doi:10.1109/case58245.2025.11164102","is_oa":false,"landing_page_url":"https://doi.org/10.1109/case58245.2025.11164102","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE 21st International Conference on Automation Science and Engineering (CASE)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Muhammad Naveed Abbas","orcid":null},"institutions":[{"id":"https://openalex.org/I151939572","display_name":"Athlone Institute of Technology","ror":"https://ror.org/02dyxwz31","country_code":"IE","type":"education","lineage":["https://openalex.org/I151939572"]}],"countries":["IE"],"is_corresponding":true,"raw_author_name":"Muhammad Naveed Abbas","raw_affiliation_strings":["Technological University of the Shannon: Midlands Midwest,Software Research Institute,Athlone,Ireland,N37 HD68"],"affiliations":[{"raw_affiliation_string":"Technological University of the Shannon: Midlands Midwest,Software Research Institute,Athlone,Ireland,N37 HD68","institution_ids":["https://openalex.org/I151939572"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Paul Liston","orcid":null},"institutions":[{"id":"https://openalex.org/I4210093818","display_name":"Midwest University","ror":"https://ror.org/00jxpy231","country_code":"US","type":"education","lineage":["https://openalex.org/I4210093818"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Paul Liston","raw_affiliation_strings":["Technological University of the Shannon: Midlands Midwest,Faculty of Business and Hospitality,Athlone,Ireland,N37 HD68"],"affiliations":[{"raw_affiliation_string":"Technological University of the Shannon: Midlands Midwest,Faculty of Business and Hospitality,Athlone,Ireland,N37 HD68","institution_ids":["https://openalex.org/I4210093818"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Brian Lee","orcid":null},"institutions":[{"id":"https://openalex.org/I151939572","display_name":"Athlone Institute of Technology","ror":"https://ror.org/02dyxwz31","country_code":"IE","type":"education","lineage":["https://openalex.org/I151939572"]}],"countries":["IE"],"is_corresponding":false,"raw_author_name":"Brian Lee","raw_affiliation_strings":["Technological University of the Shannon: Midlands Midwest,Software Research Institute,Athlone,Ireland,N37 HD68"],"affiliations":[{"raw_affiliation_string":"Technological University of the Shannon: Midlands Midwest,Software Research Institute,Athlone,Ireland,N37 HD68","institution_ids":["https://openalex.org/I151939572"]}]},{"author_position":"last","author":{"id":null,"display_name":"Yuansong Qiao","orcid":null},"institutions":[{"id":"https://openalex.org/I151939572","display_name":"Athlone Institute of Technology","ror":"https://ror.org/02dyxwz31","country_code":"IE","type":"education","lineage":["https://openalex.org/I151939572"]}],"countries":["IE"],"is_corresponding":false,"raw_author_name":"Yuansong Qiao","raw_affiliation_strings":["Technological University of the Shannon: Midlands Midwest,Software Research Institute,Athlone,Ireland,N37 HD68"],"affiliations":[{"raw_affiliation_string":"Technological University of the Shannon: Midlands Midwest,Software Research Institute,Athlone,Ireland,N37 HD68","institution_ids":["https://openalex.org/I151939572"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I151939572"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.42273136,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"2188","last_page":"2193"},"is_retracted":false,"is_paratext":false,"is_xpac":true,"primary_topic":{"id":"https://openalex.org/T10626","display_name":"High-Temperature Coating Behaviors","score":0.3264999985694885,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10626","display_name":"High-Temperature Coating Behaviors","score":0.3264999985694885,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11143","display_name":"High Entropy Alloys Studies","score":0.26989999413490295,"subfield":{"id":"https://openalex.org/subfields/2210","display_name":"Mechanical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12099","display_name":"Advanced materials and composites","score":0.1738000065088272,"subfield":{"id":"https://openalex.org/subfields/2210","display_name":"Mechanical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.843999981880188},{"id":"https://openalex.org/keywords/observability","display_name":"Observability","score":0.7328000068664551},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6899999976158142},{"id":"https://openalex.org/keywords/adaptability","display_name":"Adaptability","score":0.6306999921798706},{"id":"https://openalex.org/keywords/visibility","display_name":"Visibility","score":0.4968000054359436},{"id":"https://openalex.org/keywords/dashboard","display_name":"Dashboard","score":0.4717000126838684},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.42829999327659607},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.4203999936580658}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.843999981880188},{"id":"https://openalex.org/C36299963","wikidata":"https://www.wikidata.org/wiki/Q1369844","display_name":"Observability","level":2,"score":0.7328000068664551},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6899999976158142},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6733999848365784},{"id":"https://openalex.org/C177606310","wikidata":"https://www.wikidata.org/wiki/Q5674297","display_name":"Adaptability","level":2,"score":0.6306999921798706},{"id":"https://openalex.org/C123403432","wikidata":"https://www.wikidata.org/wiki/Q654068","display_name":"Visibility","level":2,"score":0.4968000054359436},{"id":"https://openalex.org/C33499554","wikidata":"https://www.wikidata.org/wiki/Q1417134","display_name":"Dashboard","level":2,"score":0.4717000126838684},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.42829999327659607},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4269999861717224},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.4203999936580658},{"id":"https://openalex.org/C182306322","wikidata":"https://www.wikidata.org/wiki/Q1779371","display_name":"Order (exchange)","level":2,"score":0.4104999899864197},{"id":"https://openalex.org/C2777386808","wikidata":"https://www.wikidata.org/wiki/Q5254078","display_name":"Delivery Performance","level":2,"score":0.40290001034736633},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.38119998574256897},{"id":"https://openalex.org/C17098449","wikidata":"https://www.wikidata.org/wiki/Q176814","display_name":"Partially observable Markov decision process","level":4,"score":0.3619000017642975},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.329800009727478},{"id":"https://openalex.org/C2777735758","wikidata":"https://www.wikidata.org/wiki/Q817765","display_name":"Path (computing)","level":2,"score":0.30300000309944153},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.30059999227523804},{"id":"https://openalex.org/C48209547","wikidata":"https://www.wikidata.org/wiki/Q1331104","display_name":"Controllability","level":2,"score":0.2937999963760376},{"id":"https://openalex.org/C42475967","wikidata":"https://www.wikidata.org/wiki/Q194292","display_name":"Operations research","level":1,"score":0.29170000553131104},{"id":"https://openalex.org/C2778963849","wikidata":"https://www.wikidata.org/wiki/Q1473552","display_name":"Order fulfillment","level":3,"score":0.28119999170303345},{"id":"https://openalex.org/C112758219","wikidata":"https://www.wikidata.org/wiki/Q16038819","display_name":"Duration (music)","level":2,"score":0.2759999930858612},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.27489998936653137},{"id":"https://openalex.org/C120936955","wikidata":"https://www.wikidata.org/wiki/Q2155640","display_name":"Empirical research","level":2,"score":0.26669999957084656},{"id":"https://openalex.org/C2780695315","wikidata":"https://www.wikidata.org/wiki/Q3799040","display_name":"Unobservable","level":2,"score":0.2635999917984009},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.2583000063896179},{"id":"https://openalex.org/C123197309","wikidata":"https://www.wikidata.org/wiki/Q2882343","display_name":"Multi-armed bandit","level":3,"score":0.2502000033855438}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/case58245.2025.11164102","is_oa":false,"landing_page_url":"https://doi.org/10.1109/case58245.2025.11164102","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE 21st International Conference on Automation Science and Engineering (CASE)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":21,"referenced_works":["https://openalex.org/W1557517019","https://openalex.org/W1641379095","https://openalex.org/W2093997643","https://openalex.org/W2099034771","https://openalex.org/W2145339207","https://openalex.org/W2515724774","https://openalex.org/W2908261578","https://openalex.org/W2963658727","https://openalex.org/W2970026324","https://openalex.org/W3088893925","https://openalex.org/W3163723204","https://openalex.org/W3175153969","https://openalex.org/W3211583675","https://openalex.org/W4226457030","https://openalex.org/W4296913591","https://openalex.org/W4381327650","https://openalex.org/W4383112356","https://openalex.org/W4386634446","https://openalex.org/W4392007398","https://openalex.org/W4404278397","https://openalex.org/W4405787902"],"related_works":[],"abstract_inverted_index":{"Efficient":[0],"collaboration":[1,67],"of":[2,22,64,109],"autonomous":[3,65],"mobile":[4],"robots":[5],"or":[6],"multi-robots":[7],"in":[8,12,54,134],"order":[9,51],"fulfillment":[10,52],"tasks":[11],"warehouses":[13],"enhances":[14,117],"the":[15,19,23,62,73,110,115,130,135,142],"delivery":[16,35,74,127],"rate.":[17,36],"However,":[18],"limited":[20],"visibility":[21],"working":[24],"environment":[25,44],"and":[26,41,101,104,123],"varied":[27],"task":[28,137,144],"configurations":[29],"can":[30],"affect":[31],"their":[32],"throughput,":[33],"i.e.,":[34],"Multi-agent":[37],"reinforcement":[38],"learning":[39],"(MARL)":[40],"a":[42,58,92],"MARL":[43],"with":[45],"partial":[46,69],"observability":[47],"replicating":[48],"real-world":[49],"warehouse":[50],"tasks,":[53],"this":[55,80],"backdrop,":[56],"become":[57],"natural":[59],"choice":[60],"for":[61],"optimization":[63],"multi-robot":[66,78],"under":[68],"observability.":[70],"To":[71],"maximize":[72],"rate":[75,128],"through":[76],"efficient":[77],"collaboration,":[79],"research":[81],"proposes":[82],"Multi-Agent":[83],"Self-attention":[84,97],"Recurrent":[85,98],"Q-Learning":[86],"(MASRQL),":[87],"which":[88],"is":[89],"enabled":[90],"by":[91,119],"general-purpose":[93],"Q-function":[94],"approximator,":[95],"Deep":[96],"Q-Network":[99],"(DSRQN)":[100],"harnesses":[102],"self-attention":[103],"recurrence":[105],"mechanisms.":[106],"The":[107],"findings":[108],"empirical":[111],"analysis":[112],"corroborate":[113],"that":[114],"approach":[116],"efficiency":[118],"achieving":[120],"15.4%,":[121],"29%,":[122],"26.2%":[124],"more":[125],"average":[126],"than":[129],"closest":[131],"performing":[132],"baselines":[133],"respective":[136],"configurations,":[138],"showcasing":[139],"adaptability":[140],"to":[141],"varying":[143],"configurations.":[145]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
