{"id":"https://openalex.org/W4280633672","doi":"https://doi.org/10.1007/s10489-022-03550-z","title":"Towards designing a generic and comprehensive deep reinforcement learning framework","display_name":"Towards designing a generic and comprehensive deep reinforcement learning framework","publication_year":2022,"publication_date":"2022-05-19","ids":{"openalex":"https://openalex.org/W4280633672","doi":"https://doi.org/10.1007/s10489-022-03550-z"},"language":"en","primary_location":{"id":"doi:10.1007/s10489-022-03550-z","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10489-022-03550-z","pdf_url":null,"source":{"id":"https://openalex.org/S74726891","display_name":"Applied Intelligence","issn_l":"0924-669X","issn":["0924-669X","1573-7497"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Applied Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://doi.org/10.1007/s10489-022-03550-z","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103235317","display_name":"Ngoc Duy Nguyen","orcid":"https://orcid.org/0000-0002-4052-5819"},"institutions":[{"id":"https://openalex.org/I149704539","display_name":"Deakin University","ror":"https://ror.org/02czsnj07","country_code":"AU","type":"education","lineage":["https://openalex.org/I149704539"]}],"countries":["AU"],"is_corresponding":true,"raw_author_name":"Ngoc Duy Nguyen","raw_affiliation_strings":["Institute for Intelligent Systems Research and Innovation, Deakin University, Geelong, 3220, Victoria, Australia"],"raw_orcid":"https://orcid.org/0000-0002-4052-5819","affiliations":[{"raw_affiliation_string":"Institute for Intelligent Systems Research and Innovation, Deakin University, Geelong, 3220, Victoria, Australia","institution_ids":["https://openalex.org/I149704539"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085593383","display_name":"Thanh Thi Nguyen","orcid":"https://orcid.org/0000-0001-9709-1663"},"institutions":[{"id":"https://openalex.org/I149704539","display_name":"Deakin University","ror":"https://ror.org/02czsnj07","country_code":"AU","type":"education","lineage":["https://openalex.org/I149704539"]},{"id":"https://openalex.org/I40347166","display_name":"University of Chicago","ror":"https://ror.org/024mw5h28","country_code":"US","type":"education","lineage":["https://openalex.org/I40347166"]}],"countries":["AU","US"],"is_corresponding":false,"raw_author_name":"Thanh Thi Nguyen","raw_affiliation_strings":["Center for Translational Data Science, University of Chicago, Street, Chicago, 60615, IL, USA","School of Information Technology, Deakin University, Melbourne, 3002, Victoria, Australia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Center for Translational Data Science, University of Chicago, Street, Chicago, 60615, IL, USA","institution_ids":["https://openalex.org/I40347166"]},{"raw_affiliation_string":"School of Information Technology, Deakin University, Melbourne, 3002, Victoria, Australia","institution_ids":["https://openalex.org/I149704539"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091402542","display_name":"Nhat Truong Pham","orcid":"https://orcid.org/0000-0002-8086-6722"},"institutions":[{"id":"https://openalex.org/I141445968","display_name":"Ton Duc Thang University","ror":"https://ror.org/01drq0835","country_code":"VN","type":"education","lineage":["https://openalex.org/I141445968"]}],"countries":["VN"],"is_corresponding":false,"raw_author_name":"Nhat Truong Pham","raw_affiliation_strings":["Division of Computational Mechatronics, Institute for Computational Science, Ton Duc Thang University, Ho Chi Minh City, 72915, Vietnam","Faculty of Electrical and Electronics Engineering, Ton Duc Thang University, Ho Chi Minh City, 72915, Vietnam"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Division of Computational Mechatronics, Institute for Computational Science, Ton Duc Thang University, Ho Chi Minh City, 72915, Vietnam","institution_ids":["https://openalex.org/I141445968"]},{"raw_affiliation_string":"Faculty of Electrical and Electronics Engineering, Ton Duc Thang University, Ho Chi Minh City, 72915, Vietnam","institution_ids":["https://openalex.org/I141445968"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037305946","display_name":"Van\u2010Dinh Nguyen","orcid":"https://orcid.org/0000-0002-9575-1063"},"institutions":[{"id":"https://openalex.org/I12912129","display_name":"Northeastern University","ror":"https://ror.org/04t5xt781","country_code":"US","type":"education","lineage":["https://openalex.org/I12912129"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Hai Nguyen","raw_affiliation_strings":["Khoury College of Computer Sciences, Northeastern University, Boston, 02115, MA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Khoury College of Computer Sciences, Northeastern University, Boston, 02115, MA, USA","institution_ids":["https://openalex.org/I12912129"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091716031","display_name":"Dang Tu Nguyen","orcid":null},"institutions":[{"id":"https://openalex.org/I1311688040","display_name":"Amazon (United States)","ror":"https://ror.org/04mv4n011","country_code":"US","type":"company","lineage":["https://openalex.org/I1311688040"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Dang Tu Nguyen","raw_affiliation_strings":["Amazon Web Services, Seattle, 98144, WA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Amazon Web Services, Seattle, 98144, WA, USA","institution_ids":["https://openalex.org/I1311688040"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5104857673","display_name":"Thanh Dang Nguyen","orcid":"https://orcid.org/0000-0002-9844-9345"},"institutions":[{"id":"https://openalex.org/I149704539","display_name":"Deakin University","ror":"https://ror.org/02czsnj07","country_code":"AU","type":"education","lineage":["https://openalex.org/I149704539"]},{"id":"https://openalex.org/I40347166","display_name":"University of Chicago","ror":"https://ror.org/024mw5h28","country_code":"US","type":"education","lineage":["https://openalex.org/I40347166"]}],"countries":["AU","US"],"is_corresponding":false,"raw_author_name":"Thanh Dang Nguyen","raw_affiliation_strings":["Center for Translational Data Science, University of Chicago, Street, Chicago, 60615, IL, USA","School of Information Technology, Deakin University, Melbourne, 3002, Victoria, Australia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Center for Translational Data Science, University of Chicago, Street, Chicago, 60615, IL, USA","institution_ids":["https://openalex.org/I40347166"]},{"raw_affiliation_string":"School of Information Technology, Deakin University, Melbourne, 3002, Victoria, Australia","institution_ids":["https://openalex.org/I149704539"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072923302","display_name":"Chee Peng Lim","orcid":"https://orcid.org/0000-0003-4191-9083"},"institutions":[{"id":"https://openalex.org/I149704539","display_name":"Deakin University","ror":"https://ror.org/02czsnj07","country_code":"AU","type":"education","lineage":["https://openalex.org/I149704539"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Chee Peng Lim","raw_affiliation_strings":["Institute for Intelligent Systems Research and Innovation, Deakin University, Geelong, 3220, Victoria, Australia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute for Intelligent Systems Research and Innovation, Deakin University, Geelong, 3220, Victoria, Australia","institution_ids":["https://openalex.org/I149704539"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000102507","display_name":"Michael Johnstone","orcid":"https://orcid.org/0000-0002-3005-8911"},"institutions":[{"id":"https://openalex.org/I149704539","display_name":"Deakin University","ror":"https://ror.org/02czsnj07","country_code":"AU","type":"education","lineage":["https://openalex.org/I149704539"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Michael Johnstone","raw_affiliation_strings":["Institute for Intelligent Systems Research and Innovation, Deakin University, Geelong, 3220, Victoria, Australia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute for Intelligent Systems Research and Innovation, Deakin University, Geelong, 3220, Victoria, Australia","institution_ids":["https://openalex.org/I149704539"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040015457","display_name":"Asim Bhatti","orcid":"https://orcid.org/0000-0001-6876-1437"},"institutions":[{"id":"https://openalex.org/I149704539","display_name":"Deakin University","ror":"https://ror.org/02czsnj07","country_code":"AU","type":"education","lineage":["https://openalex.org/I149704539"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Asim Bhatti","raw_affiliation_strings":["Institute for Intelligent Systems Research and Innovation, Deakin University, Geelong, 3220, Victoria, Australia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute for Intelligent Systems Research and Innovation, Deakin University, Geelong, 3220, Victoria, Australia","institution_ids":["https://openalex.org/I149704539"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046519614","display_name":"Douglas Creighton","orcid":"https://orcid.org/0000-0002-9217-1231"},"institutions":[{"id":"https://openalex.org/I149704539","display_name":"Deakin University","ror":"https://ror.org/02czsnj07","country_code":"AU","type":"education","lineage":["https://openalex.org/I149704539"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Douglas Creighton","raw_affiliation_strings":["Institute for Intelligent Systems Research and Innovation, Deakin University, Geelong, 3220, Victoria, Australia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute for Intelligent Systems Research and Innovation, Deakin University, Geelong, 3220, Victoria, Australia","institution_ids":["https://openalex.org/I149704539"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5015293969","display_name":"Saeid Nahavandi","orcid":"https://orcid.org/0000-0002-0360-5270"},"institutions":[{"id":"https://openalex.org/I149704539","display_name":"Deakin University","ror":"https://ror.org/02czsnj07","country_code":"AU","type":"education","lineage":["https://openalex.org/I149704539"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Saeid Nahavandi","raw_affiliation_strings":["Institute for Intelligent Systems Research and Innovation, Deakin University, Geelong, 3220, Victoria, Australia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute for Intelligent Systems Research and Innovation, Deakin University, Geelong, 3220, Victoria, Australia","institution_ids":["https://openalex.org/I149704539"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":11,"corresponding_author_ids":["https://openalex.org/A5103235317"],"corresponding_institution_ids":["https://openalex.org/I149704539"],"apc_list":{"value":2390,"currency":"EUR","value_usd":2990},"apc_paid":{"value":2390,"currency":"EUR","value_usd":2990},"fwci":1.9115,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.88518398,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":"53","issue":"3","first_page":"2967","last_page":"2988"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10639","display_name":"Advanced Software Engineering Methodologies","score":0.9905999898910522,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8976566791534424},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8494629859924316},{"id":"https://openalex.org/keywords/agile-software-development","display_name":"Agile software development","score":0.6524617671966553},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6435336470603943},{"id":"https://openalex.org/keywords/flexibility","display_name":"Flexibility (engineering)","score":0.5851738452911377},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5789819955825806},{"id":"https://openalex.org/keywords/architecture","display_name":"Architecture","score":0.5076123476028442},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.47303029894828796},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.44187361001968384},{"id":"https://openalex.org/keywords/agent-architecture","display_name":"Agent architecture","score":0.44108232855796814},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.43257009983062744},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.41060927510261536},{"id":"https://openalex.org/keywords/intelligent-agent","display_name":"Intelligent agent","score":0.3813649117946625},{"id":"https://openalex.org/keywords/software-engineering","display_name":"Software engineering","score":0.3754640221595764},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.32094788551330566}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8976566791534424},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8494629859924316},{"id":"https://openalex.org/C14185376","wikidata":"https://www.wikidata.org/wiki/Q30232","display_name":"Agile software development","level":2,"score":0.6524617671966553},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6435336470603943},{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.5851738452911377},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5789819955825806},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.5076123476028442},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.47303029894828796},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.44187361001968384},{"id":"https://openalex.org/C137703981","wikidata":"https://www.wikidata.org/wiki/Q4692093","display_name":"Agent architecture","level":3,"score":0.44108232855796814},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.43257009983062744},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.41060927510261536},{"id":"https://openalex.org/C74072328","wikidata":"https://www.wikidata.org/wiki/Q1142726","display_name":"Intelligent agent","level":2,"score":0.3813649117946625},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.3754640221595764},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.32094788551330566},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C153349607","wikidata":"https://www.wikidata.org/wiki/Q36649","display_name":"Visual arts","level":1,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1007/s10489-022-03550-z","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10489-022-03550-z","pdf_url":null,"source":{"id":"https://openalex.org/S74726891","display_name":"Applied Intelligence","issn_l":"0924-669X","issn":["0924-669X","1573-7497"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Applied Intelligence","raw_type":"journal-article"},{"id":"pmh:oai:dro.deakin.edu.au:DU:30170170","is_oa":false,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4306401102","display_name":"Own your potential (DEAKIN)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I149704539","host_organization_name":"Deakin University","host_organization_lineage":["https://openalex.org/I149704539"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Journal Article"},{"id":"pmh:oai:figshare.com:article/21063802","is_oa":true,"landing_page_url":"https://figshare.com/articles/journal_contribution/Towards_designing_a_generic_and_comprehensive_deep_reinforcement_learning_framework/21063802","pdf_url":null,"source":{"id":"https://openalex.org/S4377196282","display_name":"Figshare","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210132348","host_organization_name":"Figshare (United Kingdom)","host_organization_lineage":["https://openalex.org/I4210132348"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Text"}],"best_oa_location":{"id":"doi:10.1007/s10489-022-03550-z","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10489-022-03550-z","pdf_url":null,"source":{"id":"https://openalex.org/S74726891","display_name":"Applied Intelligence","issn_l":"0924-669X","issn":["0924-669X","1573-7497"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Applied Intelligence","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/9","score":0.49000000953674316,"display_name":"Industry, innovation and infrastructure"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320320970","display_name":"Deakin University","ror":"https://ror.org/02czsnj07"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":71,"referenced_works":["https://openalex.org/W1518858799","https://openalex.org/W1542791059","https://openalex.org/W1592847719","https://openalex.org/W1949804828","https://openalex.org/W1981025032","https://openalex.org/W1981276685","https://openalex.org/W1982262386","https://openalex.org/W1998649829","https://openalex.org/W2012204020","https://openalex.org/W2012612381","https://openalex.org/W2026653933","https://openalex.org/W2041367235","https://openalex.org/W2099397840","https://openalex.org/W2102660061","https://openalex.org/W2107544712","https://openalex.org/W2126316555","https://openalex.org/W2128453677","https://openalex.org/W2141481921","https://openalex.org/W2145339207","https://openalex.org/W2150468603","https://openalex.org/W2158782408","https://openalex.org/W2161009228","https://openalex.org/W2170480356","https://openalex.org/W2172968643","https://openalex.org/W2257979135","https://openalex.org/W2292533394","https://openalex.org/W2296073425","https://openalex.org/W2546571074","https://openalex.org/W2559655401","https://openalex.org/W2560647685","https://openalex.org/W2583993537","https://openalex.org/W2604272474","https://openalex.org/W2604618034","https://openalex.org/W2612690371","https://openalex.org/W2746553466","https://openalex.org/W2761873684","https://openalex.org/W2768629321","https://openalex.org/W2768919152","https://openalex.org/W2787933113","https://openalex.org/W2788125442","https://openalex.org/W2790759781","https://openalex.org/W2810602713","https://openalex.org/W2901112449","https://openalex.org/W2908261578","https://openalex.org/W2911495555","https://openalex.org/W2945911335","https://openalex.org/W2952298682","https://openalex.org/W2963523627","https://openalex.org/W2963658727","https://openalex.org/W2963934958","https://openalex.org/W2999905431","https://openalex.org/W3010954320","https://openalex.org/W3035574064","https://openalex.org/W3099518626","https://openalex.org/W3100944043","https://openalex.org/W3103752844","https://openalex.org/W3126321819","https://openalex.org/W3159966224","https://openalex.org/W3199357765","https://openalex.org/W3205516620","https://openalex.org/W3205830537","https://openalex.org/W4205779441","https://openalex.org/W4214717370","https://openalex.org/W4246262524","https://openalex.org/W6602539713","https://openalex.org/W6603593944","https://openalex.org/W6604977742","https://openalex.org/W6608803649","https://openalex.org/W6610860872","https://openalex.org/W6814003322","https://openalex.org/W6829155664"],"related_works":["https://openalex.org/W2364921833","https://openalex.org/W4380075502","https://openalex.org/W2385146268","https://openalex.org/W4223943233","https://openalex.org/W4312200629","https://openalex.org/W4360585206","https://openalex.org/W4364306694","https://openalex.org/W4380086463","https://openalex.org/W4225161397","https://openalex.org/W3014300295"],"abstract_inverted_index":{"Abstract":[0],"Reinforcement":[1],"learning":[2,41],"(RL)":[3],"has":[4,29],"emerged":[5],"as":[6,64],"an":[7,12],"effective":[8],"approach":[9],"for":[10],"building":[11],"intelligent":[13],"system,":[14],"which":[15,146],"involves":[16],"multiple":[17],"self-operated":[18],"agents":[19],"to":[20,47,101],"collectively":[21],"accomplish":[22],"a":[23,31,78,86,91,99,103,108,125,130,159,181,185],"designated":[24],"task.":[25],"More":[26],"importantly,":[27],"there":[28,53],"been":[30],"renewed":[32],"focus":[33],"on":[34,180],"RL":[35,45,94,105,183],"since":[36],"the":[37,60,114,135,173,188,193],"introduction":[38],"of":[39,143,190,195],"deep":[40,93,126,160],"that":[42,82,163],"essentially":[43],"makes":[44],"feasible":[46],"operate":[48],"in":[49,59,73,89,107,150],"high-dimensional":[50],"environments.":[51,153],"However,":[52],"are":[54],"many":[55],"diversified":[56],"research":[57],"directions":[58],"current":[61],"literature,":[62],"such":[63],"multi-agent":[65],"and":[66,69,138,168],"multi-objective":[67],"learning,":[68],"human-machine":[70],"interactions.":[71],"Therefore,":[72],"this":[74,155],"paper,":[75],"we":[76,157],"propose":[77],"comprehensive":[79],"software":[80,117,144],"architecture":[81,95,175],"not":[83,178],"only":[84],"plays":[85],"vital":[87],"role":[88],"designing":[90,124],"connect-the-dots":[92],"but":[96],"also":[97,176],"provides":[98],"guideline":[100],"develop":[102],"realistic":[104],"application":[106],"short":[109],"time":[110],"span.":[111],"By":[112],"inheriting":[113],"proposed":[115,174],"architecture,":[116],"managers":[118],"can":[119,133],"foresee":[120],"any":[121],"challenges":[122],"when":[123],"RL-based":[127,161],"system.":[128],"As":[129],"result,":[131],"they":[132],"expedite":[134],"design":[136,158],"process":[137],"actively":[139],"control":[140],"every":[141],"stage":[142],"development,":[145],"is":[147],"especially":[148],"critical":[149],"agile":[151],"development":[152],"For":[154],"reason,":[156],"framework":[162],"strictly":[164],"ensures":[165],"flexibility,":[166],"robustness,":[167],"scalability.":[169],"To":[170],"enforce":[171],"generalization,":[172],"does":[177],"depend":[179],"specific":[182],"algorithm,":[184],"network":[186],"configuration,":[187],"number":[189],"agents,":[191],"or":[192],"type":[194],"agents.":[196]},"counts_by_year":[{"year":2025,"cited_by_count":5},{"year":2024,"cited_by_count":1}],"updated_date":"2026-05-21T06:26:12.895304","created_date":"2025-10-10T00:00:00"}
