{"id":"https://openalex.org/W4394755367","doi":"https://doi.org/10.3390/s24082461","title":"Reinforcement Learning Algorithms and Applications in Healthcare and Robotics: A Comprehensive and Systematic Review","display_name":"Reinforcement Learning Algorithms and Applications in Healthcare and Robotics: A Comprehensive and Systematic Review","publication_year":2024,"publication_date":"2024-04-11","ids":{"openalex":"https://openalex.org/W4394755367","doi":"https://doi.org/10.3390/s24082461","pmid":"https://pubmed.ncbi.nlm.nih.gov/38676080"},"language":"en","primary_location":{"id":"doi:10.3390/s24082461","is_oa":true,"landing_page_url":"https://doi.org/10.3390/s24082461","pdf_url":"https://www.mdpi.com/1424-8220/24/8/2461/pdf?version=1712902831","source":{"id":"https://openalex.org/S101949793","display_name":"Sensors","issn_l":"1424-8220","issn":["1424-8220"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Sensors","raw_type":"journal-article"},"type":"review","indexed_in":["crossref","doaj","pubmed"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.mdpi.com/1424-8220/24/8/2461/pdf?version=1712902831","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5024649129","display_name":"Mokhaled N. A. Al-Hamadani","orcid":"https://orcid.org/0000-0002-7042-3178"},"institutions":[{"id":"https://openalex.org/I132735039","display_name":"University of Debrecen","ror":"https://ror.org/02xf66n48","country_code":"HU","type":"education","lineage":["https://openalex.org/I132735039"]},{"id":"https://openalex.org/I4210143651","display_name":"Northern Technical University","ror":"https://ror.org/03ytenv10","country_code":"IQ","type":"education","lineage":["https://openalex.org/I4210143651"]}],"countries":["HU","IQ"],"is_corresponding":true,"raw_author_name":"Mokhaled Al-Hamadani","raw_affiliation_strings":["Department of Data Science and Visualization, Faculty of Informatics, University of Debrecen, H-4032 Debrecen, Hungary","Department of Electronic Techniques, Technical Institute/Alhawija, Northern Technical University, 36001 Kirkuk, Iraq","Doctoral School of Informatics, University of Debrecen, H-4032 Debrecen, Hungary"],"raw_orcid":"https://orcid.org/0000-0002-7042-3178","affiliations":[{"raw_affiliation_string":"Department of Data Science and Visualization, Faculty of Informatics, University of Debrecen, H-4032 Debrecen, Hungary","institution_ids":["https://openalex.org/I132735039"]},{"raw_affiliation_string":"Department of Electronic Techniques, Technical Institute/Alhawija, Northern Technical University, 36001 Kirkuk, Iraq","institution_ids":["https://openalex.org/I4210143651"]},{"raw_affiliation_string":"Doctoral School of Informatics, University of Debrecen, H-4032 Debrecen, Hungary","institution_ids":["https://openalex.org/I132735039"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090966997","display_name":"Mohammed A. Fadhel","orcid":"https://orcid.org/0000-0001-9877-049X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mohammed Fadhel","raw_affiliation_strings":["Research and Development Department, Akunah Company, Brisbane, QLD 4120, Australia"],"raw_orcid":"https://orcid.org/0000-0001-9877-049X","affiliations":[{"raw_affiliation_string":"Research and Development Department, Akunah Company, Brisbane, QLD 4120, Australia","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102889969","display_name":"Laith Alzubaidi","orcid":"https://orcid.org/0000-0002-7296-5413"},"institutions":[{"id":"https://openalex.org/I160993911","display_name":"Queensland University of Technology","ror":"https://ror.org/03pnv4752","country_code":"AU","type":"education","lineage":["https://openalex.org/I160993911"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Laith Alzubaidi","raw_affiliation_strings":["Centre for Data Science, Queensland University of Technology, Brisbane, QLD 4000, Australia","Research and Development Department, Akunah Company, Brisbane, QLD 4120, Australia","School of Mechanical, Medical, and Process Engineering, Queensland University of Technology, Brisbane, QLD 4000, Australia"],"raw_orcid":"https://orcid.org/0000-0002-7296-5413","affiliations":[{"raw_affiliation_string":"Centre for Data Science, Queensland University of Technology, Brisbane, QLD 4000, Australia","institution_ids":["https://openalex.org/I160993911"]},{"raw_affiliation_string":"Research and Development Department, Akunah Company, Brisbane, QLD 4120, Australia","institution_ids":[]},{"raw_affiliation_string":"School of Mechanical, Medical, and Process Engineering, Queensland University of Technology, Brisbane, QLD 4000, Australia","institution_ids":["https://openalex.org/I160993911"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5024867067","display_name":"Bal\u00e1zs Harangi","orcid":"https://orcid.org/0000-0003-4405-2040"},"institutions":[{"id":"https://openalex.org/I132735039","display_name":"University of Debrecen","ror":"https://ror.org/02xf66n48","country_code":"HU","type":"education","lineage":["https://openalex.org/I132735039"]}],"countries":["HU"],"is_corresponding":false,"raw_author_name":"Balazs Harangi","raw_affiliation_strings":["Department of Data Science and Visualization, Faculty of Informatics, University of Debrecen, H-4032 Debrecen, Hungary"],"raw_orcid":"https://orcid.org/0000-0003-4405-2040","affiliations":[{"raw_affiliation_string":"Department of Data Science and Visualization, Faculty of Informatics, University of Debrecen, H-4032 Debrecen, Hungary","institution_ids":["https://openalex.org/I132735039"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5024649129"],"corresponding_institution_ids":["https://openalex.org/I132735039","https://openalex.org/I4210143651"],"apc_list":{"value":2400,"currency":"CHF","value_usd":2598},"apc_paid":{"value":2400,"currency":"CHF","value_usd":2598},"fwci":24.6498,"has_fulltext":true,"cited_by_count":78,"citation_normalized_percentile":{"value":0.99673348,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":"24","issue":"8","first_page":"2461","last_page":"2461"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9610999822616577,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9610999822616577,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7215605974197388},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.719218373298645},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6568390727043152},{"id":"https://openalex.org/keywords/robotics","display_name":"Robotics","score":0.6159350872039795},{"id":"https://openalex.org/keywords/adaptability","display_name":"Adaptability","score":0.581032395362854},{"id":"https://openalex.org/keywords/transformative-learning","display_name":"Transformative learning","score":0.5806790590286255},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.4609030485153198},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.41570383310317993},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.35774940252304077}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7215605974197388},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.719218373298645},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6568390727043152},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.6159350872039795},{"id":"https://openalex.org/C177606310","wikidata":"https://www.wikidata.org/wiki/Q5674297","display_name":"Adaptability","level":2,"score":0.581032395362854},{"id":"https://openalex.org/C70587473","wikidata":"https://www.wikidata.org/wiki/Q7834111","display_name":"Transformative learning","level":2,"score":0.5806790590286255},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.4609030485153198},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.41570383310317993},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.35774940252304077},{"id":"https://openalex.org/C19417346","wikidata":"https://www.wikidata.org/wiki/Q7922","display_name":"Pedagogy","level":1,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0},{"id":"https://openalex.org/C18903297","wikidata":"https://www.wikidata.org/wiki/Q7150","display_name":"Ecology","level":1,"score":0.0}],"mesh":[{"descriptor_ui":"D000069550","descriptor_name":"Machine Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000069550","descriptor_name":"Machine Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000069550","descriptor_name":"Machine Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000069550","descriptor_name":"Machine Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000069550","descriptor_name":"Machine Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000069550","descriptor_name":"Machine Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D001185","descriptor_name":"Artificial Intelligence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D001185","descriptor_name":"Artificial Intelligence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D001185","descriptor_name":"Artificial Intelligence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D001185","descriptor_name":"Artificial Intelligence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D001185","descriptor_name":"Artificial Intelligence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D001185","descriptor_name":"Artificial Intelligence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D003695","descriptor_name":"Delivery of Health Care","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D003695","descriptor_name":"Delivery of Health Care","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D003695","descriptor_name":"Delivery of Health Care","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D003695","descriptor_name":"Delivery of Health Care","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D003695","descriptor_name":"Delivery of Health Care","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D003695","descriptor_name":"Delivery of Health Care","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D012371","descriptor_name":"Robotics","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D012371","descriptor_name":"Robotics","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D012371","descriptor_name":"Robotics","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D012371","descriptor_name":"Robotics","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D012371","descriptor_name":"Robotics","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D012371","descriptor_name":"Robotics","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true}],"locations_count":5,"locations":[{"id":"doi:10.3390/s24082461","is_oa":true,"landing_page_url":"https://doi.org/10.3390/s24082461","pdf_url":"https://www.mdpi.com/1424-8220/24/8/2461/pdf?version=1712902831","source":{"id":"https://openalex.org/S101949793","display_name":"Sensors","issn_l":"1424-8220","issn":["1424-8220"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Sensors","raw_type":"journal-article"},{"id":"pmid:38676080","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/38676080","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Sensors (Basel, Switzerland)","raw_type":null},{"id":"pmh:oai:pubmedcentral.nih.gov:11053800","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/11053800","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Sensors (Basel)","raw_type":"Text"},{"id":"pmh:oai:doaj.org/article:c97a86278b1e4ccd88a539b2b891fe13","is_oa":false,"landing_page_url":"https://doaj.org/article/c97a86278b1e4ccd88a539b2b891fe13","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Sensors, Vol 24, Iss 8, p 2461 (2024)","raw_type":"article"},{"id":"pmh:oai:eprints.qut.edu.au:248440","is_oa":false,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4306402607","display_name":"QUT ePrints (Queensland University of Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I160993911","host_organization_name":"Queensland University of Technology","host_organization_lineage":["https://openalex.org/I160993911"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Sensors","raw_type":"Contribution to Journal"}],"best_oa_location":{"id":"doi:10.3390/s24082461","is_oa":true,"landing_page_url":"https://doi.org/10.3390/s24082461","pdf_url":"https://www.mdpi.com/1424-8220/24/8/2461/pdf?version=1712902831","source":{"id":"https://openalex.org/S101949793","display_name":"Sensors","issn_l":"1424-8220","issn":["1424-8220"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Sensors","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4394755367.pdf","grobid_xml":"https://content.openalex.org/works/W4394755367.grobid-xml"},"referenced_works_count":97,"referenced_works":["https://openalex.org/W156236648","https://openalex.org/W163688550","https://openalex.org/W2001771035","https://openalex.org/W2017288068","https://openalex.org/W2056653303","https://openalex.org/W2148864095","https://openalex.org/W2169323873","https://openalex.org/W2257979135","https://openalex.org/W2334782222","https://openalex.org/W2514813345","https://openalex.org/W2548907142","https://openalex.org/W2593044849","https://openalex.org/W2755950973","https://openalex.org/W2768956845","https://openalex.org/W2784097471","https://openalex.org/W2794805762","https://openalex.org/W2794908468","https://openalex.org/W2901669506","https://openalex.org/W2911236815","https://openalex.org/W2921628782","https://openalex.org/W2963411833","https://openalex.org/W2965603252","https://openalex.org/W2965664886","https://openalex.org/W2968526727","https://openalex.org/W2978706708","https://openalex.org/W2981707302","https://openalex.org/W2990747716","https://openalex.org/W2999863957","https://openalex.org/W3000235744","https://openalex.org/W3008492644","https://openalex.org/W3023586494","https://openalex.org/W3033115783","https://openalex.org/W3041601928","https://openalex.org/W3046548984","https://openalex.org/W3081200565","https://openalex.org/W3081530595","https://openalex.org/W3088158297","https://openalex.org/W3088310808","https://openalex.org/W3090299930","https://openalex.org/W3090832565","https://openalex.org/W3093339224","https://openalex.org/W3096158155","https://openalex.org/W3100789280","https://openalex.org/W3101875589","https://openalex.org/W3105333898","https://openalex.org/W3109993998","https://openalex.org/W3114263192","https://openalex.org/W3117215073","https://openalex.org/W3120778962","https://openalex.org/W3121342653","https://openalex.org/W3126321819","https://openalex.org/W3127157414","https://openalex.org/W3127770912","https://openalex.org/W3130984490","https://openalex.org/W3132419770","https://openalex.org/W3133805463","https://openalex.org/W3134088580","https://openalex.org/W3140854437","https://openalex.org/W3159596580","https://openalex.org/W3162046098","https://openalex.org/W3164011142","https://openalex.org/W3177163453","https://openalex.org/W3188522443","https://openalex.org/W3198249268","https://openalex.org/W3199517312","https://openalex.org/W3207742429","https://openalex.org/W3209247505","https://openalex.org/W3216283008","https://openalex.org/W3216656735","https://openalex.org/W4200394939","https://openalex.org/W4206251897","https://openalex.org/W4210939259","https://openalex.org/W4212996499","https://openalex.org/W4224049613","https://openalex.org/W4224220194","https://openalex.org/W4224862098","https://openalex.org/W4283215509","https://openalex.org/W4291535767","https://openalex.org/W4306770046","https://openalex.org/W4308095592","https://openalex.org/W4311040084","https://openalex.org/W4311607213","https://openalex.org/W4312613808","https://openalex.org/W4313442619","https://openalex.org/W4316464918","https://openalex.org/W4318464334","https://openalex.org/W4320493509","https://openalex.org/W4320717566","https://openalex.org/W4324135233","https://openalex.org/W4362561002","https://openalex.org/W4362672763","https://openalex.org/W4377030106","https://openalex.org/W4377695283","https://openalex.org/W4384696745","https://openalex.org/W4387721759","https://openalex.org/W4389667056","https://openalex.org/W6684205842"],"related_works":["https://openalex.org/W2357124094","https://openalex.org/W2387399993","https://openalex.org/W2389739210","https://openalex.org/W2348924972","https://openalex.org/W2365736347","https://openalex.org/W2047454415","https://openalex.org/W2070040999","https://openalex.org/W2387293848","https://openalex.org/W2169196470","https://openalex.org/W2250140200"],"abstract_inverted_index":{"Reinforcement":[0],"learning":[1],"(RL)":[2],"has":[3,150],"emerged":[4],"as":[5,127],"a":[6,42,62,93,152,171],"dynamic":[7,23],"and":[8,22,39,64,70,83,114,122,130,162,182],"transformative":[9],"paradigm":[10],"in":[11,20,54,89,124,185],"artificial":[12],"intelligence,":[13],"offering":[14],"the":[15,79,141,157,163,177],"promise":[16],"of":[17,67,78,81,96,111,143,159,165,180],"intelligent":[18],"decision-making":[19,33],"complex":[21],"environments.":[24],"This":[25,72,103,168],"unique":[26],"feature":[27],"enables":[28],"RL":[29,44,68,82,97,119,149,181],"to":[30,85,107,140],"address":[31],"sequential":[32],"problems":[34],"with":[35,75,92],"simultaneous":[36],"sampling,":[37],"evaluation,":[38],"feedback.":[40],"As":[41],"result,":[43],"techniques":[45],"have":[46],"become":[47],"suitable":[48],"candidates":[49],"for":[50,155],"developing":[51],"powerful":[52],"solutions":[53],"various":[55],"domains.":[56],"In":[57,116,133],"this":[58,135],"study,":[59],"we":[60],"present":[61],"comprehensive":[63,172],"systematic":[65],"review":[66,73,104,136,169],"algorithms":[69,98],"applications.":[71],"commences":[74],"an":[76],"exploration":[77],"foundations":[80],"proceeds":[84],"examine":[86],"each":[87],"algorithm":[88],"detail,":[90],"concluding":[91],"comparative":[94],"analysis":[95],"based":[99],"on":[100,176],"several":[101],"criteria.":[102],"then":[105],"extends":[106],"two":[108,186],"key":[109],"applications":[110],"RL:":[112],"robotics":[113,117],"healthcare.":[115],"manipulation,":[118],"enhances":[120],"precision":[121],"adaptability":[123],"tasks":[125],"such":[126],"object":[128],"grasping":[129],"autonomous":[131],"learning.":[132],"healthcare,":[134],"turns":[137],"its":[138,183],"focus":[139],"realm":[142],"cell":[144,160],"growth":[145,158],"problems,":[146],"clarifying":[147],"how":[148],"provided":[151],"data-driven":[153],"approach":[154],"optimizing":[156],"cultures":[161],"development":[164],"therapeutic":[166],"solutions.":[167],"offers":[170],"overview,":[173],"shedding":[174],"light":[175],"evolving":[178],"landscape":[179],"potential":[184],"diverse":[187],"yet":[188],"interconnected":[189],"fields.":[190]},"counts_by_year":[{"year":2026,"cited_by_count":18},{"year":2025,"cited_by_count":47},{"year":2024,"cited_by_count":13}],"updated_date":"2026-05-21T09:19:25.381259","created_date":"2025-10-10T00:00:00"}
