{"id":"https://openalex.org/W4410039590","doi":"https://doi.org/10.1145/3733714","title":"The Evolution of Reinforcement Learning in Quantitative Finance: A Survey","display_name":"The Evolution of Reinforcement Learning in Quantitative Finance: A Survey","publication_year":2025,"publication_date":"2025-05-02","ids":{"openalex":"https://openalex.org/W4410039590","doi":"https://doi.org/10.1145/3733714"},"language":"en","primary_location":{"id":"doi:10.1145/3733714","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3733714","pdf_url":null,"source":{"id":"https://openalex.org/S157921468","display_name":"ACM Computing Surveys","issn_l":"0360-0300","issn":["0360-0300","1557-7341"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Computing Surveys","raw_type":"journal-article"},"type":"review","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://doi.org/10.1145/3733714","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5107673095","display_name":"Nikolaos Pippas","orcid":"https://orcid.org/0009-0003-1869-8603"},"institutions":[{"id":"https://openalex.org/I24190266","display_name":"HSBC Holdings","ror":"https://ror.org/02ygdtt22","country_code":"GB","type":"other","lineage":["https://openalex.org/I24190266"]},{"id":"https://openalex.org/I39555362","display_name":"University of Warwick","ror":"https://ror.org/01a77tt86","country_code":"GB","type":"education","lineage":["https://openalex.org/I39555362"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Nikolaos Pippas","raw_affiliation_strings":["Centre for Interdisciplinary Methodologies, University of Warwick, Coventry, United Kingdom of Great Britain and Northern Ireland and Asset Management, HSBC Holdings plc, London, United Kingdom of Great Britain and Northern Ireland","Centre for Interdisciplinary Methodologies, University of Warwick, Coventry, United Kingdom of Great Britain and Northern Ireland","Asset Management, HSBC Holdings plc, London, United Kingdom of Great Britain and Northern Ireland"],"raw_orcid":"https://orcid.org/0009-0003-1869-8603","affiliations":[{"raw_affiliation_string":"Centre for Interdisciplinary Methodologies, University of Warwick, Coventry, United Kingdom of Great Britain and Northern Ireland and Asset Management, HSBC Holdings plc, London, United Kingdom of Great Britain and Northern Ireland","institution_ids":["https://openalex.org/I39555362"]},{"raw_affiliation_string":"Centre for Interdisciplinary Methodologies, University of Warwick, Coventry, United Kingdom of Great Britain and Northern Ireland","institution_ids":["https://openalex.org/I39555362"]},{"raw_affiliation_string":"Asset Management, HSBC Holdings plc, London, United Kingdom of Great Britain and Northern Ireland","institution_ids":["https://openalex.org/I24190266"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022103461","display_name":"Elliot A. Ludvig","orcid":"https://orcid.org/0000-0002-0031-6713"},"institutions":[{"id":"https://openalex.org/I39555362","display_name":"University of Warwick","ror":"https://ror.org/01a77tt86","country_code":"GB","type":"education","lineage":["https://openalex.org/I39555362"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Elliot A. Ludvig","raw_affiliation_strings":["Department of Psychology, University of Warwick, Coventry, United Kingdom of Great Britain and Northern Ireland","Department of Psychology, University of Warwick, Coventry United Kingdom of Great Britain and Northern Ireland"],"raw_orcid":"https://orcid.org/0000-0002-0031-6713","affiliations":[{"raw_affiliation_string":"Department of Psychology, University of Warwick, Coventry, United Kingdom of Great Britain and Northern Ireland","institution_ids":["https://openalex.org/I39555362"]},{"raw_affiliation_string":"Department of Psychology, University of Warwick, Coventry United Kingdom of Great Britain and Northern Ireland","institution_ids":["https://openalex.org/I39555362"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5065040154","display_name":"\u00c7a\u011fatay Turkay","orcid":"https://orcid.org/0000-0001-6788-251X"},"institutions":[{"id":"https://openalex.org/I39555362","display_name":"University of Warwick","ror":"https://ror.org/01a77tt86","country_code":"GB","type":"education","lineage":["https://openalex.org/I39555362"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Cagatay Turkay","raw_affiliation_strings":["Centre for Interdisciplinary Methodologies, University of Warwick, Coventry, United Kingdom of Great Britain and Northern Ireland","Centre for Interdisciplinary Methodologies, University of Warwick, Coventry United Kingdom of Great Britain and Northern Ireland"],"raw_orcid":"https://orcid.org/0000-0001-6788-251X","affiliations":[{"raw_affiliation_string":"Centre for Interdisciplinary Methodologies, University of Warwick, Coventry, United Kingdom of Great Britain and Northern Ireland","institution_ids":["https://openalex.org/I39555362"]},{"raw_affiliation_string":"Centre for Interdisciplinary Methodologies, University of Warwick, Coventry United Kingdom of Great Britain and Northern Ireland","institution_ids":["https://openalex.org/I39555362"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5107673095"],"corresponding_institution_ids":["https://openalex.org/I24190266","https://openalex.org/I39555362"],"apc_list":null,"apc_paid":null,"fwci":28.2433,"has_fulltext":false,"cited_by_count":16,"citation_normalized_percentile":{"value":0.99673542,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":"57","issue":"11","first_page":"1","last_page":"51"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11326","display_name":"Stock Market Forecasting Methods","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11326","display_name":"Stock Market Forecasting Methods","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11270","display_name":"Complex Systems and Time Series Analysis","score":0.994700014591217,"subfield":{"id":"https://openalex.org/subfields/2002","display_name":"Economics and Econometrics"},"field":{"id":"https://openalex.org/fields/20","display_name":"Economics, Econometrics and Finance"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11052","display_name":"Energy Load and Power Forecasting","score":0.9909999966621399,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8330634832382202},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7070851922035217},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3512304425239563},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.32914865016937256}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8330634832382202},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7070851922035217},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3512304425239563},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.32914865016937256}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3733714","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3733714","pdf_url":null,"source":{"id":"https://openalex.org/S157921468","display_name":"ACM Computing Surveys","issn_l":"0360-0300","issn":["0360-0300","1557-7341"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Computing Surveys","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1145/3733714","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3733714","pdf_url":null,"source":{"id":"https://openalex.org/S157921468","display_name":"ACM Computing Surveys","issn_l":"0360-0300","issn":["0360-0300","1557-7341"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Computing Surveys","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":247,"referenced_works":["https://openalex.org/W28412257","https://openalex.org/W32403112","https://openalex.org/W74101598","https://openalex.org/W174135753","https://openalex.org/W206679605","https://openalex.org/W314672738","https://openalex.org/W594621870","https://openalex.org/W605727707","https://openalex.org/W637153065","https://openalex.org/W1538131130","https://openalex.org/W1540476791","https://openalex.org/W1546523058","https://openalex.org/W1552362148","https://openalex.org/W1557517019","https://openalex.org/W1567584060","https://openalex.org/W1569296262","https://openalex.org/W1569368991","https://openalex.org/W1577069963","https://openalex.org/W1585575029","https://openalex.org/W1641379095","https://openalex.org/W1647779468","https://openalex.org/W1821462560","https://openalex.org/W1898724844","https://openalex.org/W1969261117","https://openalex.org/W1970887382","https://openalex.org/W1971646537","https://openalex.org/W1975675278","https://openalex.org/W1977051850","https://openalex.org/W1985291828","https://openalex.org/W1985808284","https://openalex.org/W1988021444","https://openalex.org/W1988270113","https://openalex.org/W1995778537","https://openalex.org/W1995834279","https://openalex.org/W1996342763","https://openalex.org/W1999996900","https://openalex.org/W2001770658","https://openalex.org/W2004463884","https://openalex.org/W2011418219","https://openalex.org/W2011481463","https://openalex.org/W2018964251","https://openalex.org/W2021801581","https://openalex.org/W2046376809","https://openalex.org/W2052848417","https://openalex.org/W2055061420","https://openalex.org/W2064675550","https://openalex.org/W2066176347","https://openalex.org/W2066218565","https://openalex.org/W2067530554","https://openalex.org/W2073194514","https://openalex.org/W2077791698","https://openalex.org/W2078236117","https://openalex.org/W2092348774","https://openalex.org/W2093630205","https://openalex.org/W2097969668","https://openalex.org/W2099233100","https://openalex.org/W2099618002","https://openalex.org/W2100011707","https://openalex.org/W2100677568","https://openalex.org/W2100805904","https://openalex.org/W2103359683","https://openalex.org/W2107878631","https://openalex.org/W2110603299","https://openalex.org/W2113305199","https://openalex.org/W2116347131","https://openalex.org/W2119259871","https://openalex.org/W2119717200","https://openalex.org/W2125520394","https://openalex.org/W2126311658","https://openalex.org/W2130536986","https://openalex.org/W2134658143","https://openalex.org/W2135293965","https://openalex.org/W2136848157","https://openalex.org/W2136922672","https://openalex.org/W2141559645","https://openalex.org/W2142971854","https://openalex.org/W2143152597","https://openalex.org/W2145339207","https://openalex.org/W2148654185","https://openalex.org/W2153580489","https://openalex.org/W2156060469","https://openalex.org/W2160644528","https://openalex.org/W2162288466","https://openalex.org/W2164320228","https://openalex.org/W2165698076","https://openalex.org/W2166215547","https://openalex.org/W2167917621","https://openalex.org/W2168405694","https://openalex.org/W2169015875","https://openalex.org/W2171916252","https://openalex.org/W2173248099","https://openalex.org/W2186820913","https://openalex.org/W2248982967","https://openalex.org/W2258073164","https://openalex.org/W2291973609","https://openalex.org/W2323331210","https://openalex.org/W2324302607","https://openalex.org/W2329976112","https://openalex.org/W2333102730","https://openalex.org/W2344786740","https://openalex.org/W2556781984","https://openalex.org/W2594475271","https://openalex.org/W2617116989","https://openalex.org/W2618354619","https://openalex.org/W2618530766","https://openalex.org/W2624385633","https://openalex.org/W2625101268","https://openalex.org/W2724169821","https://openalex.org/W2736601468","https://openalex.org/W2755613412","https://openalex.org/W2766736793","https://openalex.org/W2778749116","https://openalex.org/W2793864397","https://openalex.org/W2799920757","https://openalex.org/W2803013487","https://openalex.org/W2884462521","https://openalex.org/W2891295326","https://openalex.org/W2892412430","https://openalex.org/W2902907165","https://openalex.org/W2912823139","https://openalex.org/W2914584772","https://openalex.org/W2929930980","https://openalex.org/W2938326684","https://openalex.org/W2941037157","https://openalex.org/W2941095974","https://openalex.org/W2942689159","https://openalex.org/W2963477884","https://openalex.org/W2964199361","https://openalex.org/W2964674144","https://openalex.org/W2967254933","https://openalex.org/W2969799658","https://openalex.org/W2979430717","https://openalex.org/W2982316857","https://openalex.org/W2984702506","https://openalex.org/W2997497843","https://openalex.org/W3005158858","https://openalex.org/W3007681660","https://openalex.org/W3008231236","https://openalex.org/W3011631586","https://openalex.org/W3012223895","https://openalex.org/W3013773438","https://openalex.org/W3015954380","https://openalex.org/W3018556014","https://openalex.org/W3021787434","https://openalex.org/W3022746105","https://openalex.org/W3023986690","https://openalex.org/W3024896014","https://openalex.org/W3033882778","https://openalex.org/W3035020089","https://openalex.org/W3035464578","https://openalex.org/W3035574064","https://openalex.org/W3037286161","https://openalex.org/W3041133507","https://openalex.org/W3045958001","https://openalex.org/W3046559364","https://openalex.org/W3080232699","https://openalex.org/W3081043352","https://openalex.org/W3083252136","https://openalex.org/W3083887855","https://openalex.org/W3089019288","https://openalex.org/W3098465353","https://openalex.org/W3102424720","https://openalex.org/W3104444496","https://openalex.org/W3119653011","https://openalex.org/W3121277445","https://openalex.org/W3121284928","https://openalex.org/W3121285418","https://openalex.org/W3121491670","https://openalex.org/W3121583564","https://openalex.org/W3121933628","https://openalex.org/W3122116365","https://openalex.org/W3122554332","https://openalex.org/W3122563224","https://openalex.org/W3122944446","https://openalex.org/W3123064686","https://openalex.org/W3123598380","https://openalex.org/W3123639445","https://openalex.org/W3123718809","https://openalex.org/W3123979279","https://openalex.org/W3124574433","https://openalex.org/W3125033993","https://openalex.org/W3125331489","https://openalex.org/W3125353710","https://openalex.org/W3125595766","https://openalex.org/W3125681534","https://openalex.org/W3126053622","https://openalex.org/W3126252007","https://openalex.org/W3126577088","https://openalex.org/W3127047144","https://openalex.org/W3129717163","https://openalex.org/W3131308071","https://openalex.org/W3137745307","https://openalex.org/W3143493396","https://openalex.org/W3154200574","https://openalex.org/W3155979157","https://openalex.org/W3157937972","https://openalex.org/W3158302562","https://openalex.org/W3158663546","https://openalex.org/W3158701715","https://openalex.org/W3167712657","https://openalex.org/W3168987897","https://openalex.org/W3194462213","https://openalex.org/W3202263935","https://openalex.org/W3206804449","https://openalex.org/W3208869239","https://openalex.org/W3215210492","https://openalex.org/W4205608359","https://openalex.org/W4206553113","https://openalex.org/W4212774754","https://openalex.org/W4212920864","https://openalex.org/W4224210583","https://openalex.org/W4225724460","https://openalex.org/W4226092483","https://openalex.org/W4226208821","https://openalex.org/W4231057775","https://openalex.org/W4231546411","https://openalex.org/W4233420185","https://openalex.org/W4234277722","https://openalex.org/W4236670843","https://openalex.org/W4238983406","https://openalex.org/W4248510338","https://openalex.org/W4255949318","https://openalex.org/W4285011703","https://openalex.org/W4285206666","https://openalex.org/W4285264914","https://openalex.org/W4285705748","https://openalex.org/W4287206310","https://openalex.org/W4287375108","https://openalex.org/W4287658495","https://openalex.org/W4287659305","https://openalex.org/W4287829453","https://openalex.org/W4289285046","https://openalex.org/W4289552495","https://openalex.org/W4294583247","https://openalex.org/W4295150809","https://openalex.org/W4298289240","https://openalex.org/W4298857966","https://openalex.org/W4300755699","https://openalex.org/W4302423442","https://openalex.org/W4319660349","https://openalex.org/W4362722548","https://openalex.org/W4394662669","https://openalex.org/W4400057307","https://openalex.org/W6704298589","https://openalex.org/W6762015371","https://openalex.org/W6891887856","https://openalex.org/W6967215384"],"related_works":["https://openalex.org/W2961085424","https://openalex.org/W4306674287","https://openalex.org/W4387369504","https://openalex.org/W4394896187","https://openalex.org/W3170094116","https://openalex.org/W4386462264","https://openalex.org/W3107602296","https://openalex.org/W4364306694","https://openalex.org/W4312192474","https://openalex.org/W4283697347"],"abstract_inverted_index":{"Reinforcement":[0],"Learning":[1],"(RL)":[2],"has":[3],"experienced":[4],"significant":[5],"advancement":[6],"over":[7],"the":[8,85,101],"past":[9],"decade,":[10],"prompting":[11],"a":[12,63],"growing":[13],"interest":[14],"in":[15,31],"applications":[16,28],"within":[17],"finance.":[18,32],"This":[19,78],"survey":[20,79],"critically":[21],"evaluates":[22],"167":[23],"publications,":[24],"exploring":[25],"diverse":[26],"RL":[27,59,82],"and":[29,43,58,75,99,103],"frameworks":[30],"Financial":[33],"markets,":[34],"marked":[35],"by":[36],"their":[37],"complexity,":[38],"multi-agent":[39,76],"nature,":[40],"information":[41],"asymmetry,":[42],"inherent":[44],"randomness,":[45],"serve":[46],"as":[47],"an":[48],"intriguing":[49],"test-bed":[50],"for":[51,96],"RL.":[52],"Traditional":[53],"finance":[54],"offers":[55],"certain":[56],"solutions,":[57],"advances":[60],"these":[61],"with":[62],"more":[64],"dynamic":[65],"approach,":[66],"incorporating":[67],"machine":[68],"learning":[69],"methods,":[70],"including":[71],"transfer":[72],"learning,":[73],"meta-learning,":[74],"solutions.":[77],"dissects":[80],"key":[81],"components":[83],"through":[84],"lens":[86],"of":[87,105],"Quantitative":[88],"Finance.":[89],"We":[90],"uncover":[91],"emerging":[92],"themes,":[93],"propose":[94],"areas":[95],"future":[97],"research,":[98],"critique":[100],"strengths":[102],"weaknesses":[104],"existing":[106],"methods.":[107]},"counts_by_year":[{"year":2026,"cited_by_count":7},{"year":2025,"cited_by_count":9}],"updated_date":"2026-05-10T08:33:47.465468","created_date":"2025-10-10T00:00:00"}
