{"id":"https://openalex.org/W4416800190","doi":"https://doi.org/10.1109/apsipaasc65261.2025.11249355","title":"Reinforcement Learning in Portfolio Management: A Survey of Methods and Trends","display_name":"Reinforcement Learning in Portfolio Management: A Survey of Methods and Trends","publication_year":2025,"publication_date":"2025-10-22","ids":{"openalex":"https://openalex.org/W4416800190","doi":"https://doi.org/10.1109/apsipaasc65261.2025.11249355"},"language":null,"primary_location":{"id":"doi:10.1109/apsipaasc65261.2025.11249355","is_oa":false,"landing_page_url":"https://doi.org/10.1109/apsipaasc65261.2025.11249355","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 Asia Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5110240317","display_name":"S.Y. Hu","orcid":null},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":true,"raw_author_name":"Silan Hu","raw_affiliation_strings":["National University of Singapore,Singapore"],"affiliations":[{"raw_affiliation_string":"National University of Singapore,Singapore","institution_ids":["https://openalex.org/I165932596"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101604725","display_name":"Yulin Huang","orcid":"https://orcid.org/0000-0002-0997-7200"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Yulin Huang","raw_affiliation_strings":["National University of Singapore,Singapore"],"affiliations":[{"raw_affiliation_string":"National University of Singapore,Singapore","institution_ids":["https://openalex.org/I165932596"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101372987","display_name":"Arjun Agarwal","orcid":null},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Arjun Agarwal","raw_affiliation_strings":["National University of Singapore,Singapore"],"affiliations":[{"raw_affiliation_string":"National University of Singapore,Singapore","institution_ids":["https://openalex.org/I165932596"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5120060722","display_name":"Tanya Warrier","orcid":"https://orcid.org/0009-0002-8888-6119"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Tanya Warrier","raw_affiliation_strings":["National University of Singapore,Singapore"],"affiliations":[{"raw_affiliation_string":"National University of Singapore,Singapore","institution_ids":["https://openalex.org/I165932596"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100708205","display_name":"Yuwen Wang","orcid":"https://orcid.org/0000-0002-7612-7935"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Wang Yuwen","raw_affiliation_strings":["National University of Singapore,Singapore"],"affiliations":[{"raw_affiliation_string":"National University of Singapore,Singapore","institution_ids":["https://openalex.org/I165932596"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101323765","display_name":"Haozhe Ma","orcid":"https://orcid.org/0009-0002-7645-0115"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Haozhe Ma","raw_affiliation_strings":["National University of Singapore,Singapore"],"affiliations":[{"raw_affiliation_string":"National University of Singapore,Singapore","institution_ids":["https://openalex.org/I165932596"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5016292956","display_name":"Zhengding Luo","orcid":"https://orcid.org/0000-0002-2694-5059"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Zhengding Luo","raw_affiliation_strings":["National University of Singapore,Singapore"],"affiliations":[{"raw_affiliation_string":"National University of Singapore,Singapore","institution_ids":["https://openalex.org/I165932596"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5110240317"],"corresponding_institution_ids":["https://openalex.org/I165932596"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.44319592,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1241","last_page":"1246"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11326","display_name":"Stock Market Forecasting Methods","score":0.7562999725341797,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11326","display_name":"Stock Market Forecasting Methods","score":0.7562999725341797,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.0674000009894371,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11413","display_name":"Risk and Portfolio Optimization","score":0.0575999990105629,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.745199978351593},{"id":"https://openalex.org/keywords/portfolio","display_name":"Portfolio","score":0.6455000042915344},{"id":"https://openalex.org/keywords/intersection","display_name":"Intersection (aeronautics)","score":0.5081999897956848},{"id":"https://openalex.org/keywords/margin","display_name":"Margin (machine learning)","score":0.4864000082015991},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.4327000081539154},{"id":"https://openalex.org/keywords/face","display_name":"Face (sociological concept)","score":0.37310001254081726}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.745199978351593},{"id":"https://openalex.org/C2780821815","wikidata":"https://www.wikidata.org/wiki/Q5340806","display_name":"Portfolio","level":2,"score":0.6455000042915344},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5415999889373779},{"id":"https://openalex.org/C64543145","wikidata":"https://www.wikidata.org/wiki/Q162942","display_name":"Intersection (aeronautics)","level":2,"score":0.5081999897956848},{"id":"https://openalex.org/C774472","wikidata":"https://www.wikidata.org/wiki/Q6760393","display_name":"Margin (machine learning)","level":2,"score":0.4864000082015991},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.4327000081539154},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.41589999198913574},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.37310001254081726},{"id":"https://openalex.org/C18762648","wikidata":"https://www.wikidata.org/wiki/Q42213","display_name":"Work (physics)","level":2,"score":0.3643999993801117},{"id":"https://openalex.org/C204036174","wikidata":"https://www.wikidata.org/wiki/Q909380","display_name":"Stock (firearms)","level":2,"score":0.3375999927520752},{"id":"https://openalex.org/C74510933","wikidata":"https://www.wikidata.org/wiki/Q1936145","display_name":"Project portfolio management","level":3,"score":0.32820001244544983},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3273000121116638},{"id":"https://openalex.org/C19244329","wikidata":"https://www.wikidata.org/wiki/Q208697","display_name":"Financial market","level":2,"score":0.27410000562667847},{"id":"https://openalex.org/C61797465","wikidata":"https://www.wikidata.org/wiki/Q1188986","display_name":"Term (time)","level":2,"score":0.2711000144481659},{"id":"https://openalex.org/C10138342","wikidata":"https://www.wikidata.org/wiki/Q43015","display_name":"Finance","level":1,"score":0.2685000002384186},{"id":"https://openalex.org/C539667460","wikidata":"https://www.wikidata.org/wiki/Q2414942","display_name":"Management science","level":1,"score":0.25859999656677246}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/apsipaasc65261.2025.11249355","is_oa":false,"landing_page_url":"https://doi.org/10.1109/apsipaasc65261.2025.11249355","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 Asia Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":17,"referenced_works":["https://openalex.org/W1977051850","https://openalex.org/W2145339207","https://openalex.org/W2233997862","https://openalex.org/W2344786740","https://openalex.org/W2965672544","https://openalex.org/W2998034590","https://openalex.org/W3035703686","https://openalex.org/W3040959470","https://openalex.org/W3087349278","https://openalex.org/W3114374801","https://openalex.org/W3163140850","https://openalex.org/W3175835345","https://openalex.org/W3203680104","https://openalex.org/W3213586249","https://openalex.org/W4389219081","https://openalex.org/W4402284121","https://openalex.org/W4404431993"],"related_works":[],"abstract_inverted_index":{"This":[0],"paper":[1],"presents":[2],"a":[3,49,72],"comprehensive":[4],"survey":[5,69],"of":[6,52,80],"reinforcement":[7],"learning":[8,37],"(RL)":[9],"algorithms":[10],"applied":[11],"to":[12,26,47],"stock":[13],"trading":[14],"and":[15,41,60,82],"portfolio":[16],"management.":[17],"We":[18],"review":[19],"the":[20,53,78],"foundational":[21],"contributions":[22],"that":[23],"introduced":[24],"RL":[25,81],"financial":[27,83],"decision-making,":[28],"as":[29,31,71],"well":[30],"more":[32],"recent":[33],"work":[34,76],"incorporating":[35],"deep":[36],"architectures,":[38],"margin":[39],"constraints,":[40],"domain-specific":[42],"heuristics.":[43],"Our":[44],"goal":[45],"is":[46],"provide":[48],"structured":[50],"overview":[51],"field's":[54],"evolution,":[55],"highlight":[56],"key":[57],"methodological":[58],"advances,":[59],"outline":[61],"areas":[62],"where":[63],"current":[64],"approaches":[65],"face":[66],"limitations.":[67],"The":[68],"serves":[70],"reference":[73],"for":[74],"future":[75],"at":[77],"intersection":[79],"systems.":[84]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-11-28T00:00:00"}
