{"id":"https://openalex.org/W4396702006","doi":"https://doi.org/10.1145/3647782.3647801","title":"A General Framework on Enhancing Portfolio Management with Reinforcement Learning","display_name":"A General Framework on Enhancing Portfolio Management with Reinforcement Learning","publication_year":2024,"publication_date":"2024-01-12","ids":{"openalex":"https://openalex.org/W4396702006","doi":"https://doi.org/10.1145/3647782.3647801"},"language":"en","primary_location":{"id":"doi:10.1145/3647782.3647801","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3647782.3647801","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2024 7th International Conference on Computers in Management and Business","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5082841573","display_name":"Yinheng Li","orcid":"https://orcid.org/0000-0002-7740-2484"},"institutions":[{"id":"https://openalex.org/I78577930","display_name":"Columbia University","ror":"https://ror.org/00hj8s172","country_code":"US","type":"education","lineage":["https://openalex.org/I78577930"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yinheng Li","raw_affiliation_strings":["Columbia University, USA"],"raw_orcid":"https://orcid.org/0000-0002-7740-2484","affiliations":[{"raw_affiliation_string":"Columbia University, USA","institution_ids":["https://openalex.org/I78577930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052103988","display_name":"Junhao Wang","orcid":"https://orcid.org/0000-0002-3049-6698"},"institutions":[{"id":"https://openalex.org/I78577930","display_name":"Columbia University","ror":"https://ror.org/00hj8s172","country_code":"US","type":"education","lineage":["https://openalex.org/I78577930"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Junhao Wang","raw_affiliation_strings":["Columbia University, USA"],"raw_orcid":"https://orcid.org/0000-0002-3049-6698","affiliations":[{"raw_affiliation_string":"Columbia University, USA","institution_ids":["https://openalex.org/I78577930"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5044105923","display_name":"Yijie Cao","orcid":"https://orcid.org/0009-0001-9879-7876"},"institutions":[{"id":"https://openalex.org/I78577930","display_name":"Columbia University","ror":"https://ror.org/00hj8s172","country_code":"US","type":"education","lineage":["https://openalex.org/I78577930"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yijie Cao","raw_affiliation_strings":["Columbia University, USA"],"raw_orcid":"https://orcid.org/0009-0001-9879-7876","affiliations":[{"raw_affiliation_string":"Columbia University, USA","institution_ids":["https://openalex.org/I78577930"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I78577930"],"apc_list":null,"apc_paid":null,"fwci":0.5972,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.71419756,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"119","last_page":"125"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11182","display_name":"Auction Theory and Applications","score":0.9782999753952026,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11413","display_name":"Risk and Portfolio Optimization","score":0.9782000184059143,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.9025554656982422},{"id":"https://openalex.org/keywords/portfolio","display_name":"Portfolio","score":0.7475293874740601},{"id":"https://openalex.org/keywords/asset-management","display_name":"Asset management","score":0.656039834022522},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6406872272491455},{"id":"https://openalex.org/keywords/project-portfolio-management","display_name":"Project portfolio management","score":0.6331668496131897},{"id":"https://openalex.org/keywords/asset","display_name":"Asset (computer security)","score":0.6028150916099548},{"id":"https://openalex.org/keywords/database-transaction","display_name":"Database transaction","score":0.555275559425354},{"id":"https://openalex.org/keywords/transaction-cost","display_name":"Transaction cost","score":0.5428770184516907},{"id":"https://openalex.org/keywords/limiting","display_name":"Limiting","score":0.515436053276062},{"id":"https://openalex.org/keywords/portfolio-optimization","display_name":"Portfolio optimization","score":0.480269193649292},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.43033367395401},{"id":"https://openalex.org/keywords/application-portfolio-management","display_name":"Application portfolio management","score":0.42908450961112976},{"id":"https://openalex.org/keywords/risk-analysis","display_name":"Risk analysis (engineering)","score":0.3834248483181},{"id":"https://openalex.org/keywords/finance","display_name":"Finance","score":0.2755753993988037},{"id":"https://openalex.org/keywords/business","display_name":"Business","score":0.2179792821407318},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.19064077734947205},{"id":"https://openalex.org/keywords/economics","display_name":"Economics","score":0.18292143940925598},{"id":"https://openalex.org/keywords/project-management","display_name":"Project management","score":0.12207388877868652},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.10504597425460815},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.10040444135665894},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.08595967292785645}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.9025554656982422},{"id":"https://openalex.org/C2780821815","wikidata":"https://www.wikidata.org/wiki/Q5340806","display_name":"Portfolio","level":2,"score":0.7475293874740601},{"id":"https://openalex.org/C2776517139","wikidata":"https://www.wikidata.org/wiki/Q873442","display_name":"Asset management","level":2,"score":0.656039834022522},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6406872272491455},{"id":"https://openalex.org/C74510933","wikidata":"https://www.wikidata.org/wiki/Q1936145","display_name":"Project portfolio management","level":3,"score":0.6331668496131897},{"id":"https://openalex.org/C76178495","wikidata":"https://www.wikidata.org/wiki/Q4808784","display_name":"Asset (computer security)","level":2,"score":0.6028150916099548},{"id":"https://openalex.org/C75949130","wikidata":"https://www.wikidata.org/wiki/Q848010","display_name":"Database transaction","level":2,"score":0.555275559425354},{"id":"https://openalex.org/C98965940","wikidata":"https://www.wikidata.org/wiki/Q877496","display_name":"Transaction cost","level":2,"score":0.5428770184516907},{"id":"https://openalex.org/C188198153","wikidata":"https://www.wikidata.org/wiki/Q1613840","display_name":"Limiting","level":2,"score":0.515436053276062},{"id":"https://openalex.org/C202655437","wikidata":"https://www.wikidata.org/wiki/Q7231728","display_name":"Portfolio optimization","level":3,"score":0.480269193649292},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.43033367395401},{"id":"https://openalex.org/C73938075","wikidata":"https://www.wikidata.org/wiki/Q2858767","display_name":"Application portfolio management","level":4,"score":0.42908450961112976},{"id":"https://openalex.org/C112930515","wikidata":"https://www.wikidata.org/wiki/Q4389547","display_name":"Risk analysis (engineering)","level":1,"score":0.3834248483181},{"id":"https://openalex.org/C10138342","wikidata":"https://www.wikidata.org/wiki/Q43015","display_name":"Finance","level":1,"score":0.2755753993988037},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.2179792821407318},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.19064077734947205},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.18292143940925598},{"id":"https://openalex.org/C15952604","wikidata":"https://www.wikidata.org/wiki/Q179012","display_name":"Project management","level":2,"score":0.12207388877868652},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.10504597425460815},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.10040444135665894},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.08595967292785645},{"id":"https://openalex.org/C78519656","wikidata":"https://www.wikidata.org/wiki/Q101333","display_name":"Mechanical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3647782.3647801","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3647782.3647801","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2024 7th International Conference on Computers in Management and Business","raw_type":"proceedings-article"},{"id":"pmh:oai:RePEc:arx:papers:1911.11880","is_oa":false,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4306401271","display_name":"RePEc: Research Papers in Economics","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I77793887","host_organization_name":"Federal Reserve Bank of St. Louis","host_organization_lineage":["https://openalex.org/I77793887"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"preprint"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":13,"referenced_works":["https://openalex.org/W1498507866","https://openalex.org/W1586419841","https://openalex.org/W2015856032","https://openalex.org/W2153580489","https://openalex.org/W2313727555","https://openalex.org/W2344786740","https://openalex.org/W2499607623","https://openalex.org/W2596367596","https://openalex.org/W2736601468","https://openalex.org/W3121933628","https://openalex.org/W3123710514","https://openalex.org/W4287869621","https://openalex.org/W4300311901"],"related_works":["https://openalex.org/W2391063200","https://openalex.org/W4290722873","https://openalex.org/W2949815404","https://openalex.org/W2599993184","https://openalex.org/W4242815394","https://openalex.org/W2895421876","https://openalex.org/W876197708","https://openalex.org/W2005279158","https://openalex.org/W4313152572","https://openalex.org/W376065488"],"abstract_inverted_index":{"Portfolio":[0],"management":[1,97,158],"is":[2],"the":[3,22,50,113],"art":[4],"and":[5,15,64,105,129,133,160],"science":[6],"in":[7,36,59,137,155,165],"fiance":[8],"that":[9,98],"concerns":[10],"continuous":[11,100],"reallocation":[12,52],"of":[13,115],"funds":[14],"assets":[16],"across":[17],"financial":[18,46,166],"instruments":[19],"to":[20,25,48,61,147],"meet":[21],"desired":[23],"returns":[24],"risk":[26],"profile.":[27],"Deep":[28],"reinforcement":[29],"learning":[30],"(RL)":[31],"has":[32],"gained":[33],"increasing":[34],"interest":[35],"portfolio":[37,65],"management,":[38,66],"where":[39],"RL":[40,63,93,118,153],"agents":[41],"are":[42,56],"trained":[43],"base":[44],"on":[45],"data":[47],"optimize":[49],"asset":[51,96,101,157],"process.":[53],"Though":[54],"there":[55],"prior":[57],"efforts":[58],"trying":[60],"combine":[62],"previous":[67],"works":[68],"did":[69],"not":[70],"consider":[71],"practical":[72],"aspects":[73],"such":[74],"as":[75],"transaction":[76,142],"costs":[77],"or":[78],"short":[79,103],"selling":[80,104],"restrictions,":[81],"limiting":[82],"their":[83,135],"applicability.":[84],"To":[85],"address":[86],"these":[87],"limitations,":[88],"we":[89],"propose":[90],"a":[91,138],"general":[92],"framework":[94],"for":[95,151],"enables":[99],"weights,":[102],"making":[106],"decisions":[107],"with":[108,122,141],"relevant":[109],"features.":[110],"We":[111],"compare":[112],"performance":[114],"three":[116],"different":[117],"algorithms:":[119],"Policy":[120,126],"Gradient":[121],"Actor-Critic":[123],"(PGAC),":[124],"Proximal":[125],"Optimization":[127],"(PPO),":[128],"Evolution":[130],"Strategies":[131],"(ES)":[132],"demonstrate":[134],"advantages":[136],"simulated":[139],"environment":[140],"costs.":[143],"Our":[144],"work":[145],"aims":[146],"provide":[148],"more":[149],"options":[150],"utilizing":[152],"frameworks":[154],"real-life":[156],"scenarios":[159],"can":[161],"benefit":[162],"further":[163],"research":[164],"applications.":[167]},"counts_by_year":[{"year":2025,"cited_by_count":2}],"updated_date":"2026-06-26T08:34:08.712188","created_date":"2025-10-10T00:00:00"}
