{"id":"https://openalex.org/W4388994331","doi":"https://doi.org/10.1145/3604237.3626906","title":"Margin Trader: A Reinforcement Learning Framework for Portfolio Management with Margin and Constraints","display_name":"Margin Trader: A Reinforcement Learning Framework for Portfolio Management with Margin and Constraints","publication_year":2023,"publication_date":"2023-11-25","ids":{"openalex":"https://openalex.org/W4388994331","doi":"https://doi.org/10.1145/3604237.3626906"},"language":"en","primary_location":{"id":"doi:10.1145/3604237.3626906","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3604237.3626906","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3604237.3626906","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"4th ACM International Conference on AI in Finance","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3604237.3626906","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5061857419","display_name":"Jingyi Gu","orcid":"https://orcid.org/0000-0001-8010-8326"},"institutions":[{"id":"https://openalex.org/I118118575","display_name":"New Jersey Institute of Technology","ror":"https://ror.org/05e74xb87","country_code":"US","type":"education","lineage":["https://openalex.org/I118118575"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jingyi Gu","raw_affiliation_strings":["New Jersey Institute of Technology, US"],"raw_orcid":"https://orcid.org/0000-0001-8010-8326","affiliations":[{"raw_affiliation_string":"New Jersey Institute of Technology, US","institution_ids":["https://openalex.org/I118118575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002969906","display_name":"Wenlu Du","orcid":"https://orcid.org/0000-0003-4925-0468"},"institutions":[{"id":"https://openalex.org/I118118575","display_name":"New Jersey Institute of Technology","ror":"https://ror.org/05e74xb87","country_code":"US","type":"education","lineage":["https://openalex.org/I118118575"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Wenlu Du","raw_affiliation_strings":["New Jersey Institute of Technology, US"],"raw_orcid":"https://orcid.org/0000-0003-4925-0468","affiliations":[{"raw_affiliation_string":"New Jersey Institute of Technology, US","institution_ids":["https://openalex.org/I118118575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005255322","display_name":"A M Muntasir Rahman","orcid":"https://orcid.org/0009-0004-8527-8948"},"institutions":[{"id":"https://openalex.org/I118118575","display_name":"New Jersey Institute of Technology","ror":"https://ror.org/05e74xb87","country_code":"US","type":"education","lineage":["https://openalex.org/I118118575"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"A M Muntasir Rahman","raw_affiliation_strings":["New Jersey Institute of Technology, US"],"raw_orcid":"https://orcid.org/0009-0004-8527-8948","affiliations":[{"raw_affiliation_string":"New Jersey Institute of Technology, US","institution_ids":["https://openalex.org/I118118575"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100744283","display_name":"Guiling Wang","orcid":"https://orcid.org/0000-0003-1880-4763"},"institutions":[{"id":"https://openalex.org/I118118575","display_name":"New Jersey Institute of Technology","ror":"https://ror.org/05e74xb87","country_code":"US","type":"education","lineage":["https://openalex.org/I118118575"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Guiling Wang","raw_affiliation_strings":["New Jersey Institute of Technology, US"],"raw_orcid":"https://orcid.org/0000-0003-1880-4763","affiliations":[{"raw_affiliation_string":"New Jersey Institute of Technology, US","institution_ids":["https://openalex.org/I118118575"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.9054,"has_fulltext":true,"cited_by_count":7,"citation_normalized_percentile":{"value":0.86883326,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"610","last_page":"618"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10047","display_name":"Financial Markets and Investment Strategies","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/2003","display_name":"Finance"},"field":{"id":"https://openalex.org/fields/20","display_name":"Economics, Econometrics and Finance"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10047","display_name":"Financial Markets and Investment Strategies","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/2003","display_name":"Finance"},"field":{"id":"https://openalex.org/fields/20","display_name":"Economics, Econometrics and Finance"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11326","display_name":"Stock Market Forecasting Methods","score":0.9970999956130981,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/margin","display_name":"Margin (machine learning)","score":0.8821280598640442},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7563376426696777},{"id":"https://openalex.org/keywords/portfolio","display_name":"Portfolio","score":0.6078354716300964},{"id":"https://openalex.org/keywords/profit-margin","display_name":"Profit margin","score":0.582733154296875},{"id":"https://openalex.org/keywords/sharpe-ratio","display_name":"Sharpe ratio","score":0.540835976600647},{"id":"https://openalex.org/keywords/profit-maximization","display_name":"Profit maximization","score":0.5238247513771057},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5001909732818604},{"id":"https://openalex.org/keywords/trading-strategy","display_name":"Trading strategy","score":0.4847090244293213},{"id":"https://openalex.org/keywords/gross-margin","display_name":"Gross margin","score":0.440062940120697},{"id":"https://openalex.org/keywords/profitability-index","display_name":"Profitability index","score":0.3549128770828247},{"id":"https://openalex.org/keywords/profit","display_name":"Profit (economics)","score":0.32668036222457886},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.29028528928756714},{"id":"https://openalex.org/keywords/economics","display_name":"Economics","score":0.25746721029281616},{"id":"https://openalex.org/keywords/microeconomics","display_name":"Microeconomics","score":0.2476518154144287},{"id":"https://openalex.org/keywords/econometrics","display_name":"Econometrics","score":0.2393898069858551},{"id":"https://openalex.org/keywords/finance","display_name":"Finance","score":0.21659904718399048},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.2139447033405304}],"concepts":[{"id":"https://openalex.org/C774472","wikidata":"https://www.wikidata.org/wiki/Q6760393","display_name":"Margin (machine learning)","level":2,"score":0.8821280598640442},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7563376426696777},{"id":"https://openalex.org/C2780821815","wikidata":"https://www.wikidata.org/wiki/Q5340806","display_name":"Portfolio","level":2,"score":0.6078354716300964},{"id":"https://openalex.org/C189560676","wikidata":"https://www.wikidata.org/wiki/Q1187906","display_name":"Profit margin","level":2,"score":0.582733154296875},{"id":"https://openalex.org/C139938925","wikidata":"https://www.wikidata.org/wiki/Q1501898","display_name":"Sharpe ratio","level":3,"score":0.540835976600647},{"id":"https://openalex.org/C2777780509","wikidata":"https://www.wikidata.org/wiki/Q1377422","display_name":"Profit maximization","level":3,"score":0.5238247513771057},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5001909732818604},{"id":"https://openalex.org/C131562839","wikidata":"https://www.wikidata.org/wiki/Q1574928","display_name":"Trading strategy","level":2,"score":0.4847090244293213},{"id":"https://openalex.org/C15430695","wikidata":"https://www.wikidata.org/wiki/Q11157999","display_name":"Gross margin","level":3,"score":0.440062940120697},{"id":"https://openalex.org/C129361004","wikidata":"https://www.wikidata.org/wiki/Q2470236","display_name":"Profitability index","level":2,"score":0.3549128770828247},{"id":"https://openalex.org/C181622380","wikidata":"https://www.wikidata.org/wiki/Q26911","display_name":"Profit (economics)","level":2,"score":0.32668036222457886},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.29028528928756714},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.25746721029281616},{"id":"https://openalex.org/C175444787","wikidata":"https://www.wikidata.org/wiki/Q39072","display_name":"Microeconomics","level":1,"score":0.2476518154144287},{"id":"https://openalex.org/C149782125","wikidata":"https://www.wikidata.org/wiki/Q160039","display_name":"Econometrics","level":1,"score":0.2393898069858551},{"id":"https://openalex.org/C10138342","wikidata":"https://www.wikidata.org/wiki/Q43015","display_name":"Finance","level":1,"score":0.21659904718399048},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2139447033405304}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3604237.3626906","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3604237.3626906","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3604237.3626906","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"4th ACM International Conference on AI in Finance","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3604237.3626906","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3604237.3626906","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3604237.3626906","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"4th ACM International Conference on AI in Finance","raw_type":"proceedings-article"},"sustainable_development_goals":[{"score":0.5600000023841858,"display_name":"Partnerships for the goals","id":"https://metadata.un.org/sdg/17"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4388994331.pdf","grobid_xml":"https://content.openalex.org/works/W4388994331.grobid-xml"},"referenced_works_count":27,"referenced_works":["https://openalex.org/W2121863487","https://openalex.org/W2891295326","https://openalex.org/W2965672544","https://openalex.org/W2997874851","https://openalex.org/W2998034590","https://openalex.org/W3010151722","https://openalex.org/W3011631586","https://openalex.org/W3035414307","https://openalex.org/W3070092463","https://openalex.org/W3114374801","https://openalex.org/W3126066737","https://openalex.org/W3166964686","https://openalex.org/W3175835345","https://openalex.org/W3202263935","https://openalex.org/W3203680104","https://openalex.org/W3212614390","https://openalex.org/W3213586249","https://openalex.org/W3216772467","https://openalex.org/W4283804236","https://openalex.org/W4285600170","https://openalex.org/W4289285046","https://openalex.org/W4302307947","https://openalex.org/W4306317483","https://openalex.org/W4308613547","https://openalex.org/W4312443712","https://openalex.org/W4362722548","https://openalex.org/W4387188031"],"related_works":["https://openalex.org/W2477252478","https://openalex.org/W3132764979","https://openalex.org/W3095472613","https://openalex.org/W3130903212","https://openalex.org/W4283691037","https://openalex.org/W3215054537","https://openalex.org/W4229053708","https://openalex.org/W1844669668","https://openalex.org/W2018042870","https://openalex.org/W2158112318"],"abstract_inverted_index":{"In":[0],"the":[1,18,48,67,99,104,120,170],"field":[2],"of":[3,23],"portfolio":[4],"management":[5,97],"using":[6],"reinforcement":[7,59],"learning,":[8],"existing":[9],"approaches":[10],"have":[11],"mainly":[12],"focused":[13],"on":[14],"cash-only":[15],"trading,":[16],"overlooking":[17],"potential":[19],"benefits":[20],"and":[21,29,57,75,85,95,103,117,132,142,156,162],"risks":[22,158],"margin":[24,27,64,73,130],"trading.":[25],"Incorporating":[26],"accounts":[28,74],"their":[30],"constraints,":[31],"especially":[32],"in":[33,66,159],"short":[34,86],"sale":[35],"scenarios,":[36],"is":[37],"crucial":[38],"yet":[39],"often":[40],"neglected.":[41],"To":[42],"address":[43],"this":[44],"gap,":[45],"we":[46],"make":[47],"first":[49],"attempt":[50],"to":[51,91,122,135],"propose":[52],"Margin":[53,70,100,108,149],"Trader,":[54],"an":[55],"innovative":[56],"adaptive":[58],"learning":[60],"framework":[61,89],"designed":[62],"for":[63,82],"trading":[65,80,154],"stock":[68],"market.":[69],"Trader":[71,109,150],"integrates":[72],"constraints":[76],"into":[77],"a":[78],"realistic":[79],"environment":[81],"both":[83,160],"long":[84],"positions.":[87],"The":[88],"aims":[90],"balance":[92],"profit":[93],"maximization":[94],"risk":[96,143],"through":[98],"Adjustment":[101],"Module":[102],"Maintenance":[105],"Detection":[106],"Module.":[107],"supports":[110],"various":[111],"Deep":[112],"Reinforcement":[113],"Learning":[114],"(DRL)":[115],"algorithms":[116],"offers":[118],"traders":[119],"flexibility":[121],"customize":[123],"critical":[124],"settings,":[125],"such":[126],"as":[127],"equity":[128],"allocation,":[129],"ratios,":[131],"maintenance":[133],"requirements,":[134],"suit":[136],"diverse":[137],"market":[138],"conditions,":[139],"individual":[140],"preferences,":[141],"tolerance.":[144],"Experimental":[145],"results":[146],"demonstrate":[147],"that":[148],"effectively":[151],"learns":[152],"profitable":[153],"strategies":[155],"hedges":[157],"bullish":[161],"bearish":[163],"markets,":[164],"outperforming":[165],"other":[166],"baseline":[167],"models":[168],"with":[169],"highest":[171],"Sharpe":[172],"ratio.":[173]},"counts_by_year":[{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":3}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
