{"id":"https://openalex.org/W4385283510","doi":"https://doi.org/10.1109/access.2023.3298821","title":"Multi-Feature Supervised Reinforcement Learning for Stock Trading","display_name":"Multi-Feature Supervised Reinforcement Learning for Stock Trading","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W4385283510","doi":"https://doi.org/10.1109/access.2023.3298821"},"language":"en","primary_location":{"id":"doi:10.1109/access.2023.3298821","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2023.3298821","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/10005208/10195852.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://ieeexplore.ieee.org/ielx7/6287639/10005208/10195852.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5005875631","display_name":"Kui Fu","orcid":"https://orcid.org/0000-0001-9313-7820"},"institutions":[{"id":"https://openalex.org/I196699116","display_name":"Wuhan University of Technology","ror":"https://ror.org/03fe7t173","country_code":"CN","type":"education","lineage":["https://openalex.org/I196699116"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Kui Fu","raw_affiliation_strings":["School of Economics, Wuhan University of Technology, Wuhan, China"],"affiliations":[{"raw_affiliation_string":"School of Economics, Wuhan University of Technology, Wuhan, China","institution_ids":["https://openalex.org/I196699116"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114069755","display_name":"Yidong Yu","orcid":null},"institutions":[{"id":"https://openalex.org/I196699116","display_name":"Wuhan University of Technology","ror":"https://ror.org/03fe7t173","country_code":"CN","type":"education","lineage":["https://openalex.org/I196699116"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yidong Yu","raw_affiliation_strings":["School of Economics, Wuhan University of Technology, Wuhan, China"],"affiliations":[{"raw_affiliation_string":"School of Economics, Wuhan University of Technology, Wuhan, China","institution_ids":["https://openalex.org/I196699116"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100451251","display_name":"Bing Li","orcid":"https://orcid.org/0000-0002-1875-2919"},"institutions":[{"id":"https://openalex.org/I196699116","display_name":"Wuhan University of Technology","ror":"https://ror.org/03fe7t173","country_code":"CN","type":"education","lineage":["https://openalex.org/I196699116"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bing Li","raw_affiliation_strings":["School of Economics, Wuhan University of Technology, Wuhan, China"],"affiliations":[{"raw_affiliation_string":"School of Economics, Wuhan University of Technology, Wuhan, China","institution_ids":["https://openalex.org/I196699116"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5005875631"],"corresponding_institution_ids":["https://openalex.org/I196699116"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":4.6,"has_fulltext":true,"cited_by_count":18,"citation_normalized_percentile":{"value":0.94985234,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":"11","issue":null,"first_page":"77840","last_page":"77855"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11326","display_name":"Stock Market Forecasting Methods","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11326","display_name":"Stock Market Forecasting Methods","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10047","display_name":"Financial Markets and Investment Strategies","score":0.9955000281333923,"subfield":{"id":"https://openalex.org/subfields/2003","display_name":"Finance"},"field":{"id":"https://openalex.org/fields/20","display_name":"Economics, Econometrics and Finance"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11052","display_name":"Energy Load and Power Forecasting","score":0.9954000115394592,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.9292964935302734},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7215573787689209},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6481871604919434},{"id":"https://openalex.org/keywords/convergence","display_name":"Convergence (economics)","score":0.5838034152984619},{"id":"https://openalex.org/keywords/q-learning","display_name":"Q-learning","score":0.5506769418716431},{"id":"https://openalex.org/keywords/learning-classifier-system","display_name":"Learning classifier system","score":0.5351147651672363},{"id":"https://openalex.org/keywords/long-short-term-memory","display_name":"Long short term memory","score":0.5252125859260559},{"id":"https://openalex.org/keywords/profit","display_name":"Profit (economics)","score":0.48971131443977356},{"id":"https://openalex.org/keywords/trading-strategy","display_name":"Trading strategy","score":0.4836619794368744},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4696962833404541},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4531136751174927},{"id":"https://openalex.org/keywords/supervised-learning","display_name":"Supervised learning","score":0.4331985116004944},{"id":"https://openalex.org/keywords/stock-market","display_name":"Stock market","score":0.42509356141090393},{"id":"https://openalex.org/keywords/recurrent-neural-network","display_name":"Recurrent neural network","score":0.41904953122138977},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4144021272659302},{"id":"https://openalex.org/keywords/econometrics","display_name":"Econometrics","score":0.13516965508460999},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1209544837474823}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.9292964935302734},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7215573787689209},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6481871604919434},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.5838034152984619},{"id":"https://openalex.org/C188116033","wikidata":"https://www.wikidata.org/wiki/Q2664563","display_name":"Q-learning","level":3,"score":0.5506769418716431},{"id":"https://openalex.org/C199190896","wikidata":"https://www.wikidata.org/wiki/Q3509276","display_name":"Learning classifier system","level":3,"score":0.5351147651672363},{"id":"https://openalex.org/C133488467","wikidata":"https://www.wikidata.org/wiki/Q6673524","display_name":"Long short term memory","level":4,"score":0.5252125859260559},{"id":"https://openalex.org/C181622380","wikidata":"https://www.wikidata.org/wiki/Q26911","display_name":"Profit (economics)","level":2,"score":0.48971131443977356},{"id":"https://openalex.org/C131562839","wikidata":"https://www.wikidata.org/wiki/Q1574928","display_name":"Trading strategy","level":2,"score":0.4836619794368744},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4696962833404541},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4531136751174927},{"id":"https://openalex.org/C136389625","wikidata":"https://www.wikidata.org/wiki/Q334384","display_name":"Supervised learning","level":3,"score":0.4331985116004944},{"id":"https://openalex.org/C2780299701","wikidata":"https://www.wikidata.org/wiki/Q475000","display_name":"Stock market","level":3,"score":0.42509356141090393},{"id":"https://openalex.org/C147168706","wikidata":"https://www.wikidata.org/wiki/Q1457734","display_name":"Recurrent neural network","level":3,"score":0.41904953122138977},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4144021272659302},{"id":"https://openalex.org/C149782125","wikidata":"https://www.wikidata.org/wiki/Q160039","display_name":"Econometrics","level":1,"score":0.13516965508460999},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1209544837474823},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C2780762169","wikidata":"https://www.wikidata.org/wiki/Q5905368","display_name":"Horse","level":2,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C50522688","wikidata":"https://www.wikidata.org/wiki/Q189833","display_name":"Economic growth","level":1,"score":0.0},{"id":"https://openalex.org/C175444787","wikidata":"https://www.wikidata.org/wiki/Q39072","display_name":"Microeconomics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2023.3298821","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2023.3298821","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/10005208/10195852.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:457f46fbffcf4d84900a791192128506","is_oa":true,"landing_page_url":"https://doaj.org/article/457f46fbffcf4d84900a791192128506","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 11, Pp 77840-77855 (2023)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2023.3298821","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2023.3298821","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/10005208/10195852.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1231421488","display_name":null,"funder_award_id":"under","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G1880457144","display_name":null,"funder_award_id":"72004174","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2087396116","display_name":null,"funder_award_id":"China","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3317480652","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5994120800","display_name":null,"funder_award_id":"Natural","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4385283510.pdf","grobid_xml":"https://content.openalex.org/works/W4385283510.grobid-xml"},"referenced_works_count":36,"referenced_works":["https://openalex.org/W32403112","https://openalex.org/W1595982529","https://openalex.org/W1641379095","https://openalex.org/W1689711448","https://openalex.org/W2024998154","https://openalex.org/W2055208286","https://openalex.org/W2095487261","https://openalex.org/W2133641513","https://openalex.org/W2140360763","https://openalex.org/W2145339207","https://openalex.org/W2785336079","https://openalex.org/W2897733922","https://openalex.org/W2903947336","https://openalex.org/W2963864421","https://openalex.org/W2970489962","https://openalex.org/W2976581604","https://openalex.org/W3015954380","https://openalex.org/W3048630347","https://openalex.org/W3049045648","https://openalex.org/W3134206323","https://openalex.org/W3151614082","https://openalex.org/W3153842551","https://openalex.org/W3195975917","https://openalex.org/W3202007446","https://openalex.org/W4220747123","https://openalex.org/W4233840023","https://openalex.org/W4256431242","https://openalex.org/W4285178744","https://openalex.org/W4302570325","https://openalex.org/W4311923926","https://openalex.org/W4322765652","https://openalex.org/W4382175553","https://openalex.org/W6635603806","https://openalex.org/W6684205842","https://openalex.org/W6684921986","https://openalex.org/W6766807222"],"related_works":["https://openalex.org/W26063614","https://openalex.org/W3140225428","https://openalex.org/W235959167","https://openalex.org/W2610686804","https://openalex.org/W2141149254","https://openalex.org/W3148138296","https://openalex.org/W2766258251","https://openalex.org/W2313756439","https://openalex.org/W4405211738","https://openalex.org/W1987864653"],"abstract_inverted_index":{"Deep":[0],"reinforcement":[1,52,79],"learning":[2,43,53,80,100,118],"(DRL)":[3],"algorithm":[4,127,147],"is":[5,22,109],"often":[6],"used":[7],"to":[8,24,111,114],"find":[9],"the":[10,18,29,33,82,96,112,116,120,139],"best":[11],"trading":[12,159],"strategy":[13,59],"in":[14,40,78,81,137],"algorithmic":[15],"trading.":[16],"However,":[17],"classical":[19],"DRL":[20,42],"model":[21,113],"difficult":[23],"achieve":[25],"rapid":[26],"convergence,":[27],"and":[28,70,101,142,151,157],"features":[30],"extracted":[31],"from":[32],"market":[34],"data":[35],"are":[36],"relatively":[37],"simple,":[38],"resulting":[39],"incomplete":[41],"information.":[44],"In":[45,104],"this":[46],"paper,":[47],"we":[48],"propose":[49],"a":[50,55],"supervised":[51,86],"method,":[54],"hybrid":[56],"optimal":[57],"investment":[58],"formation":[60],"method":[61],"consisting":[62],"of":[63,85,98,119],"long":[64],"short-term":[65],"memory":[66],"neural":[67],"network":[68],"(LSTM)":[69],"deep":[71],"deterministic":[72],"policy":[73],"gradient":[74],"(DDPG).":[75],"By":[76],"participating":[77],"early":[83],"stage":[84],"learning,":[87],"agents":[88],"can":[89],"obtain":[90],"guiding":[91],"prior":[92],"experience,":[93],"thus":[94],"reducing":[95],"cost":[97],"agent":[99],"accelerating":[102],"convergence.":[103],"addition,":[105],"multi-feature":[106],"state":[107],"input":[108],"added":[110],"optimize":[115],"agent\u2019s":[117],"environment.":[121],"Compared":[122],"with":[123],"DDPG":[124],"algorithm,":[125],"LSTM-DDPG":[126,146],"achieves":[128],"convergence":[129],"faster.":[130],"Experiments":[131],"on":[132],"three":[133],"regional":[134],"stock":[135],"markets":[136],"China,":[138],"United":[140],"States":[141],"Europe":[143],"show":[144],"that":[145],"has":[148],"higher":[149],"profit":[150],"lower":[152],"risk":[153],"than":[154],"B&H,":[155],"MACD":[156],"LSTM":[158],"strategies.":[160]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":10},{"year":2024,"cited_by_count":6}],"updated_date":"2026-03-18T14:38:29.013473","created_date":"2025-10-10T00:00:00"}
