{"id":"https://openalex.org/W4206427807","doi":"https://doi.org/10.1109/bigdata52589.2021.9671687","title":"Deep Reinforcement Learning based Recommender System with State Representation","display_name":"Deep Reinforcement Learning based Recommender System with State Representation","publication_year":2021,"publication_date":"2021-12-15","ids":{"openalex":"https://openalex.org/W4206427807","doi":"https://doi.org/10.1109/bigdata52589.2021.9671687"},"language":"en","primary_location":{"id":"doi:10.1109/bigdata52589.2021.9671687","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata52589.2021.9671687","pdf_url":null,"source":{"id":"https://openalex.org/S4363607718","display_name":"2021 IEEE International Conference on Big Data (Big Data)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5001339397","display_name":"Peng Jiang","orcid":"https://orcid.org/0000-0002-9266-0780"},"institutions":[{"id":"https://openalex.org/I4210132079","display_name":"Hangzhou Wanxiang Polytechnic","ror":"https://ror.org/03sxnxp24","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210132079"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Peng Jiang","raw_affiliation_strings":["Polytechnic Institute, ZheJiang University, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Polytechnic Institute, ZheJiang University, Hangzhou, China","institution_ids":["https://openalex.org/I4210132079"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061947114","display_name":"Jiafeng Ma","orcid":null},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiafeng Ma","raw_affiliation_strings":["Colledge of Control Science and Engineering, ZheJiang University, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Colledge of Control Science and Engineering, ZheJiang University, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100427567","display_name":"Jianming Zhang","orcid":"https://orcid.org/0000-0002-5632-7315"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jianming Zhang","raw_affiliation_strings":["Colledge of Control Science and Engineering, ZheJiang University, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Colledge of Control Science and Engineering, ZheJiang University, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5001339397"],"corresponding_institution_ids":["https://openalex.org/I4210132079"],"apc_list":null,"apc_paid":null,"fwci":0.8509,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.73486706,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"5703","last_page":"5707"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9916999936103821,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.9860000014305115,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.9065001010894775},{"id":"https://openalex.org/keywords/recommender-system","display_name":"Recommender system","score":0.8891869187355042},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8440985679626465},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6160686612129211},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.5791510343551636},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5677449703216553},{"id":"https://openalex.org/keywords/baseline","display_name":"Baseline (sea)","score":0.5582752227783203},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.5251410007476807},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5124998092651367},{"id":"https://openalex.org/keywords/outcome","display_name":"Outcome (game theory)","score":0.5004308223724365},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4915843904018402},{"id":"https://openalex.org/keywords/competition","display_name":"Competition (biology)","score":0.4885061979293823},{"id":"https://openalex.org/keywords/commodity","display_name":"Commodity","score":0.48059698939323425},{"id":"https://openalex.org/keywords/state","display_name":"State (computer science)","score":0.46033912897109985},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.42258235812187195},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.4174412488937378},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.0658600926399231}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.9065001010894775},{"id":"https://openalex.org/C557471498","wikidata":"https://www.wikidata.org/wiki/Q554950","display_name":"Recommender system","level":2,"score":0.8891869187355042},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8440985679626465},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6160686612129211},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.5791510343551636},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5677449703216553},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.5582752227783203},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.5251410007476807},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5124998092651367},{"id":"https://openalex.org/C148220186","wikidata":"https://www.wikidata.org/wiki/Q7111912","display_name":"Outcome (game theory)","level":2,"score":0.5004308223724365},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4915843904018402},{"id":"https://openalex.org/C91306197","wikidata":"https://www.wikidata.org/wiki/Q45767","display_name":"Competition (biology)","level":2,"score":0.4885061979293823},{"id":"https://openalex.org/C2779439359","wikidata":"https://www.wikidata.org/wiki/Q317088","display_name":"Commodity","level":2,"score":0.48059698939323425},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.46033912897109985},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.42258235812187195},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.4174412488937378},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0658600926399231},{"id":"https://openalex.org/C127313418","wikidata":"https://www.wikidata.org/wiki/Q1069","display_name":"Geology","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C18903297","wikidata":"https://www.wikidata.org/wiki/Q7150","display_name":"Ecology","level":1,"score":0.0},{"id":"https://openalex.org/C111368507","wikidata":"https://www.wikidata.org/wiki/Q43518","display_name":"Oceanography","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C144237770","wikidata":"https://www.wikidata.org/wiki/Q747534","display_name":"Mathematical economics","level":1,"score":0.0},{"id":"https://openalex.org/C34447519","wikidata":"https://www.wikidata.org/wiki/Q179522","display_name":"Market economy","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bigdata52589.2021.9671687","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata52589.2021.9671687","pdf_url":null,"source":{"id":"https://openalex.org/S4363607718","display_name":"2021 IEEE International Conference on Big Data (Big Data)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.4300000071525574,"id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":20,"referenced_works":["https://openalex.org/W1975767384","https://openalex.org/W2012516036","https://openalex.org/W2056089161","https://openalex.org/W2119717200","https://openalex.org/W2135263912","https://openalex.org/W2746553466","https://openalex.org/W2787933113","https://openalex.org/W2799544270","https://openalex.org/W2809162153","https://openalex.org/W2898273872","https://openalex.org/W2902572901","https://openalex.org/W2999560001","https://openalex.org/W3102899483","https://openalex.org/W3195172987","https://openalex.org/W4294990489","https://openalex.org/W4301178047","https://openalex.org/W6653708959","https://openalex.org/W6685276911","https://openalex.org/W6746030470","https://openalex.org/W6755373136"],"related_works":["https://openalex.org/W2383111961","https://openalex.org/W2365952365","https://openalex.org/W2352448290","https://openalex.org/W4390273403","https://openalex.org/W2380820513","https://openalex.org/W4386781444","https://openalex.org/W2913146933","https://openalex.org/W2372385138","https://openalex.org/W4296359239","https://openalex.org/W2101155126"],"abstract_inverted_index":{"With":[0],"the":[1,9,26,37,49,62,97,105,110,119],"scale":[2],"of":[3,11,42,64,114],"E-commerce":[4],"increasing":[5,16],"year":[6],"by":[7,100],"year,":[8],"importance":[10],"recommender":[12,80],"systems":[13],"is":[14],"getting":[15],"attention.":[17],"Based":[18],"on":[19,83,96],"deep":[20,88],"reinforcement":[21,89],"learning,":[22,90],"we":[23,77],"can":[24,47,71],"model":[25],"recommendation":[27,50],"task":[28],"as":[29],"an":[30],"interactional":[31],"and":[32,39,69,93,104],"sequential":[33],"decision":[34],"procedure":[35],"between":[36,67],"system":[38,70,81],"users,":[40],"instead":[41],"a":[43,53,58,79],"static":[44],"process.":[45],"It":[46],"improve":[48],"quality":[51,63],"to":[52],"large":[54],"extent.":[55],"By":[56],"integrating":[57],"state":[59,85],"representation":[60,86],"module,":[61],"modeling":[65],"interaction":[66],"users":[68],"be":[72],"improved.":[73],"In":[74],"this":[75],"article,":[76],"propose":[78],"based":[82],"user-commodity":[84],"integrated":[87],"named":[91],"UCSRDRL,":[92],"conduct":[94],"experiments":[95],"datasets":[98],"offered":[99],"FUXI":[101],"AI":[102],"Lab":[103],"outcome":[106],"performs":[107],"better":[108],"than":[109],"baseline.":[111],"The":[112],"score":[113],"UCSRDRL":[115],"ranked":[116],"third":[117],"in":[118],"competition.":[120]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
