{"id":"https://openalex.org/W4284708436","doi":"https://doi.org/10.1145/3477495.3532021","title":"MGPolicy","display_name":"MGPolicy","publication_year":2022,"publication_date":"2022-07-06","ids":{"openalex":"https://openalex.org/W4284708436","doi":"https://doi.org/10.1145/3477495.3532021"},"language":"en","primary_location":{"id":"doi:10.1145/3477495.3532021","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3477495.3532021","pdf_url":null,"source":{"id":"https://openalex.org/S4363608773","display_name":"Proceedings of the 45th International ACM SIGIR Conference on Research and Development in Information Retrieval","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 45th International ACM SIGIR Conference on Research and Development in Information Retrieval","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5010481978","display_name":"Xiangmeng Wang","orcid":"https://orcid.org/0000-0003-3643-3353"},"institutions":[{"id":"https://openalex.org/I114017466","display_name":"University of Technology Sydney","ror":"https://ror.org/03f0f6041","country_code":"AU","type":"education","lineage":["https://openalex.org/I114017466"]}],"countries":["AU"],"is_corresponding":true,"raw_author_name":"Xiangmeng Wang","raw_affiliation_strings":["University of Technology Sydney, Sydney, NSW, Australia"],"affiliations":[{"raw_affiliation_string":"University of Technology Sydney, Sydney, NSW, Australia","institution_ids":["https://openalex.org/I114017466"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100340627","display_name":"Qian Li","orcid":"https://orcid.org/0000-0002-8308-9551"},"institutions":[{"id":"https://openalex.org/I205640436","display_name":"Curtin University","ror":"https://ror.org/02n415q13","country_code":"AU","type":"education","lineage":["https://openalex.org/I205640436"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Qian Li","raw_affiliation_strings":["Curtin University, Perth, WA, Australia"],"affiliations":[{"raw_affiliation_string":"Curtin University, Perth, WA, Australia","institution_ids":["https://openalex.org/I205640436"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067132374","display_name":"Dianer Yu","orcid":"https://orcid.org/0000-0001-6376-9667"},"institutions":[{"id":"https://openalex.org/I114017466","display_name":"University of Technology Sydney","ror":"https://ror.org/03f0f6041","country_code":"AU","type":"education","lineage":["https://openalex.org/I114017466"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Dianer Yu","raw_affiliation_strings":["University of Technology Sydney, Sydney, NSW, Australia"],"affiliations":[{"raw_affiliation_string":"University of Technology Sydney, Sydney, NSW, Australia","institution_ids":["https://openalex.org/I114017466"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100398378","display_name":"Zhichao Wang","orcid":"https://orcid.org/0009-0004-8481-4497"},"institutions":[{"id":"https://openalex.org/I31746571","display_name":"UNSW Sydney","ror":"https://ror.org/03r8z3t63","country_code":"AU","type":"education","lineage":["https://openalex.org/I31746571"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Zhichao Wang","raw_affiliation_strings":["University of New South Wales, Sydney, NSW, Australia"],"affiliations":[{"raw_affiliation_string":"University of New South Wales, Sydney, NSW, Australia","institution_ids":["https://openalex.org/I31746571"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009606065","display_name":"Hongxu Chen","orcid":"https://orcid.org/0000-0001-7963-8813"},"institutions":[{"id":"https://openalex.org/I114017466","display_name":"University of Technology Sydney","ror":"https://ror.org/03f0f6041","country_code":"AU","type":"education","lineage":["https://openalex.org/I114017466"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Hongxu Chen","raw_affiliation_strings":["University of Technology Sydney, Sydney, NSW, Australia"],"affiliations":[{"raw_affiliation_string":"University of Technology Sydney, Sydney, NSW, Australia","institution_ids":["https://openalex.org/I114017466"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5051512158","display_name":"Guandong Xu","orcid":"https://orcid.org/0000-0003-4493-6663"},"institutions":[{"id":"https://openalex.org/I114017466","display_name":"University of Technology Sydney","ror":"https://ror.org/03f0f6041","country_code":"AU","type":"education","lineage":["https://openalex.org/I114017466"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Guandong Xu","raw_affiliation_strings":["University of Technology Sydney, Sydney, NSW, Australia"],"affiliations":[{"raw_affiliation_string":"University of Technology Sydney, Sydney, NSW, Australia","institution_ids":["https://openalex.org/I114017466"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5010481978"],"corresponding_institution_ids":["https://openalex.org/I114017466"],"apc_list":null,"apc_paid":null,"fwci":1.0186,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.78538283,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"1369","last_page":"1378"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.9771000146865845,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11942","display_name":"Transportation and Mobility Innovations","score":0.9620000123977661,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6869384050369263},{"id":"https://openalex.org/keywords/policy-learning","display_name":"Policy learning","score":0.6391729712486267},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6301476359367371},{"id":"https://openalex.org/keywords/logging","display_name":"Logging","score":0.4762858748435974},{"id":"https://openalex.org/keywords/propensity-score-matching","display_name":"Propensity score matching","score":0.4665500819683075},{"id":"https://openalex.org/keywords/recommender-system","display_name":"Recommender system","score":0.45972034335136414},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4107821583747864},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4102296531200409},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.10809725522994995},{"id":"https://openalex.org/keywords/forestry","display_name":"Forestry","score":0.09526881575584412},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.08275598287582397}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6869384050369263},{"id":"https://openalex.org/C2779436431","wikidata":"https://www.wikidata.org/wiki/Q30672407","display_name":"Policy learning","level":2,"score":0.6391729712486267},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6301476359367371},{"id":"https://openalex.org/C125620115","wikidata":"https://www.wikidata.org/wiki/Q845249","display_name":"Logging","level":2,"score":0.4762858748435974},{"id":"https://openalex.org/C17923572","wikidata":"https://www.wikidata.org/wiki/Q7250160","display_name":"Propensity score matching","level":2,"score":0.4665500819683075},{"id":"https://openalex.org/C557471498","wikidata":"https://www.wikidata.org/wiki/Q554950","display_name":"Recommender system","level":2,"score":0.45972034335136414},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4107821583747864},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4102296531200409},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.10809725522994995},{"id":"https://openalex.org/C97137747","wikidata":"https://www.wikidata.org/wiki/Q38112","display_name":"Forestry","level":1,"score":0.09526881575584412},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.08275598287582397},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3477495.3532021","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3477495.3532021","pdf_url":null,"source":{"id":"https://openalex.org/S4363608773","display_name":"Proceedings of the 45th International ACM SIGIR Conference on Research and Development in Information Retrieval","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 45th International ACM SIGIR Conference on Research and Development in Information Retrieval","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G6537946155","display_name":null,"funder_award_id":"DP220103717","funder_id":"https://openalex.org/F4320334704","funder_display_name":"Australian Research Council"}],"funders":[{"id":"https://openalex.org/F4320334704","display_name":"Australian Research Council","ror":"https://ror.org/05mmh0f86"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":29,"referenced_works":["https://openalex.org/W1881549354","https://openalex.org/W2146502635","https://openalex.org/W2159309155","https://openalex.org/W2354939339","https://openalex.org/W2483962956","https://openalex.org/W2743159750","https://openalex.org/W2788295351","https://openalex.org/W2884134047","https://openalex.org/W2902572901","https://openalex.org/W2911286998","https://openalex.org/W2943864248","https://openalex.org/W2966501701","https://openalex.org/W2996959725","https://openalex.org/W2997352934","https://openalex.org/W2999693458","https://openalex.org/W3012871709","https://openalex.org/W3012881846","https://openalex.org/W3020940496","https://openalex.org/W3022972087","https://openalex.org/W3034833075","https://openalex.org/W3084805822","https://openalex.org/W3093482530","https://openalex.org/W3102778384","https://openalex.org/W3200739262","https://openalex.org/W3201286590","https://openalex.org/W3205333154","https://openalex.org/W4225356279","https://openalex.org/W4233415207","https://openalex.org/W4299689471"],"related_works":["https://openalex.org/W2026576563","https://openalex.org/W3196761963","https://openalex.org/W213628847","https://openalex.org/W2036193982","https://openalex.org/W3023923059","https://openalex.org/W4232168831","https://openalex.org/W2065417422","https://openalex.org/W4253956144","https://openalex.org/W2275925001","https://openalex.org/W3018339811"],"abstract_inverted_index":{"Off-policy":[0],"learning":[1,16,25,47],"has":[2],"drawn":[3],"huge":[4],"attention":[5],"in":[6],"recommender":[7],"systems":[8],"(RS),":[9],"which":[10,54],"provides":[11],"an":[12],"opportunity":[13],"for":[14],"reinforcement":[15],"to":[17,49,57,68],"abandon":[18],"the":[19,33,37,41],"expensive":[20],"online":[21],"training.":[22],"However,":[23],"off-policy":[24,46],"from":[26],"logged":[27],"data":[28],"suffers":[29],"biases":[30],"caused":[31],"by":[32],"policy":[34,39],"shift":[35],"between":[36],"target":[38],"and":[40,65],"logging":[42],"policy.":[43],"Consequently,":[44],"most":[45],"resorts":[48],"inverse":[50],"propensity":[51],"scoring":[52],"(IPS)":[53],"however":[55],"tends":[56],"be":[58],"over-fitted":[59],"over":[60],"exposed":[61],"(or":[62],"recommended)":[63],"items":[64],"thus":[66],"fails":[67],"explore":[69],"unexposed":[70],"items.":[71]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":4},{"year":2022,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2022-07-08T00:00:00"}
