{"id":"https://openalex.org/W2890951405","doi":"https://doi.org/10.1609/aaai.v33i01.33014634","title":"Efficient Counterfactual Learning from Bandit Feedback","display_name":"Efficient Counterfactual Learning from Bandit Feedback","publication_year":2019,"publication_date":"2019-07-17","ids":{"openalex":"https://openalex.org/W2890951405","doi":"https://doi.org/10.1609/aaai.v33i01.33014634","mag":"2890951405"},"language":"en","primary_location":{"id":"doi:10.1609/aaai.v33i01.33014634","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v33i01.33014634","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/4388/4266","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://ojs.aaai.org/index.php/AAAI/article/download/4388/4266","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102762244","display_name":"Yusuke Narita","orcid":"https://orcid.org/0000-0003-0314-3384"},"institutions":[{"id":"https://openalex.org/I32971472","display_name":"Yale University","ror":"https://ror.org/03v76x132","country_code":"US","type":"education","lineage":["https://openalex.org/I32971472"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Yusuke Narita","raw_affiliation_strings":["Yale University"],"affiliations":[{"raw_affiliation_string":"Yale University","institution_ids":["https://openalex.org/I32971472"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033866977","display_name":"Shota Yasui","orcid":null},"institutions":[{"id":"https://openalex.org/I4210089607","display_name":"CyberAgent (Japan)","ror":"https://ror.org/0060jg679","country_code":"JP","type":"company","lineage":["https://openalex.org/I4210089607"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Shota Yasui","raw_affiliation_strings":["Cyberagent"],"affiliations":[{"raw_affiliation_string":"Cyberagent","institution_ids":["https://openalex.org/I4210089607"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5028705026","display_name":"Kohei Yata","orcid":null},"institutions":[{"id":"https://openalex.org/I32971472","display_name":"Yale University","ror":"https://ror.org/03v76x132","country_code":"US","type":"education","lineage":["https://openalex.org/I32971472"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Kohei Yata","raw_affiliation_strings":["Yale University"],"affiliations":[{"raw_affiliation_string":"Yale University","institution_ids":["https://openalex.org/I32971472"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5102762244"],"corresponding_institution_ids":["https://openalex.org/I32971472"],"apc_list":null,"apc_paid":null,"fwci":7.8557,"has_fulltext":true,"cited_by_count":24,"citation_normalized_percentile":{"value":0.98042553,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":"33","issue":"01","first_page":"4634","last_page":"4641"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10603","display_name":"Smart Grid Energy Management","score":0.98580002784729,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9751999974250793,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/counterfactual-thinking","display_name":"Counterfactual thinking","score":0.9314343929290771},{"id":"https://openalex.org/keywords/estimator","display_name":"Estimator","score":0.9051192998886108},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.7965857982635498},{"id":"https://openalex.org/keywords/variance","display_name":"Variance (accounting)","score":0.6376193165779114},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.574158787727356},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.5304459929466248},{"id":"https://openalex.org/keywords/variance-reduction","display_name":"Variance reduction","score":0.5296632647514343},{"id":"https://openalex.org/keywords/econometrics","display_name":"Econometrics","score":0.4137246608734131},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.3465186357498169},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.30820000171661377},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.2910842001438141},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.28671836853027344},{"id":"https://openalex.org/keywords/economics","display_name":"Economics","score":0.20625987648963928},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.0698007345199585},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.06198641657829285}],"concepts":[{"id":"https://openalex.org/C108650721","wikidata":"https://www.wikidata.org/wiki/Q1783253","display_name":"Counterfactual thinking","level":2,"score":0.9314343929290771},{"id":"https://openalex.org/C185429906","wikidata":"https://www.wikidata.org/wiki/Q1130160","display_name":"Estimator","level":2,"score":0.9051192998886108},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.7965857982635498},{"id":"https://openalex.org/C196083921","wikidata":"https://www.wikidata.org/wiki/Q7915758","display_name":"Variance (accounting)","level":2,"score":0.6376193165779114},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.574158787727356},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.5304459929466248},{"id":"https://openalex.org/C62644790","wikidata":"https://www.wikidata.org/wiki/Q3454689","display_name":"Variance reduction","level":3,"score":0.5296632647514343},{"id":"https://openalex.org/C149782125","wikidata":"https://www.wikidata.org/wiki/Q160039","display_name":"Econometrics","level":1,"score":0.4137246608734131},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.3465186357498169},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.30820000171661377},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2910842001438141},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.28671836853027344},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.20625987648963928},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0698007345199585},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.06198641657829285},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C121955636","wikidata":"https://www.wikidata.org/wiki/Q4116214","display_name":"Accounting","level":1,"score":0.0},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1609/aaai.v33i01.33014634","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v33i01.33014634","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/4388/4266","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1609/aaai.v33i01.33014634","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v33i01.33014634","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/4388/4266","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.4399999976158142,"id":"https://metadata.un.org/sdg/8","display_name":"Decent work and economic growth"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320335125","display_name":"RIKEN","ror":"https://ror.org/01sjwvz98"},{"id":"https://openalex.org/F4320337253","display_name":"Instituto de Ciencias del Mar y Limnolog\u00eda, Universidad Nacional Aut\u00f3noma de M\u00e9xico","ror":null}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2890951405.pdf","grobid_xml":"https://content.openalex.org/works/W2890951405.grobid-xml"},"referenced_works_count":47,"referenced_works":["https://openalex.org/W191658262","https://openalex.org/W340056678","https://openalex.org/W1520595697","https://openalex.org/W1581503202","https://openalex.org/W1835900096","https://openalex.org/W1963509555","https://openalex.org/W1968694834","https://openalex.org/W1998427280","https://openalex.org/W1998833647","https://openalex.org/W2001947543","https://openalex.org/W2012455789","https://openalex.org/W2112420033","https://openalex.org/W2113065326","https://openalex.org/W2119711634","https://openalex.org/W2122124659","https://openalex.org/W2138909795","https://openalex.org/W2139345360","https://openalex.org/W2150291618","https://openalex.org/W2163150561","https://openalex.org/W2165959378","https://openalex.org/W2186512312","https://openalex.org/W2188353343","https://openalex.org/W2208550830","https://openalex.org/W2273088453","https://openalex.org/W2295739661","https://openalex.org/W2340679559","https://openalex.org/W2406454855","https://openalex.org/W2411690432","https://openalex.org/W2560740065","https://openalex.org/W2768362151","https://openalex.org/W2963323139","https://openalex.org/W2963674921","https://openalex.org/W3098679278","https://openalex.org/W3104349857","https://openalex.org/W3121902842","https://openalex.org/W3122193054","https://openalex.org/W4233216783","https://openalex.org/W4233471163","https://openalex.org/W4293653493","https://openalex.org/W4298101950","https://openalex.org/W4299939605","https://openalex.org/W6607764300","https://openalex.org/W6631330672","https://openalex.org/W6677102192","https://openalex.org/W6694250863","https://openalex.org/W6697546013","https://openalex.org/W7056075746"],"related_works":["https://openalex.org/W4225573578","https://openalex.org/W3122602933","https://openalex.org/W2380964641","https://openalex.org/W2950038056","https://openalex.org/W1544940847","https://openalex.org/W2169816622","https://openalex.org/W2289285490","https://openalex.org/W3031816500","https://openalex.org/W2298254442","https://openalex.org/W2169367269"],"abstract_inverted_index":{"What":[0],"is":[1],"the":[2,30,74,84],"most":[3],"statistically":[4],"efficient":[5],"way":[6],"to":[7,41,55,63,81,93],"do":[8],"off-policy":[9],"optimization":[10],"with":[11,73,88],"batch":[12],"data":[13,19],"from":[14,33],"bandit":[15,23,86],"feedback?":[16],"For":[17],"log":[18],"generated":[20],"by":[21,67],"contextual":[22],"algorithms,":[24],"we":[25],"consider":[26],"offline":[27],"estimators":[28,38,62,78],"for":[29],"expected":[31],"reward":[32],"a":[34,46,68,94],"counterfactual":[35],"policy.":[36],"Our":[37],"are":[39],"shown":[40],"have":[42],"lowest":[43],"variance":[44,52],"in":[45],"wide":[47],"class":[48],"of":[49],"estimators,":[50],"achieving":[51],"reduction":[53],"relative":[54],"standard":[56],"estimators.":[57],"We":[58],"then":[59],"apply":[60],"our":[61,77],"improve":[64,82],"advertisement":[65,70],"design":[66],"major":[69],"company.":[71],"Consistent":[72],"theoretical":[75],"result,":[76],"allow":[79],"us":[80],"on":[83],"existing":[85],"algorithm":[87],"more":[89],"statistical":[90],"confidence":[91],"compared":[92],"state-of-theart":[95],"benchmark.":[96]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2021,"cited_by_count":8},{"year":2020,"cited_by_count":10},{"year":2019,"cited_by_count":2},{"year":2018,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
