{"id":"https://openalex.org/W2734694041","doi":"https://doi.org/10.1109/ijcnn.2017.7965958","title":"Risk-averse trees for learning from logged bandit feedback","display_name":"Risk-averse trees for learning from logged bandit feedback","publication_year":2017,"publication_date":"2017-05-01","ids":{"openalex":"https://openalex.org/W2734694041","doi":"https://doi.org/10.1109/ijcnn.2017.7965958","mag":"2734694041"},"language":"en","primary_location":{"id":"doi:10.1109/ijcnn.2017.7965958","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn.2017.7965958","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5039887680","display_name":"Francesco Trov\u00f2","orcid":"https://orcid.org/0000-0001-5796-7667"},"institutions":[{"id":"https://openalex.org/I93860229","display_name":"Politecnico di Milano","ror":"https://ror.org/01nffqt88","country_code":"IT","type":"education","lineage":["https://openalex.org/I93860229"]}],"countries":["IT"],"is_corresponding":true,"raw_author_name":"Francesco Trovo","raw_affiliation_strings":["Dipartirnento di Elettronica, Informazione e Bioingegneria, Politecnico di Milano, Milano, Italy"],"affiliations":[{"raw_affiliation_string":"Dipartirnento di Elettronica, Informazione e Bioingegneria, Politecnico di Milano, Milano, Italy","institution_ids":["https://openalex.org/I93860229"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051831790","display_name":"Stefano Paladino","orcid":null},"institutions":[{"id":"https://openalex.org/I93860229","display_name":"Politecnico di Milano","ror":"https://ror.org/01nffqt88","country_code":"IT","type":"education","lineage":["https://openalex.org/I93860229"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Stefano Paladino","raw_affiliation_strings":["Dipartirnento di Elettronica, Informazione e Bioingegneria, Politecnico di Milano, Milano, Italy"],"affiliations":[{"raw_affiliation_string":"Dipartirnento di Elettronica, Informazione e Bioingegneria, Politecnico di Milano, Milano, Italy","institution_ids":["https://openalex.org/I93860229"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065733742","display_name":"Paolo De Simone","orcid":"https://orcid.org/0000-0001-6713-6170"},"institutions":[{"id":"https://openalex.org/I93860229","display_name":"Politecnico di Milano","ror":"https://ror.org/01nffqt88","country_code":"IT","type":"education","lineage":["https://openalex.org/I93860229"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Paolo Simone","raw_affiliation_strings":["Dipartirnento di Elettronica, Informazione e Bioingegneria, Politecnico di Milano, Milano, Italy"],"affiliations":[{"raw_affiliation_string":"Dipartirnento di Elettronica, Informazione e Bioingegneria, Politecnico di Milano, Milano, Italy","institution_ids":["https://openalex.org/I93860229"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017130830","display_name":"Marcello Restelli","orcid":"https://orcid.org/0000-0002-6322-1076"},"institutions":[{"id":"https://openalex.org/I93860229","display_name":"Politecnico di Milano","ror":"https://ror.org/01nffqt88","country_code":"IT","type":"education","lineage":["https://openalex.org/I93860229"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Marcello Restelli","raw_affiliation_strings":["Dipartirnento di Elettronica, Informazione e Bioingegneria, Politecnico di Milano, Milano, Italy"],"affiliations":[{"raw_affiliation_string":"Dipartirnento di Elettronica, Informazione e Bioingegneria, Politecnico di Milano, Milano, Italy","institution_ids":["https://openalex.org/I93860229"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5060367013","display_name":"Nicola Gatti","orcid":"https://orcid.org/0000-0001-7349-3932"},"institutions":[{"id":"https://openalex.org/I93860229","display_name":"Politecnico di Milano","ror":"https://ror.org/01nffqt88","country_code":"IT","type":"education","lineage":["https://openalex.org/I93860229"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Nicola Gatti","raw_affiliation_strings":["Dipartirnento di Elettronica, Informazione e Bioingegneria, Politecnico di Milano, Milano, Italy"],"affiliations":[{"raw_affiliation_string":"Dipartirnento di Elettronica, Informazione e Bioingegneria, Politecnico di Milano, Milano, Italy","institution_ids":["https://openalex.org/I93860229"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5039887680"],"corresponding_institution_ids":["https://openalex.org/I93860229"],"apc_list":null,"apc_paid":null,"fwci":0.2583,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.61715105,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":"1","issue":null,"first_page":"976","last_page":"983"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10603","display_name":"Smart Grid Energy Management","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7958077192306519},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.6942228674888611},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.6790758371353149},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.6622403264045715},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6118504405021667},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.5901194214820862},{"id":"https://openalex.org/keywords/decision-tree","display_name":"Decision tree","score":0.5397428274154663},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.4537929594516754},{"id":"https://openalex.org/keywords/range","display_name":"Range (aeronautics)","score":0.4477599859237671},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.10323616862297058}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7958077192306519},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.6942228674888611},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.6790758371353149},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.6622403264045715},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6118504405021667},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.5901194214820862},{"id":"https://openalex.org/C84525736","wikidata":"https://www.wikidata.org/wiki/Q831366","display_name":"Decision tree","level":2,"score":0.5397428274154663},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.4537929594516754},{"id":"https://openalex.org/C204323151","wikidata":"https://www.wikidata.org/wiki/Q905424","display_name":"Range (aeronautics)","level":2,"score":0.4477599859237671},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.10323616862297058},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C146978453","wikidata":"https://www.wikidata.org/wiki/Q3798668","display_name":"Aerospace engineering","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/ijcnn.2017.7965958","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn.2017.7965958","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"},{"id":"pmh:oai:re.public.polimi.it:11311/1032235","is_oa":false,"landing_page_url":"http://hdl.handle.net/11311/1032235","pdf_url":null,"source":{"id":"https://openalex.org/S4306400312","display_name":"Virtual Community of Pathological Anatomy (University of Castilla La Mancha)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I79189158","host_organization_name":"University of Castilla-La Mancha","host_organization_lineage":["https://openalex.org/I79189158"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/conferenceObject"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.5899999737739563,"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":33,"referenced_works":["https://openalex.org/W8722571","https://openalex.org/W1487320471","https://openalex.org/W1587157779","https://openalex.org/W1601795611","https://openalex.org/W1677912466","https://openalex.org/W1835900096","https://openalex.org/W2010657328","https://openalex.org/W2020160576","https://openalex.org/W2039522160","https://openalex.org/W2092092836","https://openalex.org/W2099302642","https://openalex.org/W2103012681","https://openalex.org/W2112420033","https://openalex.org/W2142971854","https://openalex.org/W2164831377","https://openalex.org/W2168405694","https://openalex.org/W2182000050","https://openalex.org/W2187360726","https://openalex.org/W2251567929","https://openalex.org/W2375650553","https://openalex.org/W2911964244","https://openalex.org/W2950382198","https://openalex.org/W2989661724","https://openalex.org/W4205431832","https://openalex.org/W4233413206","https://openalex.org/W4234228486","https://openalex.org/W4246484440","https://openalex.org/W6629353124","https://openalex.org/W6638427827","https://openalex.org/W6673363407","https://openalex.org/W6684171789","https://openalex.org/W6686227676","https://openalex.org/W6687281654"],"related_works":["https://openalex.org/W17155033","https://openalex.org/W3207760230","https://openalex.org/W1496222301","https://openalex.org/W1590307681","https://openalex.org/W2536018345","https://openalex.org/W4312814274","https://openalex.org/W4384470695","https://openalex.org/W3134840015","https://openalex.org/W3036095178","https://openalex.org/W4366979180"],"abstract_inverted_index":{"Logged":[0,105],"data":[1],"is":[2,65,99],"one":[3],"of":[4,9,42,71,83,136,169],"the":[5,28,32,40,50,56,97,102,121,133,161,173,177,179,212],"most":[6],"widespread":[7],"form":[8],"recorded":[10],"information,":[11],"since":[12],"it":[13],"can":[14],"be":[15],"acquired":[16],"by":[17],"almost":[18],"any":[19],"system":[20,33,51],"and":[21,34,55,78,124,139,164,191,205,208],"stored":[22],"at":[23],"a":[24,35,43,48,59,68,85,127,157,166,184],"little":[25],"cost.":[26],"Customarily,":[27],"interaction":[29],"logs":[30],"between":[31],"user":[36,57],"(or":[37],"environment)":[38],"present":[39],"structure":[41,64],"sequential":[44],"decision":[45],"process:":[46],"given":[47],"context,":[49],"performs":[52],"an":[53,116],"action":[54],"provides":[58,165],"feedback":[60],"about":[61],"it.":[62],"This":[63],"common":[66],"to":[67,91,155],"wide":[69,185],"range":[70],"real-world":[72,192],"micro-economic":[73],"applications,":[74],"e.g.,":[75],"e-commerce":[76],"websites":[77],"advertisement":[79],"campaigns.":[80],"The":[81],"problem":[82],"learning":[84,129,203],"policy":[86],"from":[87,104,144],"such":[88],"logged":[89],"interactions":[90],"take":[92],"more":[93],"profitable":[94],"decisions":[95],"in":[96,172],"future":[98],"known":[100],"as":[101],"Learning":[103],"Bandit":[106],"Feedback":[107],"(LLBF)":[108],"problem.":[109],"In":[110],"this":[111,149],"paper,":[112],"we":[113,182],"propose":[114],"RADT,":[115],"algorithm":[117],"specifically":[118],"shaped":[119],"for":[120,148],"LLBF":[122,213],"setting":[123],"based":[125],"on":[126,160],"risk-averse":[128],"method":[130],"which":[131],"exploits":[132],"joint":[134],"use":[135],"regression":[137,206],"trees":[138],"statistical":[140],"confidence":[141],"bounds.":[142],"Differently":[143],"existing":[145,209],"techniques":[146,207],"developed":[147],"setting,":[150],"RADT":[151,198],"generates":[152],"policies":[153],"aiming":[154],"maximize":[156],"lower":[158],"bound":[159],"expected":[162],"reward":[163],"clear":[167],"characterization":[168],"those":[170],"features":[171],"context":[174],"that":[175,197],"influence":[176],"process":[178],"most.":[180],"Finally,":[181],"provide":[183],"experimental":[186],"campaign":[187],"over":[188],"both":[189,200],"synthetic":[190],"datasets":[193],"showing":[194],"empirical":[195],"evidence":[196],"outperforms":[199],"state-of-the-art":[201],"machine":[202],"classification":[204],"methods":[210],"addressing":[211],"setting.":[214]},"counts_by_year":[{"year":2018,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
