{"id":"https://openalex.org/W2100415632","doi":"https://doi.org/10.48550/arxiv.2604.24555","title":"Efficient learning by implicit exploration in bandit problems with side observations","display_name":"Efficient learning by implicit exploration in bandit problems with side observations","publication_year":2026,"publication_date":"2026-04-27","ids":{"openalex":"https://openalex.org/W2100415632","doi":"https://doi.org/10.48550/arxiv.2604.24555","mag":"2100415632"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2604.24555","is_oa":true,"landing_page_url":"https://arxiv.org/abs/2604.24555","pdf_url":"https://arxiv.org/pdf/2604.24555","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2604.24555","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5071092378","display_name":"Tom\u00e1\u0161 Koc\u00e1k","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kocak, Tomas","raw_affiliation_strings":["SEQUEL - Sequential Learning (France)"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"SEQUEL - Sequential Learning (France)","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077167635","display_name":"Gergely Neu","orcid":"https://orcid.org/0000-0001-6287-3796"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Neu, Gergely","raw_affiliation_strings":["SEQUEL - Sequential Learning (France)"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"SEQUEL - Sequential Learning (France)","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5106038276","display_name":"Michal Valko","orcid":"https://orcid.org/0009-0007-8593-7765"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Valko, Michal","raw_affiliation_strings":["SEQUEL - Sequential Learning (France)"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"SEQUEL - Sequential Learning (France)","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5016419651","display_name":"R\u00e9mi Munos","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Munos, Remi","raw_affiliation_strings":["SEQUEL - Sequential Learning (France)"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"SEQUEL - Sequential Learning (France)","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":130,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9897000193595886,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/regret","display_name":"Regret","score":0.8437670469284058},{"id":"https://openalex.org/keywords/observability","display_name":"Observability","score":0.8260968327522278},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7452964782714844},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.48888128995895386},{"id":"https://openalex.org/keywords/online-learning","display_name":"Online learning","score":0.4867834746837616},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.436029314994812},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.42433416843414307},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.3272692561149597},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3212428689002991},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1677769124507904}],"concepts":[{"id":"https://openalex.org/C50817715","wikidata":"https://www.wikidata.org/wiki/Q79895177","display_name":"Regret","level":2,"score":0.8437670469284058},{"id":"https://openalex.org/C36299963","wikidata":"https://www.wikidata.org/wiki/Q1369844","display_name":"Observability","level":2,"score":0.8260968327522278},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7452964782714844},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.48888128995895386},{"id":"https://openalex.org/C2986087404","wikidata":"https://www.wikidata.org/wiki/Q15946010","display_name":"Online learning","level":2,"score":0.4867834746837616},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.436029314994812},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.42433416843414307},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3272692561149597},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3212428689002991},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1677769124507904},{"id":"https://openalex.org/C28826006","wikidata":"https://www.wikidata.org/wiki/Q33521","display_name":"Applied mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"pmh:oai:arXiv.org:2604.24555","is_oa":true,"landing_page_url":"https://arxiv.org/abs/2604.24555","pdf_url":"https://arxiv.org/pdf/2604.24555","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"pmh:oai:lilloa.univ-lille.fr:20.500.12210/25821","is_oa":true,"landing_page_url":"http://hdl.handle.net/20.500.12210/25821","pdf_url":"http://hdl.handle.net/20.500.12210/25821","source":{"id":"https://openalex.org/S4306402203","display_name":"LillOA (Universit\u00e9 de Lille (University Of Lille))","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210123514","host_organization_name":"Centre d'Etudes en Civilisations, Langues et Litt\u00e9ratures Etrang\u00e8res","host_organization_lineage":["https://openalex.org/I4210123514"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/conferenceObject"},{"id":"pmh:oai:HAL:hal-01079351v2","is_oa":true,"landing_page_url":"https://inria.hal.science/hal-01079351","pdf_url":null,"source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Neural Information Processing Systems, Dec 2014, Montr\u00e9al, Canada","raw_type":"Conference papers"},{"id":"doi:10.48550/arxiv.2604.24555","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.24555","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2604.24555","is_oa":true,"landing_page_url":"https://arxiv.org/abs/2604.24555","pdf_url":"https://arxiv.org/pdf/2604.24555","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.550000011920929,"display_name":"Quality Education"}],"awards":[{"id":"https://openalex.org/G1222903755","display_name":null,"funder_award_id":"270327","funder_id":"https://openalex.org/F4320322727","funder_display_name":"Minist\u00e8re de l'Education Nationale, de l'Enseignement Superieur et de la Recherche"}],"funders":[{"id":"https://openalex.org/F4320322727","display_name":"Minist\u00e8re de l'Education Nationale, de l'Enseignement Superieur et de la Recherche","ror":"https://ror.org/03sjk9a61"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2100415632.pdf","grobid_xml":"https://content.openalex.org/works/W2100415632.grobid-xml"},"referenced_works_count":16,"referenced_works":["https://openalex.org/W35251828","https://openalex.org/W1561097743","https://openalex.org/W1570963478","https://openalex.org/W1647316391","https://openalex.org/W1979675141","https://openalex.org/W2055639053","https://openalex.org/W2077902449","https://openalex.org/W2093825590","https://openalex.org/W2129962685","https://openalex.org/W2137905700","https://openalex.org/W2152898676","https://openalex.org/W2152951864","https://openalex.org/W2169401877","https://openalex.org/W2611627047","https://openalex.org/W2914156981","https://openalex.org/W2963389158"],"related_works":["https://openalex.org/W2046459260","https://openalex.org/W2971351794","https://openalex.org/W4376155396","https://openalex.org/W2967463586","https://openalex.org/W1947085858","https://openalex.org/W2765830098","https://openalex.org/W1971989957","https://openalex.org/W2101991911","https://openalex.org/W2963351290","https://openalex.org/W3041944716"],"abstract_inverted_index":{"We":[0],"consider":[1],"online":[2,104],"learning":[3],"problems":[4,107],"under":[5],"a":[6,59,97,156,166],"partial":[7,99],"observability":[8],"model":[9],"capturing":[10],"situations":[11],"where":[12,108],"the":[13,17,27,39,55,65,72,84,109,113,122,145,153,190],"information":[14,22,100],"conveyed":[15],"to":[16,35,43,82,176],"learner":[18,40,114],"is":[19,115,174],"between":[20,116],"full":[21,119],"and":[23,58,118,143,182],"bandit":[24],"feedback.":[25,120],"In":[26],"simplest":[28],"variant,":[29],"we":[30,70,94,136],"assume":[31],"that":[32,75,102],"in":[33,133],"addition":[34],"its":[36,89],"own":[37],"loss,":[38],"also":[41,95],"gets":[42],"observe":[44],"losses":[45,52],"of":[46,124,147,155],"some":[47],"other":[48],"actions.":[49,90],"The":[50],"revealed":[51],"depend":[53],"on":[54,165],"learner's":[56],"action":[57],"directed":[60],"observation":[61,85],"system":[62,86],"chosen":[63],"by":[64,112],"environment.":[66],"For":[67],"this":[68,134],"setting,":[69,135],"propose":[71,137],"first":[73,126],"algorithm":[74,127,139],"enjoys":[76],"near-optimal":[77],"regret":[78],"guarantees":[79],"without":[80],"having":[81],"know":[83],"before":[87],"selecting":[88],"Along":[91],"similar":[92,141],"lines,":[93],"define":[96],"new":[98],"setting":[101],"models":[103],"combinatorial":[105],"optimization":[106],"feedback":[110],"received":[111],"semi-bandit":[117],"As":[121],"predictions":[123],"our":[125],"cannot":[128],"be":[129,177],"always":[130,148],"computed":[131],"efficiently":[132],"another":[138],"with":[140,144],"properties":[142],"benefit":[146],"being":[149],"computationally":[150,181],"efficient,":[151],"at":[152],"price":[154],"slightly":[157],"more":[158,178],"complicated":[159],"tuning":[160],"mechanism.":[161],"Both":[162],"algorithms":[163],"rely":[164],"novel":[167],"exploration":[168,187],"strategy":[169],"called":[170],"implicit":[171],"exploration,":[172],"which":[173],"shown":[175],"efficient":[179],"both":[180],"information-theoretically":[183],"than":[184],"previously":[185],"studied":[186],"strategies":[188],"for":[189],"problem.":[191]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":5},{"year":2021,"cited_by_count":12},{"year":2020,"cited_by_count":63},{"year":2019,"cited_by_count":11},{"year":2018,"cited_by_count":6},{"year":2017,"cited_by_count":4},{"year":2016,"cited_by_count":9},{"year":2015,"cited_by_count":9}],"updated_date":"2026-06-14T07:44:22.658603","created_date":"2016-06-24T00:00:00"}
