{"id":"https://openalex.org/W4285606081","doi":"https://doi.org/10.24963/ijcai.2022/472","title":"Multi-Armed Bandit Problem with Temporally-Partitioned Rewards: When Partial Feedback Counts","display_name":"Multi-Armed Bandit Problem with Temporally-Partitioned Rewards: When Partial Feedback Counts","publication_year":2022,"publication_date":"2022-07-01","ids":{"openalex":"https://openalex.org/W4285606081","doi":"https://doi.org/10.24963/ijcai.2022/472"},"language":"en","primary_location":{"id":"doi:10.24963/ijcai.2022/472","is_oa":true,"landing_page_url":"https://doi.org/10.24963/ijcai.2022/472","pdf_url":"https://www.ijcai.org/proceedings/2022/0472.pdf","source":{"id":"https://openalex.org/S4363608755","display_name":"Proceedings of the Thirty-First International Joint Conference on Artificial Intelligence","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Thirty-First International Joint Conference on Artificial Intelligence","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://www.ijcai.org/proceedings/2022/0472.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5002705366","display_name":"Giulia Romano","orcid":"https://orcid.org/0000-0002-2961-4538"},"institutions":[{"id":"https://openalex.org/I93860229","display_name":"Politecnico di Milano","ror":"https://ror.org/01nffqt88","country_code":"IT","type":"education","lineage":["https://openalex.org/I93860229"]}],"countries":["IT"],"is_corresponding":true,"raw_author_name":"Giulia Romano","raw_affiliation_strings":["Politecnico di Milano","Politecnico di Milano, Piazza Leonardo da Vinci 32, I-20133, Milan, Italy"],"affiliations":[{"raw_affiliation_string":"Politecnico di Milano","institution_ids":["https://openalex.org/I93860229"]},{"raw_affiliation_string":"Politecnico di Milano, Piazza Leonardo da Vinci 32, I-20133, Milan, Italy","institution_ids":["https://openalex.org/I93860229"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101069381","display_name":"Andrea Agostini","orcid":null},"institutions":[{"id":"https://openalex.org/I93860229","display_name":"Politecnico di Milano","ror":"https://ror.org/01nffqt88","country_code":"IT","type":"education","lineage":["https://openalex.org/I93860229"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Andrea Agostini","raw_affiliation_strings":["Politecnico di Milano","Politecnico di Milano, Piazza Leonardo da Vinci 32, I-20133, Milan, Italy"],"affiliations":[{"raw_affiliation_string":"Politecnico di Milano","institution_ids":["https://openalex.org/I93860229"]},{"raw_affiliation_string":"Politecnico di Milano, Piazza Leonardo da Vinci 32, I-20133, Milan, Italy","institution_ids":["https://openalex.org/I93860229"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039887680","display_name":"Francesco Trov\u00f2","orcid":"https://orcid.org/0000-0001-5796-7667"},"institutions":[{"id":"https://openalex.org/I93860229","display_name":"Politecnico di Milano","ror":"https://ror.org/01nffqt88","country_code":"IT","type":"education","lineage":["https://openalex.org/I93860229"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Francesco Trov\u00f2","raw_affiliation_strings":["Politecnico di Milano","Politecnico di Milano, Piazza Leonardo da Vinci 32, I-20133, Milan, Italy"],"affiliations":[{"raw_affiliation_string":"Politecnico di Milano","institution_ids":["https://openalex.org/I93860229"]},{"raw_affiliation_string":"Politecnico di Milano, Piazza Leonardo da Vinci 32, I-20133, Milan, Italy","institution_ids":["https://openalex.org/I93860229"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060367013","display_name":"Nicola Gatti","orcid":"https://orcid.org/0000-0001-7349-3932"},"institutions":[{"id":"https://openalex.org/I93860229","display_name":"Politecnico di Milano","ror":"https://ror.org/01nffqt88","country_code":"IT","type":"education","lineage":["https://openalex.org/I93860229"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Nicola Gatti","raw_affiliation_strings":["Politecnico di Milano","Politecnico di Milano, Piazza Leonardo da Vinci 32, I-20133, Milan, Italy"],"affiliations":[{"raw_affiliation_string":"Politecnico di Milano","institution_ids":["https://openalex.org/I93860229"]},{"raw_affiliation_string":"Politecnico di Milano, Piazza Leonardo da Vinci 32, I-20133, Milan, Italy","institution_ids":["https://openalex.org/I93860229"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5017130830","display_name":"Marcello Restelli","orcid":"https://orcid.org/0000-0002-6322-1076"},"institutions":[{"id":"https://openalex.org/I93860229","display_name":"Politecnico di Milano","ror":"https://ror.org/01nffqt88","country_code":"IT","type":"education","lineage":["https://openalex.org/I93860229"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Marcello Restelli","raw_affiliation_strings":["Politecnico di Milano","Politecnico di Milano, Piazza Leonardo da Vinci 32, I-20133, Milan, Italy"],"affiliations":[{"raw_affiliation_string":"Politecnico di Milano","institution_ids":["https://openalex.org/I93860229"]},{"raw_affiliation_string":"Politecnico di Milano, Piazza Leonardo da Vinci 32, I-20133, Milan, Italy","institution_ids":["https://openalex.org/I93860229"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5002705366"],"corresponding_institution_ids":["https://openalex.org/I93860229"],"apc_list":null,"apc_paid":null,"fwci":0.5148,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.54097483,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"3401","last_page":"3407"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10603","display_name":"Smart Grid Energy Management","score":0.9958999752998352,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12288","display_name":"Optimization and Search Problems","score":0.9954000115394592,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/regret","display_name":"Regret","score":0.8246564865112305},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7266563773155212},{"id":"https://openalex.org/keywords/smoothness","display_name":"Smoothness","score":0.624542236328125},{"id":"https://openalex.org/keywords/multi-armed-bandit","display_name":"Multi-armed bandit","score":0.58796226978302},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5644731521606445},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.562139630317688},{"id":"https://openalex.org/keywords/property","display_name":"Property (philosophy)","score":0.47604870796203613},{"id":"https://openalex.org/keywords/range","display_name":"Range (aeronautics)","score":0.45295581221580505},{"id":"https://openalex.org/keywords/active-listening","display_name":"Active listening","score":0.4244329631328583},{"id":"https://openalex.org/keywords/finite-set","display_name":"Finite set","score":0.4224092364311218},{"id":"https://openalex.org/keywords/recommender-system","display_name":"Recommender system","score":0.4109501838684082},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.33200961351394653},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.32406890392303467},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.2798231244087219},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1780775785446167}],"concepts":[{"id":"https://openalex.org/C50817715","wikidata":"https://www.wikidata.org/wiki/Q79895177","display_name":"Regret","level":2,"score":0.8246564865112305},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7266563773155212},{"id":"https://openalex.org/C102634674","wikidata":"https://www.wikidata.org/wiki/Q868473","display_name":"Smoothness","level":2,"score":0.624542236328125},{"id":"https://openalex.org/C123197309","wikidata":"https://www.wikidata.org/wiki/Q2882343","display_name":"Multi-armed bandit","level":3,"score":0.58796226978302},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5644731521606445},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.562139630317688},{"id":"https://openalex.org/C189950617","wikidata":"https://www.wikidata.org/wiki/Q937228","display_name":"Property (philosophy)","level":2,"score":0.47604870796203613},{"id":"https://openalex.org/C204323151","wikidata":"https://www.wikidata.org/wiki/Q905424","display_name":"Range (aeronautics)","level":2,"score":0.45295581221580505},{"id":"https://openalex.org/C177291462","wikidata":"https://www.wikidata.org/wiki/Q423038","display_name":"Active listening","level":2,"score":0.4244329631328583},{"id":"https://openalex.org/C162392398","wikidata":"https://www.wikidata.org/wiki/Q272404","display_name":"Finite set","level":2,"score":0.4224092364311218},{"id":"https://openalex.org/C557471498","wikidata":"https://www.wikidata.org/wiki/Q554950","display_name":"Recommender system","level":2,"score":0.4109501838684082},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.33200961351394653},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.32406890392303467},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2798231244087219},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1780775785446167},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C159985019","wikidata":"https://www.wikidata.org/wiki/Q181790","display_name":"Composite material","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C46312422","wikidata":"https://www.wikidata.org/wiki/Q11024","display_name":"Communication","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.24963/ijcai.2022/472","is_oa":true,"landing_page_url":"https://doi.org/10.24963/ijcai.2022/472","pdf_url":"https://www.ijcai.org/proceedings/2022/0472.pdf","source":{"id":"https://openalex.org/S4363608755","display_name":"Proceedings of the Thirty-First International Joint Conference on Artificial Intelligence","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Thirty-First International Joint Conference on Artificial Intelligence","raw_type":"proceedings-article"},{"id":"pmh:oai:re.public.polimi.it:11311/1231823","is_oa":true,"landing_page_url":"https://hdl.handle.net/11311/1231823","pdf_url":null,"source":{"id":"https://openalex.org/S4306400312","display_name":"Virtual Community of Pathological Anatomy (University of Castilla La Mancha)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I79189158","host_organization_name":"University of Castilla-La Mancha","host_organization_lineage":["https://openalex.org/I79189158"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/conferenceObject"}],"best_oa_location":{"id":"doi:10.24963/ijcai.2022/472","is_oa":true,"landing_page_url":"https://doi.org/10.24963/ijcai.2022/472","pdf_url":"https://www.ijcai.org/proceedings/2022/0472.pdf","source":{"id":"https://openalex.org/S4363608755","display_name":"Proceedings of the Thirty-First International Joint Conference on Artificial Intelligence","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Thirty-First International Joint Conference on Artificial Intelligence","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4285606081.pdf","grobid_xml":"https://content.openalex.org/works/W4285606081.grobid-xml"},"referenced_works_count":23,"referenced_works":["https://openalex.org/W2000850397","https://openalex.org/W2049934117","https://openalex.org/W2118980425","https://openalex.org/W2295316671","https://openalex.org/W2616619952","https://openalex.org/W2730527299","https://openalex.org/W2788991205","https://openalex.org/W2801206439","https://openalex.org/W2911829170","https://openalex.org/W2950290000","https://openalex.org/W2971268960","https://openalex.org/W3010048053","https://openalex.org/W3025710735","https://openalex.org/W3035116197","https://openalex.org/W4221161271","https://openalex.org/W4225733870","https://openalex.org/W4226074292","https://openalex.org/W4287765290","https://openalex.org/W4287957631","https://openalex.org/W4288337043","https://openalex.org/W4298093005","https://openalex.org/W4301305932","https://openalex.org/W4301597078"],"related_works":["https://openalex.org/W4289341771","https://openalex.org/W4287115590","https://openalex.org/W2958076322","https://openalex.org/W3191284239","https://openalex.org/W3176376493","https://openalex.org/W2996787464","https://openalex.org/W2964268945","https://openalex.org/W3174419385","https://openalex.org/W3172572974","https://openalex.org/W2952832562"],"abstract_inverted_index":{"There":[0],"is":[1,60,83],"a":[2,37,63,84,100,112,157,160,179,189],"rising":[3],"interest":[4],"in":[5,48,93,111],"industrial":[6],"online":[7],"applications":[8],"where":[9,22],"data":[10],"becomes":[11],"available":[12],"sequentially.":[13],"Inspired":[14],"by":[15,135],"the":[16,29,32,50,55,70,78,91,104,131,136],"recommendation":[17,192],"of":[18,31,57,66,80,87,107,163,166,182],"playlists":[19],"to":[20,77,90,121],"users":[21],"their":[23,176],"preferences":[24],"can":[25],"be":[26,97],"collected":[27,138],"during":[28],"listening":[30],"entire":[33],"playlist,":[34],"we":[35],"study":[36],"novel":[38],"bandit":[39,154],"setting,":[40,73],"namely":[41,169],"Multi-Armed":[42],"Bandit":[43],"with":[44,54],"Temporally-Partitioned":[45],"Rewards":[46],"(TP-MAB),":[47],"which":[49,94,129],"stochastic":[51],"reward":[52,137,164],"associated":[53],"pull":[56,105],"an":[58],"arm":[59],"partitioned":[61],"over":[62,99,139],"finite":[64],"number":[65],"consecutive":[67],"rounds":[68],"following":[69],"pull.":[71],"This":[72],"unexplored":[74],"so":[75],"far":[76],"best":[79],"our":[81,144],"knowledge,":[82],"natural":[85],"extension":[86],"delayed-feedback":[88,153],"bandits":[89],"case":[92],"rewards":[95],"may":[96],"dilated":[98],"finite-time":[101],"span":[102],"after":[103],"instead":[106],"being":[108],"fully":[109],"disclosed":[110,134],"single,":[113],"potentially":[114],"delayed":[115],"round.":[116],"We":[117,141,172],"provide":[118,146],"two":[119],"algorithms":[120,145,155],"address":[122],"TP-MAB":[123],"problems,":[124],"namely,":[125],"TP-UCB-FR":[126],"and":[127,187],"TP-UCB-EW,":[128],"exploit":[130],"partial":[132],"information":[133],"time.":[140],"show":[142],"that":[143],"better":[147],"asymptotical":[148],"regret":[149],"upper":[150],"bounds":[151],"than":[152],"when":[156],"property":[158],"characterizing":[159],"broad":[161],"set":[162],"structures":[165],"practical":[167],"interest,":[168],"\u03b1-smoothness,":[170],"holds.":[171],"also":[173],"empirically":[174],"evaluate":[175],"performance":[177],"across":[178],"wide":[180],"range":[181],"settings,":[183],"both":[184],"synthetically":[185],"generated":[186],"from":[188],"real-world":[190],"media":[191],"problem.":[193]},"counts_by_year":[{"year":2024,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
