{"id":"https://openalex.org/W2962987366","doi":"https://doi.org/10.1145/3321408.3323078","title":"Second-order multi-armed bandit learning for online optimization in communication and networks","display_name":"Second-order multi-armed bandit learning for online optimization in communication and networks","publication_year":2019,"publication_date":"2019-05-17","ids":{"openalex":"https://openalex.org/W2962987366","doi":"https://doi.org/10.1145/3321408.3323078","mag":"2962987366"},"language":"en","primary_location":{"id":"doi:10.1145/3321408.3323078","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3321408.3323078","pdf_url":null,"source":{"id":"https://openalex.org/S4306523950","display_name":"Proceedings of the ACM Turing Celebration Conference - China","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM Turing Celebration Conference - China","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5004489029","display_name":"Zhiyong Du","orcid":"https://orcid.org/0000-0001-8925-4960"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhiyong Du","raw_affiliation_strings":["National University of Defense Technology, China"],"affiliations":[{"raw_affiliation_string":"National University of Defense Technology, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066951710","display_name":"Bin Jiang","orcid":"https://orcid.org/0000-0003-3177-2970"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bin Jiang","raw_affiliation_strings":["National University of Defense Technology, China"],"affiliations":[{"raw_affiliation_string":"National University of Defense Technology, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046010374","display_name":"Kun Xu","orcid":"https://orcid.org/0000-0003-2050-9042"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kun Xu","raw_affiliation_strings":["National University of Defense Technology, China"],"affiliations":[{"raw_affiliation_string":"National University of Defense Technology, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5073732148","display_name":"Shengyun Wei","orcid":"https://orcid.org/0000-0002-0358-190X"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shengyun Wei","raw_affiliation_strings":["National University of Defense Technology, China"],"affiliations":[{"raw_affiliation_string":"National University of Defense Technology, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056629689","display_name":"Shengqing Wang","orcid":"https://orcid.org/0000-0002-7880-8451"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shengqing Wang","raw_affiliation_strings":["National University of Defense Technology, China"],"affiliations":[{"raw_affiliation_string":"National University of Defense Technology, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5106466651","display_name":"Huatao Zhu","orcid":"https://orcid.org/0000-0001-5314-4954"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Huatao Zhu","raw_affiliation_strings":["National University of Defense Technology, China"],"affiliations":[{"raw_affiliation_string":"National University of Defense Technology, China","institution_ids":["https://openalex.org/I170215575"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5004489029"],"corresponding_institution_ids":["https://openalex.org/I170215575"],"apc_list":null,"apc_paid":null,"fwci":1.1784,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.76510638,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9876999855041504,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10603","display_name":"Smart Grid Energy Management","score":0.9775000214576721,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7065352201461792},{"id":"https://openalex.org/keywords/order","display_name":"Order (exchange)","score":0.604192316532135},{"id":"https://openalex.org/keywords/multi-armed-bandit","display_name":"Multi-armed bandit","score":0.5031830668449402},{"id":"https://openalex.org/keywords/online-learning","display_name":"Online learning","score":0.49048277735710144},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.32372158765792847},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.32307136058807373},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.22854703664779663},{"id":"https://openalex.org/keywords/multimedia","display_name":"Multimedia","score":0.1641586720943451},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.09488239884376526},{"id":"https://openalex.org/keywords/business","display_name":"Business","score":0.07995414733886719}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7065352201461792},{"id":"https://openalex.org/C182306322","wikidata":"https://www.wikidata.org/wiki/Q1779371","display_name":"Order (exchange)","level":2,"score":0.604192316532135},{"id":"https://openalex.org/C123197309","wikidata":"https://www.wikidata.org/wiki/Q2882343","display_name":"Multi-armed bandit","level":3,"score":0.5031830668449402},{"id":"https://openalex.org/C2986087404","wikidata":"https://www.wikidata.org/wiki/Q15946010","display_name":"Online learning","level":2,"score":0.49048277735710144},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.32372158765792847},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.32307136058807373},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.22854703664779663},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.1641586720943451},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.09488239884376526},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.07995414733886719},{"id":"https://openalex.org/C50817715","wikidata":"https://www.wikidata.org/wiki/Q79895177","display_name":"Regret","level":2,"score":0.0},{"id":"https://openalex.org/C10138342","wikidata":"https://www.wikidata.org/wiki/Q43015","display_name":"Finance","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3321408.3323078","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3321408.3323078","pdf_url":null,"source":{"id":"https://openalex.org/S4306523950","display_name":"Proceedings of the ACM Turing Celebration Conference - China","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM Turing Celebration Conference - China","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/8","display_name":"Decent work and economic growth","score":0.46000000834465027}],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":23,"referenced_works":["https://openalex.org/W1496659747","https://openalex.org/W1751431909","https://openalex.org/W1973027670","https://openalex.org/W1998027131","https://openalex.org/W2009551863","https://openalex.org/W2015056750","https://openalex.org/W2074341757","https://openalex.org/W2088530598","https://openalex.org/W2108114251","https://openalex.org/W2120125372","https://openalex.org/W2121863487","https://openalex.org/W2140571193","https://openalex.org/W2157146750","https://openalex.org/W2168405694","https://openalex.org/W2270701543","https://openalex.org/W2295471379","https://openalex.org/W2735793369","https://openalex.org/W2791827017","https://openalex.org/W2884396969","https://openalex.org/W2962748815","https://openalex.org/W3102381603","https://openalex.org/W4214717370","https://openalex.org/W4299811804"],"related_works":["https://openalex.org/W2398102130","https://openalex.org/W1587673378","https://openalex.org/W3188962172","https://openalex.org/W2772917594","https://openalex.org/W4306742369","https://openalex.org/W4303457083","https://openalex.org/W4212898069","https://openalex.org/W2131146434","https://openalex.org/W2951359407","https://openalex.org/W3113630707"],"abstract_inverted_index":{"Multi-armed":[0],"bandit":[1],"(MAB)":[2],"based":[3],"reinforcement":[4],"learning,":[5],"which":[6],"is":[7,38,73,156,165],"able":[8],"to":[9,39,110,173],"learn":[10,40],"in":[11,29,82,116,193],"dynamic":[12,78,106],"and":[13,31,90,136,182,195],"uncertain":[14],"environments":[15],"with":[16],"analytic":[17],"performance":[18],"bound,":[19],"provides":[20],"a":[21,76,126,131,152,185],"robust":[22],"optimization":[23],"framework":[24],"for":[25],"resource":[26,190],"optimization/scheduling":[27,191],"problems":[28,192],"communication":[30,56,194],"networks.":[32,196],"The":[33,178],"goal":[34],"of":[35,71,88,93,107,144,189],"MAB":[36,99,128,180],"problem":[37],"the":[41,45,48,60,63,68,104,141,162,175],"best":[42,133],"arms,":[43],"i.e.,":[44],"arms":[46],"provide":[47,111],"largest":[49],"reward":[50,72,145],"mean":[51,61],"when":[52,114],"played.":[53],"In":[54],"actual":[55],"systems,":[57,89],"not":[58,102],"only":[59],"(i.e.,":[62],"first-order":[64],"statistic),":[65],"but":[66],"also":[67],"second-order":[69,105,127,142,153,179],"dynamics":[70,143],"important,":[74],"since":[75],"larger":[77],"range":[79],"may":[80],"result":[81],"more":[83,186],"frequent":[84],"reconfiguration":[85],"or":[86],"adaptation":[87],"user":[91],"quality":[92],"experience":[94],"(QoE)":[95],"degradation.":[96],"However,":[97],"traditional":[98],"models":[100],"did":[101],"consider":[103],"reward,":[108],"failing":[109],"tailored":[112],"characterization":[113,188],"applied":[115],"communications.":[117],"Motivated":[118],"by":[119],"this":[120,122],"issue,":[121],"paper":[123],"first":[124],"proposes":[125],"problem.":[129],"Specifically,":[130],"new":[132],"arm":[134],"metric":[135],"associated":[137],"regret":[138],"that":[139,161],"take":[140],"into":[146],"account":[147],"explicitly":[148],"are":[149,171],"redefined.":[150],"Then,":[151],"learning":[154],"algorithm":[155,164,183],"designed.":[157],"We":[158],"further":[159],"prove":[160],"proposed":[163,176],"order-optimal.":[166],"Finally,":[167],"some":[168],"simulation":[169],"results":[170],"presented":[172],"validate":[174],"algorithm.":[177],"model":[181],"enable":[184],"fine-grained":[187]},"counts_by_year":[{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2019,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
