{"id":"https://openalex.org/W4392222674","doi":"https://doi.org/10.48550/arxiv.2402.16463","title":"Learning to Schedule Online Tasks with Bandit Feedback","display_name":"Learning to Schedule Online Tasks with Bandit Feedback","publication_year":2024,"publication_date":"2024-02-26","ids":{"openalex":"https://openalex.org/W4392222674","doi":"https://doi.org/10.48550/arxiv.2402.16463"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2402.16463","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2402.16463","pdf_url":"https://arxiv.org/pdf/2402.16463","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2402.16463","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101633731","display_name":"Yongxin Xu","orcid":"https://orcid.org/0000-0002-7347-8836"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Xu, Yongxin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101648785","display_name":"Shangshang Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Shangshang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101310365","display_name":"Hengquan Guo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Guo, Hengquan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028588934","display_name":"Xin Liu","orcid":"https://orcid.org/0000-0003-4420-0912"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Xin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5025859650","display_name":"Ziyu Shao","orcid":"https://orcid.org/0000-0002-8774-1391"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shao, Ziyu","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5101633731"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.9883999824523926,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.9883999824523926,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11122","display_name":"Online Learning and Analytics","score":0.9847000241279602,"subfield":{"id":"https://openalex.org/subfields/1706","display_name":"Computer Science Applications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11902","display_name":"Intelligent Tutoring Systems and Adaptive Learning","score":0.9567000269889832,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/schedule","display_name":"Schedule","score":0.7603779435157776},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5944404602050781},{"id":"https://openalex.org/keywords/online-learning","display_name":"Online learning","score":0.4965994954109192},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.33851200342178345},{"id":"https://openalex.org/keywords/multimedia","display_name":"Multimedia","score":0.20558035373687744}],"concepts":[{"id":"https://openalex.org/C68387754","wikidata":"https://www.wikidata.org/wiki/Q7271585","display_name":"Schedule","level":2,"score":0.7603779435157776},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5944404602050781},{"id":"https://openalex.org/C2986087404","wikidata":"https://www.wikidata.org/wiki/Q15946010","display_name":"Online learning","level":2,"score":0.4965994954109192},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.33851200342178345},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.20558035373687744},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2402.16463","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2402.16463","pdf_url":"https://arxiv.org/pdf/2402.16463","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2402.16463","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2402.16463","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2402.16463","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2402.16463","pdf_url":"https://arxiv.org/pdf/2402.16463","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1427296098","display_name":null,"funder_award_id":"62302305","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4392222674.pdf","grobid_xml":"https://content.openalex.org/works/W4392222674.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W2382290278","https://openalex.org/W2478288626","https://openalex.org/W4391913857","https://openalex.org/W2350741829","https://openalex.org/W2530322880"],"abstract_inverted_index":{"Online":[0],"task":[1,29,42,69,105,152,181,185],"scheduling":[2,16,110,157,182],"serves":[3],"an":[4],"integral":[5],"role":[6],"for":[7,137,179],"task-intensive":[8],"applications":[9],"in":[10,50,196,209],"cloud":[11],"computing":[12],"and":[13,37,47,55,140,164,188,191,200],"crowdsourcing.":[14],"Optimal":[15],"can":[17],"enhance":[18],"system":[19,78],"performance,":[20],"typically":[21],"measured":[22],"by":[23],"the":[24,66,85,146,176,205,211],"reward-to-cost":[25,138,214],"ratio,":[26],"under":[27,111,183],"some":[28],"arrival":[30,70,89,106,153,186],"distribution.":[31,107],"On":[32,65],"one":[33],"hand,":[34,68],"both":[35],"reward":[36,54,190],"cost":[38,56],"are":[39],"dependent":[40],"on":[41],"context":[43],"(e.g.,":[44,91],"evaluation":[45],"metric)":[46],"remain":[48,72],"black-box":[49],"practice.":[51],"These":[52],"render":[53],"hard":[57],"to":[58,74,149],"model":[59],"thus":[60],"unknown":[61,189],"before":[62],"decision":[63,142],"making.":[64],"other":[67,218],"behaviors":[71],"sensitive":[73],"factors":[75],"like":[76],"unpredictable":[77],"fluctuation":[79],"whereby":[80],"a":[81,112,120,130,141,169,197,201],"prior":[82],"estimation":[83,136],"or":[84],"conventional":[86],"assumption":[87],"of":[88,172,207],"distribution":[90,154,187],"Poisson)":[92],"may":[93],"fail.":[94],"This":[95],"implies":[96],"another":[97],"practical":[98],"yet":[99],"often":[100],"neglected":[101],"challenge,":[102],"i.e.,":[103],"uncertain":[104,184],"Towards":[108],"effective":[109],"stationary":[113],"environment":[114],"with":[115,168,217],"various":[116],"uncertainties,":[117],"we":[118],"propose":[119],"double-optimistic":[121],"learning":[122,131,167],"based":[123],"Robbins-Monro":[124,147],"(DOL-RM)":[125],"algorithm.":[126],"Specifically,":[127],"DOL-RM":[128,160,208],"integrates":[129],"module":[132,143],"that":[133,144],"incorporates":[134],"optimistic":[135],"ratio":[139,215],"utilizes":[145],"method":[148],"implicitly":[150],"learn":[151],"while":[155],"making":[156],"decisions.":[158],"Theoretically,":[159],"achieves":[161],"convergence":[162],"gap":[163],"no":[165],"regret":[166,171],"sub-linear":[170],"$O(T^{3/4})$,":[173],"which":[174],"is":[175],"first":[177],"result":[178],"online":[180],"cost.":[192],"Our":[193],"numerical":[194],"results":[195],"synthetic":[198],"experiment":[199],"real-world":[202],"application":[203],"demonstrate":[204],"effectiveness":[206],"achieving":[210],"best":[212],"cumulative":[213],"compared":[216],"state-of-the-art":[219],"baselines.":[220]},"counts_by_year":[],"updated_date":"2026-04-21T08:09:41.155169","created_date":"2025-10-10T00:00:00"}
