{"id":"https://openalex.org/W4405375809","doi":"https://doi.org/10.1145/3708502","title":"Acceleration by Stepsize Hedging: Multi-Step Descent and the Silver Stepsize Schedule","display_name":"Acceleration by Stepsize Hedging: Multi-Step Descent and the Silver Stepsize Schedule","publication_year":2024,"publication_date":"2024-12-13","ids":{"openalex":"https://openalex.org/W4405375809","doi":"https://doi.org/10.1145/3708502"},"language":"en","primary_location":{"id":"doi:10.1145/3708502","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3708502","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3708502","source":{"id":"https://openalex.org/S118992489","display_name":"Journal of the ACM","issn_l":"0004-5411","issn":["0004-5411","1557-735X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of the ACM","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3708502","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5039466187","display_name":"Jason M. Altschuler","orcid":"https://orcid.org/0000-0001-7367-0097"},"institutions":[{"id":"https://openalex.org/I79576946","display_name":"University of Pennsylvania","ror":"https://ror.org/00b30xv10","country_code":"US","type":"education","lineage":["https://openalex.org/I79576946"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Jason M. Altschuler","raw_affiliation_strings":["Statistics and Data Science, University of Pennsylvania, Philadelphia, United States"],"affiliations":[{"raw_affiliation_string":"Statistics and Data Science, University of Pennsylvania, Philadelphia, United States","institution_ids":["https://openalex.org/I79576946"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5031935416","display_name":"Pablo A. Parrilo","orcid":"https://orcid.org/0000-0003-1132-8477"},"institutions":[{"id":"https://openalex.org/I63966007","display_name":"Massachusetts Institute of Technology","ror":"https://ror.org/042nb2s44","country_code":"US","type":"education","lineage":["https://openalex.org/I63966007"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Pablo A. Parrilo","raw_affiliation_strings":["EECS, Massachusetts Institute of Technology, Cambridge, United States"],"affiliations":[{"raw_affiliation_string":"EECS, Massachusetts Institute of Technology, Cambridge, United States","institution_ids":["https://openalex.org/I63966007"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5039466187"],"corresponding_institution_ids":["https://openalex.org/I79576946"],"apc_list":null,"apc_paid":null,"fwci":1.548,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.85342394,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":97},"biblio":{"volume":"72","issue":"2","first_page":"1","last_page":"38"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11720","display_name":"Probability and Risk Models","score":0.9427000284194946,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11720","display_name":"Probability and Risk Models","score":0.9427000284194946,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12276","display_name":"Risk Management in Financial Firms","score":0.9200999736785889,"subfield":{"id":"https://openalex.org/subfields/1402","display_name":"Accounting"},"field":{"id":"https://openalex.org/fields/14","display_name":"Business, Management and Accounting"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10974","display_name":"Advanced Queuing Theory Analysis","score":0.9157999753952026,"subfield":{"id":"https://openalex.org/subfields/1404","display_name":"Management Information Systems"},"field":{"id":"https://openalex.org/fields/14","display_name":"Business, Management and Accounting"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/descent","display_name":"Descent (aeronautics)","score":0.7862513661384583},{"id":"https://openalex.org/keywords/acceleration","display_name":"Acceleration","score":0.7739670276641846},{"id":"https://openalex.org/keywords/schedule","display_name":"Schedule","score":0.7120659947395325},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5551775693893433},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.5090391039848328},{"id":"https://openalex.org/keywords/applied-mathematics","display_name":"Applied mathematics","score":0.3219446539878845},{"id":"https://openalex.org/keywords/operations-research","display_name":"Operations research","score":0.32099610567092896},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.2642698884010315},{"id":"https://openalex.org/keywords/aerospace-engineering","display_name":"Aerospace engineering","score":0.12707483768463135},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.12271717190742493},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.11997365951538086},{"id":"https://openalex.org/keywords/classical-mechanics","display_name":"Classical mechanics","score":0.0927843451499939}],"concepts":[{"id":"https://openalex.org/C2776637919","wikidata":"https://www.wikidata.org/wiki/Q624380","display_name":"Descent (aeronautics)","level":2,"score":0.7862513661384583},{"id":"https://openalex.org/C117896860","wikidata":"https://www.wikidata.org/wiki/Q11376","display_name":"Acceleration","level":2,"score":0.7739670276641846},{"id":"https://openalex.org/C68387754","wikidata":"https://www.wikidata.org/wiki/Q7271585","display_name":"Schedule","level":2,"score":0.7120659947395325},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5551775693893433},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.5090391039848328},{"id":"https://openalex.org/C28826006","wikidata":"https://www.wikidata.org/wiki/Q33521","display_name":"Applied mathematics","level":1,"score":0.3219446539878845},{"id":"https://openalex.org/C42475967","wikidata":"https://www.wikidata.org/wiki/Q194292","display_name":"Operations research","level":1,"score":0.32099610567092896},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2642698884010315},{"id":"https://openalex.org/C146978453","wikidata":"https://www.wikidata.org/wiki/Q3798668","display_name":"Aerospace engineering","level":1,"score":0.12707483768463135},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.12271717190742493},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.11997365951538086},{"id":"https://openalex.org/C74650414","wikidata":"https://www.wikidata.org/wiki/Q11397","display_name":"Classical mechanics","level":1,"score":0.0927843451499939},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3708502","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3708502","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3708502","source":{"id":"https://openalex.org/S118992489","display_name":"Journal of the ACM","issn_l":"0004-5411","issn":["0004-5411","1557-735X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of the ACM","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1145/3708502","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3708502","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3708502","source":{"id":"https://openalex.org/S118992489","display_name":"Journal of the ACM","issn_l":"0004-5411","issn":["0004-5411","1557-735X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of the ACM","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4405375809.pdf"},"referenced_works_count":78,"referenced_works":["https://openalex.org/W1547678669","https://openalex.org/W1570787829","https://openalex.org/W1574151794","https://openalex.org/W1860742233","https://openalex.org/W1962121538","https://openalex.org/W1979896658","https://openalex.org/W1984543816","https://openalex.org/W1988720110","https://openalex.org/W1994949122","https://openalex.org/W2038281434","https://openalex.org/W2076605490","https://openalex.org/W2077067982","https://openalex.org/W2092039302","https://openalex.org/W2097460613","https://openalex.org/W2100556411","https://openalex.org/W2124768887","https://openalex.org/W2224301425","https://openalex.org/W2298465274","https://openalex.org/W2300441948","https://openalex.org/W2316564661","https://openalex.org/W2328312024","https://openalex.org/W2344703862","https://openalex.org/W2473376220","https://openalex.org/W2493337263","https://openalex.org/W2528062157","https://openalex.org/W2552959509","https://openalex.org/W2573743997","https://openalex.org/W2626639528","https://openalex.org/W2726042758","https://openalex.org/W2765941716","https://openalex.org/W2766326610","https://openalex.org/W2793027637","https://openalex.org/W2883109957","https://openalex.org/W2896740728","https://openalex.org/W2932270064","https://openalex.org/W2936995161","https://openalex.org/W2947452777","https://openalex.org/W2949330004","https://openalex.org/W2951248065","https://openalex.org/W2953231121","https://openalex.org/W2963040514","https://openalex.org/W2963430672","https://openalex.org/W2964093568","https://openalex.org/W2964102336","https://openalex.org/W3034271472","https://openalex.org/W3035235874","https://openalex.org/W3037153379","https://openalex.org/W3048571829","https://openalex.org/W3095979953","https://openalex.org/W3100569850","https://openalex.org/W3102299214","https://openalex.org/W3104372163","https://openalex.org/W3123616448","https://openalex.org/W3136523593","https://openalex.org/W3158960540","https://openalex.org/W3179524346","https://openalex.org/W3181590451","https://openalex.org/W3188803420","https://openalex.org/W4205547947","https://openalex.org/W4205841652","https://openalex.org/W4206742934","https://openalex.org/W4221142629","https://openalex.org/W4247858869","https://openalex.org/W4249667877","https://openalex.org/W4250589301","https://openalex.org/W4293775970","https://openalex.org/W4298289021","https://openalex.org/W4301435544","https://openalex.org/W4313598413","https://openalex.org/W4376312153","https://openalex.org/W4379652848","https://openalex.org/W4384389678","https://openalex.org/W4387225595","https://openalex.org/W4401813503","https://openalex.org/W4404668568","https://openalex.org/W6682852537","https://openalex.org/W6838928366","https://openalex.org/W6856794570"],"related_works":["https://openalex.org/W2486267010","https://openalex.org/W4298096494","https://openalex.org/W1678820847","https://openalex.org/W2559216629","https://openalex.org/W2065128788","https://openalex.org/W2903899051","https://openalex.org/W4246856022","https://openalex.org/W2147193423","https://openalex.org/W2367877056","https://openalex.org/W1987783546"],"abstract_inverted_index":{"Can":[0],"we":[1,17,252],"accelerate":[2],"the":[3,10,20,48,54,61,67,152,180,186,200,218,236,255,263,284,292,297,314,320],"convergence":[4,153,197],"of":[5,137,202,235,247,257,273,323],"gradient":[6],"descent":[7,261],"without":[8],"changing":[9],"algorithm\u2014just":[11],"by":[12,224,291],"judiciously":[13,301],"choosing":[14,302],"stepsizes?":[15],"Surprisingly,":[16],"show":[18],"that":[19,109,228,254,300],"answer":[21],"is":[22,47,53,58,81,122,131,167,212],"yes.":[23],"Our":[24],"proposed":[25],"Silver":[26,119],"Stepsize":[27,120],"Schedule":[28,121],"optimizes":[29],"strongly":[30],"convex":[31,79,308],"functions":[32],"in":[33,75,125,151,208,244,270,275,307,329],"\\(\\kappa":[34,70,139],"^{\\log":[35,140],"_{\\rho":[36,96,141],"}":[37,97,142],"2}":[38,98],"\\approx":[39,99],"\\kappa":[40],"^{0.7864}\\)":[41],"iterations,":[42],"where":[43],"\\(\\rho":[44],"=1+\\sqrt":[45],"{2}\\)":[46],"silver":[49],"ratio":[50],"and":[51,66,84,105,134,174,188,259,277,282],"\u03ba":[52,65],"condition":[55],"number.":[56],"This":[57,145,279],"intermediate":[59],"between":[60,169],"textbook":[62],"unaccelerated":[63],"rate":[64,69,93],"accelerated":[68,92],"^{1/2}\\)":[71],"due":[72,198,326],"to":[73,147,199,265,311,327],"Nesterov":[74],"1983.":[76],"The":[77,118,163,205],"non-strongly":[78],"setting":[80],"conceptually":[82],"identical,":[83],"standard":[85],"black-box":[86],"reductions":[87],"imply":[88],"an":[89],"analogous":[90],"partially":[91],"\\(\\varepsilon":[94],"^{-\\log":[95],"\\varepsilon":[100],"^{-0.7864}\\)":[101],".":[102,144],"We":[103,221],"conjecture":[104],"provide":[106],"partial":[107],"evidence":[108],"these":[110,193],"rates":[111],"are":[112,182],"optimal":[113],"among":[114],"all":[115],"stepsize":[116],"schedules.":[117],"constructed":[123],"recursively":[124,229],"a":[126,148,226,240,271],"fully":[127],"explicit":[128],"way.":[129],"It":[130],"non-monotonic,":[132],"fractal-like,":[133],"approximately":[135],"periodic":[136],"period":[138],"2}\\)":[143],"leads":[146],"phase":[149],"transition":[150],"rate:":[154],"initially":[155],"super-exponential":[156],"(acceleration":[157],"regime),":[158],"then":[159],"exponential":[160],"(saturation":[161],"regime).":[162],"core":[164],"algorithmic":[165,268],"intuition":[166],"hedging":[168,258],"individually":[170],"suboptimal":[171],"strategies\u2014short":[172],"steps":[173],"long":[175],"steps\u2014since":[176],"bad":[177],"cases":[178,184],"for":[179,185,296,319],"former":[181],"good":[183],"latter,":[187],"vice":[189],"versa.":[190],"Properly":[191],"combining":[192],"stepsizes":[194,303],"yields":[195],"faster":[196],"misalignment":[201],"worst-case":[203],"functions.":[204],"key":[206,241],"challenge":[207],"proving":[209],"this":[210,223,312],"speedup":[211],"enforcing":[213],"long-range":[214],"consistency":[215],"conditions":[216],"along":[217],"algorithm\u2019s":[219],"trajectory.":[220],"do":[222],"developing":[225],"technique":[227],"glues":[230],"constraints":[231],"from":[232],"different":[233],"portions":[234],"trajectory,":[237],"thus":[238],"removing":[239],"stumbling":[242],"block":[243],"previous":[245],"analyses":[246],"optimization":[248,276],"algorithms.":[249],"More":[250],"broadly,":[251],"believe":[253],"concepts":[256],"multi-step":[260],"have":[262],"potential":[264],"be":[266],"powerful":[267],"paradigms":[269],"variety":[272],"contexts":[274],"beyond.":[278],"article":[280],"publishes":[281],"extends":[283],"first":[285,298],"author\u2019s":[286],"2018":[287],"master\u2019s":[288],"thesis":[289],"(advised":[290],"second":[293],"author)\u2014which":[294],"established":[295],"time":[299],"can":[304],"enable":[305],"acceleration":[306],"optimization.":[309],"Prior":[310],"thesis,":[313],"only":[315],"such":[316],"result":[317],"was":[318],"special":[321],"case":[322],"quadratic":[324],"optimization,":[325],"Young":[328],"1953.":[330]},"counts_by_year":[{"year":2025,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2024-12-14T00:00:00"}
