{"id":"https://openalex.org/W7160957623","doi":"https://doi.org/10.48550/arxiv.2605.10658","title":"Why Zeroth-Order Adaptation May Forget Less: A Randomized Shaping Theory","display_name":"Why Zeroth-Order Adaptation May Forget Less: A Randomized Shaping Theory","publication_year":2026,"publication_date":"2026-05-11","ids":{"openalex":"https://openalex.org/W7160957623","doi":"https://doi.org/10.48550/arxiv.2605.10658"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.10658","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.10658","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.10658","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5135943333","display_name":"Yao Shu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shu, Yao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135931253","display_name":"Jian Mu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mu, Jian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5135965133","display_name":"Zhongxiang Dai","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dai, Zhongxiang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.6589999794960022,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.6589999794960022,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.1386999934911728,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.015799999237060547,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/forgetting","display_name":"Forgetting","score":0.5990999937057495},{"id":"https://openalex.org/keywords/smoothing","display_name":"Smoothing","score":0.5187000036239624},{"id":"https://openalex.org/keywords/curvature","display_name":"Curvature","score":0.48809999227523804},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.4580000042915344},{"id":"https://openalex.org/keywords/sampling","display_name":"Sampling (signal processing)","score":0.42570000886917114},{"id":"https://openalex.org/keywords/quadratic-equation","display_name":"Quadratic equation","score":0.4171999990940094},{"id":"https://openalex.org/keywords/identity","display_name":"Identity (music)","score":0.4092999994754791}],"concepts":[{"id":"https://openalex.org/C7149132","wikidata":"https://www.wikidata.org/wiki/Q1377840","display_name":"Forgetting","level":2,"score":0.5990999937057495},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.5475000143051147},{"id":"https://openalex.org/C3770464","wikidata":"https://www.wikidata.org/wiki/Q775963","display_name":"Smoothing","level":2,"score":0.5187000036239624},{"id":"https://openalex.org/C195065555","wikidata":"https://www.wikidata.org/wiki/Q214881","display_name":"Curvature","level":2,"score":0.48809999227523804},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.4580000042915344},{"id":"https://openalex.org/C140779682","wikidata":"https://www.wikidata.org/wiki/Q210868","display_name":"Sampling (signal processing)","level":3,"score":0.42570000886917114},{"id":"https://openalex.org/C129844170","wikidata":"https://www.wikidata.org/wiki/Q41299","display_name":"Quadratic equation","level":2,"score":0.4171999990940094},{"id":"https://openalex.org/C2778355321","wikidata":"https://www.wikidata.org/wiki/Q17079427","display_name":"Identity (music)","level":2,"score":0.4092999994754791},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.39010000228881836},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.38019999861717224},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3610999882221222},{"id":"https://openalex.org/C149629883","wikidata":"https://www.wikidata.org/wiki/Q660926","display_name":"Fraction (chemistry)","level":2,"score":0.349700003862381},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3481999933719635},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.3377000093460083},{"id":"https://openalex.org/C32848918","wikidata":"https://www.wikidata.org/wiki/Q845789","display_name":"Observable","level":2,"score":0.33640000224113464},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.3246000111103058},{"id":"https://openalex.org/C13355873","wikidata":"https://www.wikidata.org/wiki/Q2920850","display_name":"Connection (principal bundle)","level":2,"score":0.2888000011444092},{"id":"https://openalex.org/C28826006","wikidata":"https://www.wikidata.org/wiki/Q33521","display_name":"Applied mathematics","level":1,"score":0.27070000767707825},{"id":"https://openalex.org/C134786449","wikidata":"https://www.wikidata.org/wiki/Q3391255","display_name":"Planar","level":2,"score":0.26330000162124634},{"id":"https://openalex.org/C77265313","wikidata":"https://www.wikidata.org/wiki/Q879844","display_name":"Rest (music)","level":2,"score":0.25619998574256897}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.10658","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.10658","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.10658","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.10658","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Continual":[0],"learning":[1],"requires":[2],"new-task":[3],"adaptation":[4,19,67,78],"without":[5],"damaging":[6],"previously":[7],"acquired":[8],"capabilities.":[9],"Recent":[10],"forward-pass":[11],"and":[12,153,197,225],"zeroth-order":[13],"(ZO)":[14],"results":[15],"show":[16],"that":[17,54,95,139],"low-query":[18],"may":[20,181],"retain":[21],"better":[22],"than":[23],"first-order":[24],"(FO)":[25],"descent,":[26],"but":[27],"the":[28,60,64,77,86,97,104,111,115,127,147,162,183],"usual":[29],"view":[30],"of":[31,138],"ZO":[32,121,164],"as":[33],"noisy":[34],"FO":[35,128,168],"estimation":[36],"does":[37],"not":[38],"explain":[39],"why.":[40],"We":[41],"give":[42],"a":[43,51,135,176],"local":[44,202,226],"randomized":[45,179],"gradient-shaping":[46],"analysis:":[47],"finite":[48],"differences":[49],"expose":[50],"raw":[52],"shape":[53,79,165],"is":[55,175,234],"mean-aligned":[56],"with":[57],"FO,":[58,188],"while":[59,101],"norm-matched":[61,84],"comparator":[62],"fixes":[63],"expected":[65,87],"squared":[66],"norm.":[68],"Under":[69],"this":[70,108,231],"controlled":[71],"comparison,":[72],"forgetting":[73,119,124],"depends":[74],"on":[75],"how":[76,220],"exposes":[80],"retention":[81,89,99,132,184],"curvature.":[82],"For":[83],"ZO,":[85,196],"shaped":[88],"curvature":[90,140],"obeys":[91],"an":[92,157],"exact":[93,167,189],"identity":[94,109],"preserves":[96],"isotropic":[98],"floor":[100],"contracting":[102],"only":[103],"anisotropic":[105],"component.":[106],"Projecting":[107],"onto":[110],"incoming":[112],"gradient":[113,207],"yields":[114],"observable":[116],"FO--ZO":[117],"quadratic":[118],"gap:":[120],"improves":[122],"mean":[123,148],"precisely":[125],"when":[126],"direction":[129],"has":[130],"above-average":[131],"curvature,":[133,222],"by":[134,187],"query-dependent":[136],"fraction":[137],"excess.":[141],"A":[142],"practical":[143],"finite-query":[144],"accounting":[145],"separates":[146,212],"mechanism":[149],"from":[150,194,215],"one-batch":[151],"sampling":[152,199],"smoothing":[154],"perturbations.":[155],"As":[156],"algorithmic":[158],"transfer,":[159],"RISE":[160],"applies":[161],"calibrated":[163],"to":[166,237],"gradients":[169,190],"inside":[170],"parameter":[171],"blocks.":[172],"Its":[173],"target":[174],"stability--plasticity":[177],"tradeoff:":[178],"shaping":[180,203,227],"reduce":[182],"exposure":[185],"paid":[186],"remove":[191],"finite-smoothing":[192],"bias":[193],"finite-difference":[195],"blockwise":[198,210],"supplies":[200],"many":[201],"directions":[204],"after":[205],"one":[206],"computation.":[208],"The":[209],"analysis":[211],"mean-step":[213],"damage":[214],"centered":[216],"random":[217],"exposure,":[218],"showing":[219],"block-diagonal":[221],"cross-block":[223],"coupling,":[224],"diagnostics":[228],"specify":[229],"where":[230],"exact-gradient":[232],"transfer":[233],"most":[235],"likely":[236],"be":[238],"visible.":[239]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-13T00:00:00"}
