{"id":"https://openalex.org/W7156976908","doi":"https://doi.org/10.48550/arxiv.2604.23436","title":"Inference of Online Newton Methods with Nesterov's Accelerated Sketching","display_name":"Inference of Online Newton Methods with Nesterov's Accelerated Sketching","publication_year":2026,"publication_date":"2026-04-25","ids":{"openalex":"https://openalex.org/W7156976908","doi":"https://doi.org/10.48550/arxiv.2604.23436"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.23436","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.23436","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.23436","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5134772617","display_name":"Haoxuan Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Haoxuan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134773514","display_name":"Xinchen Du","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Du, Xinchen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5056179845","display_name":"Sen Na","orcid":"https://orcid.org/0000-0002-7977-5276"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Na, Sen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.9355999827384949,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.9355999827384949,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12814","display_name":"Gaussian Processes and Bayesian Inference","score":0.013399999588727951,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.012500000186264515,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/estimator","display_name":"Estimator","score":0.5889999866485596},{"id":"https://openalex.org/keywords/hessian-matrix","display_name":"Hessian matrix","score":0.5149000287055969},{"id":"https://openalex.org/keywords/smoothness","display_name":"Smoothness","score":0.5139999985694885},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.4837000072002411},{"id":"https://openalex.org/keywords/solver","display_name":"Solver","score":0.44269999861717224},{"id":"https://openalex.org/keywords/convergence","display_name":"Convergence (economics)","score":0.4253000020980835},{"id":"https://openalex.org/keywords/covariance","display_name":"Covariance","score":0.4221999943256378},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.39879998564720154},{"id":"https://openalex.org/keywords/newtons-method","display_name":"Newton's method","score":0.3856000006198883}],"concepts":[{"id":"https://openalex.org/C185429906","wikidata":"https://www.wikidata.org/wiki/Q1130160","display_name":"Estimator","level":2,"score":0.5889999866485596},{"id":"https://openalex.org/C203616005","wikidata":"https://www.wikidata.org/wiki/Q620495","display_name":"Hessian matrix","level":2,"score":0.5149000287055969},{"id":"https://openalex.org/C102634674","wikidata":"https://www.wikidata.org/wiki/Q868473","display_name":"Smoothness","level":2,"score":0.5139999985694885},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5005000233650208},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.4837000072002411},{"id":"https://openalex.org/C2778770139","wikidata":"https://www.wikidata.org/wiki/Q1966904","display_name":"Solver","level":2,"score":0.44269999861717224},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.43529999256134033},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.4253000020980835},{"id":"https://openalex.org/C178650346","wikidata":"https://www.wikidata.org/wiki/Q201984","display_name":"Covariance","level":2,"score":0.4221999943256378},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.4131999909877777},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4009999930858612},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.39879998564720154},{"id":"https://openalex.org/C85189116","wikidata":"https://www.wikidata.org/wiki/Q374195","display_name":"Newton's method","level":3,"score":0.3856000006198883},{"id":"https://openalex.org/C179254644","wikidata":"https://www.wikidata.org/wiki/Q13222844","display_name":"Moment (physics)","level":2,"score":0.3824000060558319},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.37389999628067017},{"id":"https://openalex.org/C32230216","wikidata":"https://www.wikidata.org/wiki/Q7882499","display_name":"Uncertainty quantification","level":2,"score":0.3675000071525574},{"id":"https://openalex.org/C65778772","wikidata":"https://www.wikidata.org/wiki/Q12345341","display_name":"Asymptotic distribution","level":3,"score":0.3450999855995178},{"id":"https://openalex.org/C134261354","wikidata":"https://www.wikidata.org/wiki/Q938438","display_name":"Statistical inference","level":2,"score":0.31619998812675476},{"id":"https://openalex.org/C57869625","wikidata":"https://www.wikidata.org/wiki/Q1783502","display_name":"Rate of convergence","level":3,"score":0.30550000071525574},{"id":"https://openalex.org/C28826006","wikidata":"https://www.wikidata.org/wiki/Q33521","display_name":"Applied mathematics","level":1,"score":0.295199990272522},{"id":"https://openalex.org/C108650721","wikidata":"https://www.wikidata.org/wiki/Q1783253","display_name":"Counterfactual thinking","level":2,"score":0.2906999886035919},{"id":"https://openalex.org/C129844170","wikidata":"https://www.wikidata.org/wiki/Q41299","display_name":"Quadratic equation","level":2,"score":0.2904999852180481},{"id":"https://openalex.org/C2776157432","wikidata":"https://www.wikidata.org/wiki/Q1375683","display_name":"Normality","level":2,"score":0.28619998693466187},{"id":"https://openalex.org/C55479107","wikidata":"https://www.wikidata.org/wiki/Q97663916","display_name":"Stochastic approximation","level":3,"score":0.2768999934196472},{"id":"https://openalex.org/C160920958","wikidata":"https://www.wikidata.org/wiki/Q7662746","display_name":"Synthetic data","level":2,"score":0.2759000062942505},{"id":"https://openalex.org/C21080849","wikidata":"https://www.wikidata.org/wiki/Q13611879","display_name":"Data point","level":2,"score":0.27149999141693115},{"id":"https://openalex.org/C112972136","wikidata":"https://www.wikidata.org/wiki/Q7595718","display_name":"Stability (learning theory)","level":2,"score":0.27129998803138733},{"id":"https://openalex.org/C179127668","wikidata":"https://www.wikidata.org/wiki/Q17086396","display_name":"Newton's method in optimization","level":4,"score":0.2635999917984009},{"id":"https://openalex.org/C101104100","wikidata":"https://www.wikidata.org/wiki/Q1063540","display_name":"Heteroscedasticity","level":2,"score":0.2542000114917755},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.25369998812675476},{"id":"https://openalex.org/C114954040","wikidata":"https://www.wikidata.org/wiki/Q1476018","display_name":"Quasi-Newton method","level":4,"score":0.250900000333786}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.23436","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.23436","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.23436","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.23436","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.8300793766975403,"id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Reliable":[0],"decision-making":[1],"with":[2,65,81,98,141,157],"streaming":[3],"data":[4,119],"requires":[5],"principled":[6],"uncertainty":[7,114,166],"quantification":[8,167],"of":[9,42,104,137,170,187],"online":[10,78,154,192],"methods.":[11,106],"While":[12],"first-order":[13,105],"methods":[14,175],"enable":[15],"efficient":[16],"iterate":[17,140],"updates,":[18],"their":[19],"inference":[20,47],"procedures":[21],"still":[22],"require":[23],"updating":[24],"proper":[25],"(covariance)":[26],"matrices,":[27],"incurring":[28],"$O(d^2)$":[29,102],"time":[30],"and":[31,34,39,120,126,150,172],"memory":[32],"complexity,":[33],"are":[35],"sensitive":[36],"to":[37,168],"ill-conditioning":[38],"noise":[40],"heterogeneity":[41],"the":[43,85,108,138,164,185,188],"problem.":[44],"This":[45],"costly":[46],"task":[48],"offers":[49],"an":[50,77],"opportunity":[51],"for":[52,191],"more":[53],"robust":[54],"second-order":[55],"methods,":[56],"which":[57],"are,":[58],"however,":[59],"bottlenecked":[60],"by":[61,75,146],"solving":[62],"Newton":[63,79,86,174],"systems":[64],"$O(d^3)$":[66],"complexity.":[67],"In":[68],"this":[69,73],"paper,":[70],"we":[71,111,129],"address":[72],"gap":[74],"studying":[76],"method":[80,190],"Hessian":[82],"averaging,":[83],"where":[84],"direction":[87],"at":[88],"each":[89],"step":[90],"is":[91],"approximately":[92],"computed":[93],"using":[94],"a":[95,142,147,152],"sketch-and-project":[96],"solver":[97],"Nesterov's":[99,177],"acceleration,":[100],"matching":[101],"complexity":[103],"For":[107],"proposed":[109,189],"method,":[110],"quantify":[112],"its":[113],"arising":[115],"from":[116],"both":[117],"random":[118],"randomized":[121],"computation.":[122],"Under":[123],"standard":[124],"smoothness":[125],"moment":[127],"conditions,":[128],"establish":[130],"global":[131],"almost-sure":[132],"convergence,":[133],"prove":[134],"asymptotic":[135],"normality":[136],"last":[139],"limiting":[143],"covariance":[144,155],"characterized":[145],"Lyapunov":[148],"equation,":[149],"develop":[151],"fully":[153],"estimator":[156],"non-asymptotic":[158],"convergence":[159],"guarantees.":[160],"We":[161],"also":[162],"connect":[163],"resulting":[165],"that":[169],"exact":[171],"sketched":[173],"without":[176],"acceleration.":[178],"Extensive":[179],"experiments":[180],"on":[181],"regression":[182],"models":[183],"demonstrate":[184],"superiority":[186],"inference.":[193]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-29T00:00:00"}
