{"id":"https://openalex.org/W2912134372","doi":"https://doi.org/10.1137/17m1150116","title":"A Newton-Based Method for Nonconvex Optimization with Fast Evasion of Saddle Points","display_name":"A Newton-Based Method for Nonconvex Optimization with Fast Evasion of Saddle Points","publication_year":2019,"publication_date":"2019-01-01","ids":{"openalex":"https://openalex.org/W2912134372","doi":"https://doi.org/10.1137/17m1150116","mag":"2912134372"},"language":"en","primary_location":{"id":"doi:10.1137/17m1150116","is_oa":false,"landing_page_url":"https://doi.org/10.1137/17m1150116","pdf_url":null,"source":{"id":"https://openalex.org/S928796702","display_name":"SIAM Journal on Optimization","issn_l":"1052-6234","issn":["1052-6234","1095-7189"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320508","host_organization_name":"Society for Industrial and Applied Mathematics","host_organization_lineage":["https://openalex.org/P4310320508"],"host_organization_lineage_names":["Society for Industrial and Applied Mathematics"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"SIAM Journal on Optimization","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5001418995","display_name":"Santiago Paternain","orcid":"https://orcid.org/0000-0001-6310-6345"},"institutions":[{"id":"https://openalex.org/I79576946","display_name":"University of Pennsylvania","ror":"https://ror.org/00b30xv10","country_code":"US","type":"education","lineage":["https://openalex.org/I79576946"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Santiago Paternain","raw_affiliation_strings":["Department of Electrical and Systems Engineering, University of Pennsylvania, Philadelphia, PA 19104"],"raw_orcid":"https://orcid.org/0000-0001-6310-6345","affiliations":[{"raw_affiliation_string":"Department of Electrical and Systems Engineering, University of Pennsylvania, Philadelphia, PA 19104","institution_ids":["https://openalex.org/I79576946"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008417632","display_name":"Aryan Mokhtari","orcid":"https://orcid.org/0000-0001-6603-0091"},"institutions":[{"id":"https://openalex.org/I4210143601","display_name":"Decision Systems (United States)","ror":"https://ror.org/0434dpa13","country_code":"US","type":"company","lineage":["https://openalex.org/I4210143601"]},{"id":"https://openalex.org/I63966007","display_name":"Massachusetts Institute of Technology","ror":"https://ror.org/042nb2s44","country_code":"US","type":"education","lineage":["https://openalex.org/I63966007"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Aryan Mokhtari","raw_affiliation_strings":["Laboratory for Information and Decision Systems, Massachusetts Institute of Technology, Cam-bridge, MA 02139"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Laboratory for Information and Decision Systems, Massachusetts Institute of Technology, Cam-bridge, MA 02139","institution_ids":["https://openalex.org/I4210143601","https://openalex.org/I63966007"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5078862959","display_name":"Alejandro Ribeiro","orcid":"https://orcid.org/0000-0003-4230-9906"},"institutions":[{"id":"https://openalex.org/I79576946","display_name":"University of Pennsylvania","ror":"https://ror.org/00b30xv10","country_code":"US","type":"education","lineage":["https://openalex.org/I79576946"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Alejandro Ribeiro","raw_affiliation_strings":["Department of Electrical and Systems Engineering, University of Pennsylvania, Philadelphia, PA 19104"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Electrical and Systems Engineering, University of Pennsylvania, Philadelphia, PA 19104","institution_ids":["https://openalex.org/I79576946"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":4.6612,"has_fulltext":false,"cited_by_count":36,"citation_normalized_percentile":{"value":0.96014935,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":95,"max":99},"biblio":{"volume":"29","issue":"1","first_page":"343","last_page":"368"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10500","display_name":"Sparse and Compressive Sensing Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10500","display_name":"Sparse and Compressive Sensing Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10963","display_name":"Advanced Optimization Algorithms Research","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/2612","display_name":"Numerical Analysis"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.8196649551391602},{"id":"https://openalex.org/keywords/hessian-matrix","display_name":"Hessian matrix","score":0.7883948683738708},{"id":"https://openalex.org/keywords/saddle-point","display_name":"Saddle point","score":0.7495781779289246},{"id":"https://openalex.org/keywords/eigenvalues-and-eigenvectors","display_name":"Eigenvalues and eigenvectors","score":0.4905790388584137},{"id":"https://openalex.org/keywords/newtons-method","display_name":"Newton's method","score":0.4876960217952728},{"id":"https://openalex.org/keywords/matrix","display_name":"Matrix (chemical analysis)","score":0.4705674350261688},{"id":"https://openalex.org/keywords/minification","display_name":"Minification","score":0.4630105495452881},{"id":"https://openalex.org/keywords/gradient-descent","display_name":"Gradient descent","score":0.4495750665664673},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.4396416246891022},{"id":"https://openalex.org/keywords/applied-mathematics","display_name":"Applied mathematics","score":0.43545791506767273},{"id":"https://openalex.org/keywords/stationary-point","display_name":"Stationary point","score":0.43469658493995667},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.3729622960090637},{"id":"https://openalex.org/keywords/combinatorics","display_name":"Combinatorics","score":0.3637378513813019},{"id":"https://openalex.org/keywords/mathematical-analysis","display_name":"Mathematical analysis","score":0.23106342554092407},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.22575786709785461},{"id":"https://openalex.org/keywords/geometry","display_name":"Geometry","score":0.15422791242599487},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.09941732883453369}],"concepts":[{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.8196649551391602},{"id":"https://openalex.org/C203616005","wikidata":"https://www.wikidata.org/wiki/Q620495","display_name":"Hessian matrix","level":2,"score":0.7883948683738708},{"id":"https://openalex.org/C2681867","wikidata":"https://www.wikidata.org/wiki/Q690935","display_name":"Saddle point","level":2,"score":0.7495781779289246},{"id":"https://openalex.org/C158693339","wikidata":"https://www.wikidata.org/wiki/Q190524","display_name":"Eigenvalues and eigenvectors","level":2,"score":0.4905790388584137},{"id":"https://openalex.org/C85189116","wikidata":"https://www.wikidata.org/wiki/Q374195","display_name":"Newton's method","level":3,"score":0.4876960217952728},{"id":"https://openalex.org/C106487976","wikidata":"https://www.wikidata.org/wiki/Q685816","display_name":"Matrix (chemical analysis)","level":2,"score":0.4705674350261688},{"id":"https://openalex.org/C147764199","wikidata":"https://www.wikidata.org/wiki/Q6865248","display_name":"Minification","level":2,"score":0.4630105495452881},{"id":"https://openalex.org/C153258448","wikidata":"https://www.wikidata.org/wiki/Q1199743","display_name":"Gradient descent","level":3,"score":0.4495750665664673},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.4396416246891022},{"id":"https://openalex.org/C28826006","wikidata":"https://www.wikidata.org/wiki/Q33521","display_name":"Applied mathematics","level":1,"score":0.43545791506767273},{"id":"https://openalex.org/C189237950","wikidata":"https://www.wikidata.org/wiki/Q2500758","display_name":"Stationary point","level":2,"score":0.43469658493995667},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.3729622960090637},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.3637378513813019},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.23106342554092407},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.22575786709785461},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.15422791242599487},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.09941732883453369},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C159985019","wikidata":"https://www.wikidata.org/wiki/Q181790","display_name":"Composite material","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C158622935","wikidata":"https://www.wikidata.org/wiki/Q660848","display_name":"Nonlinear system","level":2,"score":0.0},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.0},{"id":"https://openalex.org/C78458016","wikidata":"https://www.wikidata.org/wiki/Q840400","display_name":"Evolutionary biology","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1137/17m1150116","is_oa":false,"landing_page_url":"https://doi.org/10.1137/17m1150116","pdf_url":null,"source":{"id":"https://openalex.org/S928796702","display_name":"SIAM Journal on Optimization","issn_l":"1052-6234","issn":["1052-6234","1095-7189"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320508","host_organization_name":"Society for Industrial and Applied Mathematics","host_organization_lineage":["https://openalex.org/P4310320508"],"host_organization_lineage_names":["Society for Industrial and Applied Mathematics"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"SIAM Journal on Optimization","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G5689811493","display_name":null,"funder_award_id":"W911NF-17-2-0181","funder_id":"https://openalex.org/F4320338295","funder_display_name":"Army Research Laboratory"}],"funders":[{"id":"https://openalex.org/F4320338295","display_name":"Army Research Laboratory","ror":"https://ror.org/011hc8f90"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":17,"referenced_works":["https://openalex.org/W1994974865","https://openalex.org/W2009941369","https://openalex.org/W2011970986","https://openalex.org/W2013621063","https://openalex.org/W2015836240","https://openalex.org/W2044293264","https://openalex.org/W2069426496","https://openalex.org/W2075184363","https://openalex.org/W2078626246","https://openalex.org/W2094879958","https://openalex.org/W2156005216","https://openalex.org/W2219888463","https://openalex.org/W2398500126","https://openalex.org/W2546420264","https://openalex.org/W2601846890","https://openalex.org/W2772283936","https://openalex.org/W3103457637"],"related_works":["https://openalex.org/W1978576933","https://openalex.org/W1981914421","https://openalex.org/W3125203780","https://openalex.org/W2355987247","https://openalex.org/W2153649672","https://openalex.org/W1979925556","https://openalex.org/W2983297293","https://openalex.org/W1989888202","https://openalex.org/W2978731891","https://openalex.org/W3022588902"],"abstract_inverted_index":{"Machine":[0],"learning":[1],"problems":[2],"such":[3],"as":[4],"neural":[5],"network":[6],"training,":[7],"tensor":[8],"decomposition,":[9],"and":[10,37,77,113],"matrix":[11,85],"factorization":[12],"require":[13],"local":[14,21,148],"minimization":[15,22],"of":[16,28,31,48,62,70,82,126,133,139],"a":[17,55,79,116,147],"nonconvex":[18],"function.":[19],"This":[20,52,124],"is":[23,94,109,130],"challenged":[24],"by":[25,65,73],"the":[26,60,67,71,83,89,110,122,142],"presence":[27],"saddle":[29],"points,":[30],"which":[32,39],"there":[33],"can":[34],"be":[35],"many":[36],"from":[38,121],"descent":[40],"methods":[41],"may":[42],"take":[43],"an":[44],"inordinately":[45],"large":[46],"number":[47],"iterations":[49],"to":[50,86,96,146],"escape.":[51],"paper":[53,143],"presents":[54],"second-order":[56],"method":[57,64,93],"that":[58],"modifies":[59],"update":[61],"Newton's":[63,140],"replacing":[66],"negative":[68],"eigenvalues":[69],"Hessian":[72],"their":[74],"absolute":[75],"values":[76],"uses":[78],"truncated":[80],"version":[81],"resulting":[84],"account":[87],"for":[88],"objective's":[90],"curvature.":[91],"The":[92],"shown":[95],"escape":[97,129],"saddles":[98],"in":[99,153],"at":[100],"most":[101],"$1":[102],"+":[103,155],"\\log_{3/2}":[104],"(\\delta/2\\varepsilon)$":[105],"iterations,":[106],"where":[107],"$\\varepsilon$":[108],"target":[111],"optimality":[112],"$\\delta$":[114],"characterizes":[115],"point":[117],"sufficiently":[118],"far":[119],"away":[120],"saddle.":[123],"base":[125],"this":[127],"exponential":[128],"$3/2$":[131],"independently":[132],"problem":[134],"constants.":[135],"Adding":[136],"classical":[137],"properties":[138],"method,":[141],"proves":[144],"convergence":[145],"minimum":[149],"with":[150],"probability":[151],"$1-p$":[152],"$O\\left(\\log(1/p))":[154],"O(\\log(1/\\varepsilon)\\right)$":[156],"iterations.":[157]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":5},{"year":2024,"cited_by_count":6},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":7},{"year":2020,"cited_by_count":9},{"year":2019,"cited_by_count":4}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
