{"id":"https://openalex.org/W3022588902","doi":"https://doi.org/10.1109/ciss48834.2020.1570627382","title":"Escaping Saddle Points for Zeroth-order Non-convex Optimization using Estimated Gradient Descent","display_name":"Escaping Saddle Points for Zeroth-order Non-convex Optimization using Estimated Gradient Descent","publication_year":2020,"publication_date":"2020-03-01","ids":{"openalex":"https://openalex.org/W3022588902","doi":"https://doi.org/10.1109/ciss48834.2020.1570627382","mag":"3022588902"},"language":"en","primary_location":{"id":"doi:10.1109/ciss48834.2020.1570627382","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ciss48834.2020.1570627382","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 54th Annual Conference on Information Sciences and Systems (CISS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5075904309","display_name":"Qinbo Bai","orcid":"https://orcid.org/0000-0003-2933-1180"},"institutions":[{"id":"https://openalex.org/I219193219","display_name":"Purdue University West Lafayette","ror":"https://ror.org/02dqehb95","country_code":"US","type":"education","lineage":["https://openalex.org/I219193219"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Qinbo Bai","raw_affiliation_strings":["Purdue University, West Lafayette, IN, USA"],"affiliations":[{"raw_affiliation_string":"Purdue University, West Lafayette, IN, USA","institution_ids":["https://openalex.org/I219193219"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111079060","display_name":"Mridul Agarwal","orcid":null},"institutions":[{"id":"https://openalex.org/I219193219","display_name":"Purdue University West Lafayette","ror":"https://ror.org/02dqehb95","country_code":"US","type":"education","lineage":["https://openalex.org/I219193219"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mridul Agarwal","raw_affiliation_strings":["Purdue University, West Lafayette, IN, USA"],"affiliations":[{"raw_affiliation_string":"Purdue University, West Lafayette, IN, USA","institution_ids":["https://openalex.org/I219193219"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5064822688","display_name":"Vaneet Aggarwal","orcid":"https://orcid.org/0000-0001-9131-4723"},"institutions":[{"id":"https://openalex.org/I219193219","display_name":"Purdue University West Lafayette","ror":"https://ror.org/02dqehb95","country_code":"US","type":"education","lineage":["https://openalex.org/I219193219"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Vaneet Aggarwal","raw_affiliation_strings":["Purdue University, West Lafayette, IN, USA"],"affiliations":[{"raw_affiliation_string":"Purdue University, West Lafayette, IN, USA","institution_ids":["https://openalex.org/I219193219"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5075904309"],"corresponding_institution_ids":["https://openalex.org/I219193219"],"apc_list":null,"apc_paid":null,"fwci":0.7042,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.64255377,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":"abs 1902 4811v2","issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10500","display_name":"Sparse and Compressive Sensing Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10500","display_name":"Sparse and Compressive Sensing Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10963","display_name":"Advanced Optimization Algorithms Research","score":0.9926000237464905,"subfield":{"id":"https://openalex.org/subfields/2612","display_name":"Numerical Analysis"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/stationary-point","display_name":"Stationary point","score":0.86146080493927},{"id":"https://openalex.org/keywords/saddle-point","display_name":"Saddle point","score":0.832413911819458},{"id":"https://openalex.org/keywords/gradient-descent","display_name":"Gradient descent","score":0.764862060546875},{"id":"https://openalex.org/keywords/stochastic-gradient-descent","display_name":"Stochastic gradient descent","score":0.6132709383964539},{"id":"https://openalex.org/keywords/convex-optimization","display_name":"Convex optimization","score":0.5120444893836975},{"id":"https://openalex.org/keywords/gradient-method","display_name":"Gradient method","score":0.5024070739746094},{"id":"https://openalex.org/keywords/descent","display_name":"Descent (aeronautics)","score":0.5004279613494873},{"id":"https://openalex.org/keywords/convex-function","display_name":"Convex function","score":0.49700120091438293},{"id":"https://openalex.org/keywords/applied-mathematics","display_name":"Applied mathematics","score":0.4911043643951416},{"id":"https://openalex.org/keywords/oracle","display_name":"Oracle","score":0.4794993996620178},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.4682517945766449},{"id":"https://openalex.org/keywords/order","display_name":"Order (exchange)","score":0.4635801315307617},{"id":"https://openalex.org/keywords/regular-polygon","display_name":"Regular polygon","score":0.4349513351917267},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.4302509129047394},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.4182325303554535},{"id":"https://openalex.org/keywords/convexity","display_name":"Convexity","score":0.41302230954170227},{"id":"https://openalex.org/keywords/hessian-matrix","display_name":"Hessian matrix","score":0.4130017161369324},{"id":"https://openalex.org/keywords/mathematical-analysis","display_name":"Mathematical analysis","score":0.23502078652381897},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.21664628386497498},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.10718950629234314},{"id":"https://openalex.org/keywords/geometry","display_name":"Geometry","score":0.10428369045257568},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.09367048740386963}],"concepts":[{"id":"https://openalex.org/C189237950","wikidata":"https://www.wikidata.org/wiki/Q2500758","display_name":"Stationary point","level":2,"score":0.86146080493927},{"id":"https://openalex.org/C2681867","wikidata":"https://www.wikidata.org/wiki/Q690935","display_name":"Saddle point","level":2,"score":0.832413911819458},{"id":"https://openalex.org/C153258448","wikidata":"https://www.wikidata.org/wiki/Q1199743","display_name":"Gradient descent","level":3,"score":0.764862060546875},{"id":"https://openalex.org/C206688291","wikidata":"https://www.wikidata.org/wiki/Q7617819","display_name":"Stochastic gradient descent","level":3,"score":0.6132709383964539},{"id":"https://openalex.org/C157972887","wikidata":"https://www.wikidata.org/wiki/Q463359","display_name":"Convex optimization","level":3,"score":0.5120444893836975},{"id":"https://openalex.org/C115680565","wikidata":"https://www.wikidata.org/wiki/Q5977448","display_name":"Gradient method","level":2,"score":0.5024070739746094},{"id":"https://openalex.org/C2776637919","wikidata":"https://www.wikidata.org/wiki/Q624380","display_name":"Descent (aeronautics)","level":2,"score":0.5004279613494873},{"id":"https://openalex.org/C145446738","wikidata":"https://www.wikidata.org/wiki/Q319913","display_name":"Convex function","level":3,"score":0.49700120091438293},{"id":"https://openalex.org/C28826006","wikidata":"https://www.wikidata.org/wiki/Q33521","display_name":"Applied mathematics","level":1,"score":0.4911043643951416},{"id":"https://openalex.org/C55166926","wikidata":"https://www.wikidata.org/wiki/Q2892946","display_name":"Oracle","level":2,"score":0.4794993996620178},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.4682517945766449},{"id":"https://openalex.org/C182306322","wikidata":"https://www.wikidata.org/wiki/Q1779371","display_name":"Order (exchange)","level":2,"score":0.4635801315307617},{"id":"https://openalex.org/C112680207","wikidata":"https://www.wikidata.org/wiki/Q714886","display_name":"Regular polygon","level":2,"score":0.4349513351917267},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4302509129047394},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.4182325303554535},{"id":"https://openalex.org/C72134830","wikidata":"https://www.wikidata.org/wiki/Q5166524","display_name":"Convexity","level":2,"score":0.41302230954170227},{"id":"https://openalex.org/C203616005","wikidata":"https://www.wikidata.org/wiki/Q620495","display_name":"Hessian matrix","level":2,"score":0.4130017161369324},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.23502078652381897},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.21664628386497498},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.10718950629234314},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.10428369045257568},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.09367048740386963},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.0},{"id":"https://openalex.org/C153294291","wikidata":"https://www.wikidata.org/wiki/Q25261","display_name":"Meteorology","level":1,"score":0.0},{"id":"https://openalex.org/C106159729","wikidata":"https://www.wikidata.org/wiki/Q2294553","display_name":"Financial economics","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C10138342","wikidata":"https://www.wikidata.org/wiki/Q43015","display_name":"Finance","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ciss48834.2020.1570627382","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ciss48834.2020.1570627382","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 54th Annual Conference on Information Sciences and Systems (CISS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":44,"referenced_works":["https://openalex.org/W181733065","https://openalex.org/W2009941369","https://openalex.org/W2106005123","https://openalex.org/W2149479912","https://openalex.org/W2364072717","https://openalex.org/W2474090883","https://openalex.org/W2592651140","https://openalex.org/W2596367596","https://openalex.org/W2601846890","https://openalex.org/W2609037894","https://openalex.org/W2767380555","https://openalex.org/W2808670221","https://openalex.org/W2886474253","https://openalex.org/W2891057995","https://openalex.org/W2920022891","https://openalex.org/W2951610569","https://openalex.org/W2962876518","https://openalex.org/W2963092340","https://openalex.org/W2963446085","https://openalex.org/W2963586744","https://openalex.org/W2966868123","https://openalex.org/W2970054779","https://openalex.org/W2972203720","https://openalex.org/W2982492801","https://openalex.org/W2996534391","https://openalex.org/W3022588902","https://openalex.org/W3103457637","https://openalex.org/W4288420069","https://openalex.org/W4289543026","https://openalex.org/W4298326176","https://openalex.org/W6681804681","https://openalex.org/W6707261557","https://openalex.org/W6713348437","https://openalex.org/W6720643467","https://openalex.org/W6734280532","https://openalex.org/W6735641298","https://openalex.org/W6745438911","https://openalex.org/W6752743159","https://openalex.org/W6754297394","https://openalex.org/W6754584241","https://openalex.org/W6757770300","https://openalex.org/W6759850933","https://openalex.org/W6768219332","https://openalex.org/W6768873880"],"related_works":["https://openalex.org/W2963487351","https://openalex.org/W2769394111","https://openalex.org/W2978731891","https://openalex.org/W2963763253","https://openalex.org/W1526607502","https://openalex.org/W836608889","https://openalex.org/W3022588902","https://openalex.org/W4293777210","https://openalex.org/W4360890478","https://openalex.org/W4360998190"],"abstract_inverted_index":{"Gradient":[0],"descent":[1],"and":[2],"its":[3],"variants":[4],"are":[5,63],"widely":[6],"used":[7],"in":[8,20,65],"machine":[9,66],"learning.":[10],"However,":[11],"oracle":[12],"access":[13],"of":[14,27,35,98],"gradient":[15,28,37,40],"may":[16],"not":[17],"be":[18],"available":[19],"many":[21],"applications,":[22],"limiting":[23],"the":[24,55,59,76,99],"direct":[25],"use":[26],"descent.":[29],"This":[30],"paper":[31],"proposes":[32],"a":[33,45],"method":[34],"estimating":[36],"to":[38,44,69],"perform":[39],"descent,":[41],"that":[42,75],"converges":[43],"second-order":[46,60],"stationary":[47,57,61,85],"point":[48,86],"for":[49,101],"general":[50],"non-convex":[51,79],"optimization":[52,80],"problems.":[53],"Beyond":[54],"first-order":[56],"properties,":[58],"properties":[62],"important":[64],"learning":[67],"applications":[68],"achieve":[70],"better":[71],"performance.":[72],"We":[73],"show":[74],"proposed":[77],"model-free":[78],"algorithm":[81],"returns":[82],"an":[83],"\u03b5-second-order":[84],"with":[87],"\u00d5(d":[88],"<sup":[89,93],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[90,94],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">2</sup>":[91],"+\u03b8/2/\u03b5":[92],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">8+\u03b8</sup>":[95],")":[96],"queries":[97],"function":[100],"any":[102],"arbitrary":[103],"\u03b8":[104],">":[105],"0.":[106]},"counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2020,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
