{"id":"https://openalex.org/W4225947038","doi":"https://doi.org/10.1109/isit50566.2022.9834691","title":"Accelerated Proximal Alternating Gradient-Descent-Ascent for Nonconvex Minimax Machine Learning","display_name":"Accelerated Proximal Alternating Gradient-Descent-Ascent for Nonconvex Minimax Machine Learning","publication_year":2022,"publication_date":"2022-06-26","ids":{"openalex":"https://openalex.org/W4225947038","doi":"https://doi.org/10.1109/isit50566.2022.9834691"},"language":"en","primary_location":{"id":"doi:10.1109/isit50566.2022.9834691","is_oa":false,"landing_page_url":"https://doi.org/10.1109/isit50566.2022.9834691","pdf_url":null,"source":{"id":"https://openalex.org/S4363604560","display_name":"2022 IEEE International Symposium on Information Theory (ISIT)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE International Symposium on Information Theory (ISIT)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5016356334","display_name":"Ziyi Chen","orcid":"https://orcid.org/0000-0002-5110-3400"},"institutions":[{"id":"https://openalex.org/I223532165","display_name":"University of Utah","ror":"https://ror.org/03r0ha626","country_code":"US","type":"education","lineage":["https://openalex.org/I223532165"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Ziyi Chen","raw_affiliation_strings":["University of Utah,Electrical &#x0026; Computer Engineering,Salt Lake City,US"],"affiliations":[{"raw_affiliation_string":"University of Utah,Electrical &#x0026; Computer Engineering,Salt Lake City,US","institution_ids":["https://openalex.org/I223532165"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002089057","display_name":"Shaocong Ma","orcid":"https://orcid.org/0009-0007-4414-0303"},"institutions":[{"id":"https://openalex.org/I223532165","display_name":"University of Utah","ror":"https://ror.org/03r0ha626","country_code":"US","type":"education","lineage":["https://openalex.org/I223532165"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Shaocong Ma","raw_affiliation_strings":["University of Utah,Electrical &#x0026; Computer Engineering,Salt Lake City,US"],"affiliations":[{"raw_affiliation_string":"University of Utah,Electrical &#x0026; Computer Engineering,Salt Lake City,US","institution_ids":["https://openalex.org/I223532165"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101704070","display_name":"Yi Zhou","orcid":"https://orcid.org/0000-0002-3982-9145"},"institutions":[{"id":"https://openalex.org/I223532165","display_name":"University of Utah","ror":"https://ror.org/03r0ha626","country_code":"US","type":"education","lineage":["https://openalex.org/I223532165"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yi Zhou","raw_affiliation_strings":["University of Utah,Electrical &#x0026; Computer Engineering,Salt Lake City,US"],"affiliations":[{"raw_affiliation_string":"University of Utah,Electrical &#x0026; Computer Engineering,Salt Lake City,US","institution_ids":["https://openalex.org/I223532165"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5016356334"],"corresponding_institution_ids":["https://openalex.org/I223532165"],"apc_list":null,"apc_paid":null,"fwci":1.0326,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.84378284,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"672","last_page":"677"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10500","display_name":"Sparse and Compressive Sensing Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10500","display_name":"Sparse and Compressive Sensing Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10052","display_name":"Medical Image Segmentation Techniques","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/minimax","display_name":"Minimax","score":0.8254073858261108},{"id":"https://openalex.org/keywords/gradient-descent","display_name":"Gradient descent","score":0.7365738749504089},{"id":"https://openalex.org/keywords/descent","display_name":"Descent (aeronautics)","score":0.6622484922409058},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6528922319412231},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.42697784304618835},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.38281089067459106},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.23618677258491516},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.10620149970054626},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.05032986402511597}],"concepts":[{"id":"https://openalex.org/C149728462","wikidata":"https://www.wikidata.org/wiki/Q751319","display_name":"Minimax","level":2,"score":0.8254073858261108},{"id":"https://openalex.org/C153258448","wikidata":"https://www.wikidata.org/wiki/Q1199743","display_name":"Gradient descent","level":3,"score":0.7365738749504089},{"id":"https://openalex.org/C2776637919","wikidata":"https://www.wikidata.org/wiki/Q624380","display_name":"Descent (aeronautics)","level":2,"score":0.6622484922409058},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6528922319412231},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.42697784304618835},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.38281089067459106},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.23618677258491516},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.10620149970054626},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.05032986402511597},{"id":"https://openalex.org/C146978453","wikidata":"https://www.wikidata.org/wiki/Q3798668","display_name":"Aerospace engineering","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/isit50566.2022.9834691","is_oa":false,"landing_page_url":"https://doi.org/10.1109/isit50566.2022.9834691","pdf_url":null,"source":{"id":"https://openalex.org/S4363604560","display_name":"2022 IEEE International Symposium on Information Theory (ISIT)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE International Symposium on Information Theory (ISIT)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":64,"referenced_works":["https://openalex.org/W1565791184","https://openalex.org/W1987083649","https://openalex.org/W1988720110","https://openalex.org/W2000462146","https://openalex.org/W2019569173","https://openalex.org/W2020123437","https://openalex.org/W2100556411","https://openalex.org/W2101868363","https://openalex.org/W2112796928","https://openalex.org/W2168914046","https://openalex.org/W2184634347","https://openalex.org/W2616127482","https://openalex.org/W2804907179","https://openalex.org/W2914904265","https://openalex.org/W2947996939","https://openalex.org/W2962173422","https://openalex.org/W2962717811","https://openalex.org/W2962834223","https://openalex.org/W2963809785","https://openalex.org/W2970416783","https://openalex.org/W2981188016","https://openalex.org/W2999929232","https://openalex.org/W3033192442","https://openalex.org/W3035413499","https://openalex.org/W3035665052","https://openalex.org/W3046366290","https://openalex.org/W3049427434","https://openalex.org/W3081204256","https://openalex.org/W3092878522","https://openalex.org/W3101286035","https://openalex.org/W3118809778","https://openalex.org/W3135167421","https://openalex.org/W3141595720","https://openalex.org/W3155261051","https://openalex.org/W3183755892","https://openalex.org/W3213732694","https://openalex.org/W4244387609","https://openalex.org/W4287704934","https://openalex.org/W4289754199","https://openalex.org/W4289760629","https://openalex.org/W4297944735","https://openalex.org/W4299356147","https://openalex.org/W4320013936","https://openalex.org/W6633965997","https://openalex.org/W6685044387","https://openalex.org/W6686534882","https://openalex.org/W6738096397","https://openalex.org/W6738677829","https://openalex.org/W6745454490","https://openalex.org/W6748056922","https://openalex.org/W6751852773","https://openalex.org/W6752646127","https://openalex.org/W6753194085","https://openalex.org/W6759395059","https://openalex.org/W6763288952","https://openalex.org/W6763496775","https://openalex.org/W6763832118","https://openalex.org/W6766481192","https://openalex.org/W6769434743","https://openalex.org/W6772547972","https://openalex.org/W6774091466","https://openalex.org/W6778862977","https://openalex.org/W6782470715","https://openalex.org/W6803986650"],"related_works":["https://openalex.org/W2486267010","https://openalex.org/W2016058626","https://openalex.org/W2474724840","https://openalex.org/W4298096494","https://openalex.org/W2963760573","https://openalex.org/W1678820847","https://openalex.org/W185788778","https://openalex.org/W2895916002","https://openalex.org/W3182145356","https://openalex.org/W2015288657"],"abstract_inverted_index":{"Alternating":[0],"gradient-descent-ascent":[1],"(AltGDA)":[2],"is":[3,110,118],"an":[4,153],"optimization":[5,27,70,91],"algorithm":[6,56,82,151],"that":[7,34,57,80],"has":[8],"been":[9],"widely":[10],"used":[11],"for":[12],"model":[13],"training":[14],"in":[15,42,88,97,142],"various":[16],"machine":[17],"learning":[18],"applications,":[19],"which":[20],"aims":[21],"to":[22,65,84],"solve":[23,66],"a":[24,38,51,85,94,124],"nonconvex":[25,43,68,89],"minimax":[26,44,69,90],"problem.":[28],"However,":[29],"the":[30,74,81,98,111,119,128,138,147],"existing":[31],"studies":[32],"show":[33],"it":[35],"suffers":[36],"from":[37],"high":[39],"computation":[40,95,125],"complexity":[41,96,126],"optimization.":[45],"In":[46],"this":[47],"paper,":[48],"we":[49,78],"develop":[50],"single-loop":[52,132],"and":[53,62,92,116,134],"fast":[54],"AltGDA-type":[55],"leverages":[58],"proximal":[59],"gradient":[60],"updates":[61],"momentum":[63,75],"acceleration":[64,76],"regularized":[67],"problems.":[71],"By":[72],"leveraging":[73],"technique,":[77],"prove":[79],"converges":[83],"critical":[86],"point":[87],"achieves":[93],"order":[99],"of":[100,114,131,140,149],"$\\mathcal{O}\\left(":[101],"{{\\kappa":[102],"^{\\frac{{11}}{6}}}{\\varepsilon":[103],"^{":[104],"-":[105],"2}}}":[106],"\\right)$,":[107],"where":[108],"\u03f5":[109],"desired":[112],"level":[113],"accuracy":[115],"\u03ba":[117],"problem\u2019s":[120],"condition":[121],"number.":[122],"Such":[123],"improves":[127],"state-of-the-art":[129],"complexities":[130],"GDA":[133],"AltGDA":[135],"algorithms":[136],"(see":[137],"summary":[139],"comparison":[141],"Table":[143],"I).":[144],"We":[145],"demonstrate":[146],"effectiveness":[148],"our":[150],"via":[152],"experiment":[154],"on":[155],"adversarial":[156],"deep":[157],"learning.":[158]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
