{"id":"https://openalex.org/W4414360301","doi":"https://doi.org/10.24963/ijcai.2025/672","title":"Stability and Generalization for Stochastic (Compositional) Optimizations","display_name":"Stability and Generalization for Stochastic (Compositional) Optimizations","publication_year":2025,"publication_date":"2025-09-01","ids":{"openalex":"https://openalex.org/W4414360301","doi":"https://doi.org/10.24963/ijcai.2025/672"},"language":"en","primary_location":{"id":"doi:10.24963/ijcai.2025/672","is_oa":false,"landing_page_url":"https://doi.org/10.24963/ijcai.2025/672","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Thirty-Fourth International Joint Conference on Artificial Intelligence","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5108865405","display_name":"Xiaokang Pan","orcid":null},"institutions":[{"id":"https://openalex.org/I139660479","display_name":"Central South University","ror":"https://ror.org/00f1zfq44","country_code":"CN","type":"education","lineage":["https://openalex.org/I139660479"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaokang Pan","raw_affiliation_strings":["School of Computer Science and Engineering, Central South University","Xiangjiang Laboratory"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Central South University","institution_ids":["https://openalex.org/I139660479"]},{"raw_affiliation_string":"Xiangjiang Laboratory","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108047622","display_name":"Jin Liu","orcid":"https://orcid.org/0000-0002-2026-2513"},"institutions":[{"id":"https://openalex.org/I139660479","display_name":"Central South University","ror":"https://ror.org/00f1zfq44","country_code":"CN","type":"education","lineage":["https://openalex.org/I139660479"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jin Liu","raw_affiliation_strings":["School of Computer Science and Engineering, Central South University","Xiangjiang Laboratory"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Central South University","institution_ids":["https://openalex.org/I139660479"]},{"raw_affiliation_string":"Xiangjiang Laboratory","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005496603","display_name":"Hulin Kuang","orcid":"https://orcid.org/0000-0001-7341-9871"},"institutions":[{"id":"https://openalex.org/I139660479","display_name":"Central South University","ror":"https://ror.org/00f1zfq44","country_code":"CN","type":"education","lineage":["https://openalex.org/I139660479"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hulin Kuang","raw_affiliation_strings":["School of Computer Science and Engineering, Central South University","Xiangjiang Laboratory"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Central South University","institution_ids":["https://openalex.org/I139660479"]},{"raw_affiliation_string":"Xiangjiang Laboratory","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001159156","display_name":"Youqi Li","orcid":"https://orcid.org/0000-0003-3867-5997"},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Youqi Li","raw_affiliation_strings":["School of Computer Science and Technology, Beijing Institute of Technology"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Beijing Institute of Technology","institution_ids":["https://openalex.org/I125839683"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085364987","display_name":"Lixing Chen","orcid":"https://orcid.org/0000-0002-1805-0183"},"institutions":[{"id":"https://openalex.org/I1292585137","display_name":"United States Social Security Administration","ror":"https://ror.org/04b7xxn32","country_code":"US","type":"government","lineage":["https://openalex.org/I1292585137"]},{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN","US"],"is_corresponding":false,"raw_author_name":"Lixing Chen","raw_affiliation_strings":["School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University","Shanghai Key Laboratory of Integrated Administration Technologies for Information Security"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University","institution_ids":["https://openalex.org/I183067930"]},{"raw_affiliation_string":"Shanghai Key Laboratory of Integrated Administration Technologies for Information Security","institution_ids":["https://openalex.org/I1292585137"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5073473903","display_name":"Zhe Qu","orcid":"https://orcid.org/0000-0002-6368-2147"},"institutions":[{"id":"https://openalex.org/I139660479","display_name":"Central South University","ror":"https://ror.org/00f1zfq44","country_code":"CN","type":"education","lineage":["https://openalex.org/I139660479"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhe Qu","raw_affiliation_strings":["School of Computer Science and Engineering, Central South University","Xiangjiang Laboratory"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Central South University","institution_ids":["https://openalex.org/I139660479"]},{"raw_affiliation_string":"Xiangjiang Laboratory","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.27932947,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"6039","last_page":"6047"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11053","display_name":"Process Optimization and Integration","score":0.30709999799728394,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11053","display_name":"Process Optimization and Integration","score":0.30709999799728394,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10791","display_name":"Advanced Control Systems Optimization","score":0.29499998688697815,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11159","display_name":"Manufacturing Process and Optimization","score":0.2669000029563904,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.7997999787330627},{"id":"https://openalex.org/keywords/estimator","display_name":"Estimator","score":0.7289000153541565},{"id":"https://openalex.org/keywords/stability","display_name":"Stability (learning theory)","score":0.6345000267028809},{"id":"https://openalex.org/keywords/convergence","display_name":"Convergence (economics)","score":0.5623999834060669},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5338000059127808},{"id":"https://openalex.org/keywords/term","display_name":"Term (time)","score":0.39910000562667847},{"id":"https://openalex.org/keywords/rate-of-convergence","display_name":"Rate of convergence","score":0.39890000224113464},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.3926999866962433}],"concepts":[{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.7997999787330627},{"id":"https://openalex.org/C185429906","wikidata":"https://www.wikidata.org/wiki/Q1130160","display_name":"Estimator","level":2,"score":0.7289000153541565},{"id":"https://openalex.org/C112972136","wikidata":"https://www.wikidata.org/wiki/Q7595718","display_name":"Stability (learning theory)","level":2,"score":0.6345000267028809},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.5623999834060669},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.5547999739646912},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5338000059127808},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5078999996185303},{"id":"https://openalex.org/C61797465","wikidata":"https://www.wikidata.org/wiki/Q1188986","display_name":"Term (time)","level":2,"score":0.39910000562667847},{"id":"https://openalex.org/C57869625","wikidata":"https://www.wikidata.org/wiki/Q1783502","display_name":"Rate of convergence","level":3,"score":0.39890000224113464},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.3926999866962433},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.38989999890327454},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.37540000677108765},{"id":"https://openalex.org/C194387892","wikidata":"https://www.wikidata.org/wiki/Q1747770","display_name":"Stochastic optimization","level":2,"score":0.36959999799728394},{"id":"https://openalex.org/C145446738","wikidata":"https://www.wikidata.org/wiki/Q319913","display_name":"Convex function","level":3,"score":0.3427000045776367},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.3366999924182892},{"id":"https://openalex.org/C157972887","wikidata":"https://www.wikidata.org/wiki/Q463359","display_name":"Convex optimization","level":3,"score":0.326200008392334},{"id":"https://openalex.org/C206688291","wikidata":"https://www.wikidata.org/wiki/Q7617819","display_name":"Stochastic gradient descent","level":3,"score":0.3181000053882599},{"id":"https://openalex.org/C8272713","wikidata":"https://www.wikidata.org/wiki/Q176737","display_name":"Stochastic process","level":2,"score":0.31610000133514404},{"id":"https://openalex.org/C55479107","wikidata":"https://www.wikidata.org/wiki/Q97663916","display_name":"Stochastic approximation","level":3,"score":0.3107999861240387},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.30070000886917114},{"id":"https://openalex.org/C112680207","wikidata":"https://www.wikidata.org/wiki/Q714886","display_name":"Regular polygon","level":2,"score":0.2994000017642975},{"id":"https://openalex.org/C148764684","wikidata":"https://www.wikidata.org/wiki/Q621751","display_name":"Approximation algorithm","level":2,"score":0.2815999984741211},{"id":"https://openalex.org/C28826006","wikidata":"https://www.wikidata.org/wiki/Q33521","display_name":"Applied mathematics","level":1,"score":0.27720001339912415},{"id":"https://openalex.org/C137836250","wikidata":"https://www.wikidata.org/wiki/Q984063","display_name":"Optimization problem","level":2,"score":0.26019999384880066},{"id":"https://openalex.org/C124681953","wikidata":"https://www.wikidata.org/wiki/Q339062","display_name":"Decomposition","level":2,"score":0.25589999556541443}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.24963/ijcai.2025/672","is_oa":false,"landing_page_url":"https://doi.org/10.24963/ijcai.2025/672","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Thirty-Fourth International Joint Conference on Artificial Intelligence","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"The":[0],"use":[1],"of":[2,5,66,107,117,132,140,147,153,176],"estimators":[3,32,108],"instead":[4],"stochastic":[6,43,47],"gradients":[7],"for":[8,173],"updates":[9],"has":[10],"been":[11],"shown":[12],"to":[13,79,128],"improve":[14],"algorithm":[15,69],"convergence":[16,194],"rates":[17,195],"of,":[18],"but":[19],"their":[20],"impact":[21,106,182],"on":[22,38,109],"generalization":[23,64,99,183,201],"remains":[24],"under-explored.":[25],"In":[26,167],"this":[27,94,122],"paper,":[28],"we":[29,60,96,112,142],"investigate":[30],"how":[31],"influence":[33],"generalization.":[34,110],"Our":[35,160],"focus":[36],"is":[37],"two":[39,163],"widely":[40],"studied":[41],"problems:":[42],"optimization":[44,49],"(SO)":[45],"and":[46,54,126,149,189],"compositional":[48],"(SCO),":[50],"both":[51],"under":[52],"convex":[53],"non-convex":[55,158],"settings.":[56],"For":[57],"SO":[58],"problems,":[59,169],"first":[61],"analyze":[62],"the":[63,67,105,130,138,157,171,174,177],"error":[65],"STORM":[68],"as":[70],"a":[71,98,114,144,150],"foundational":[72],"step.":[73],"We":[74],"then":[75],"extend":[76],"our":[77],"analysis":[78,116,161],"SCO":[80,168],"problems":[81],"by":[82],"introducing":[83],"an":[84],"algorithmic":[85,91],"framework":[86],"that":[87],"encompasses":[88],"several":[89],"popular":[90],"approaches.":[92],"Through":[93],"framework,":[95],"conduct":[97],"analysis,":[100],"uncovering":[101],"new":[102,151],"insights":[103],"into":[104],"Subsequently,":[111],"provide":[113],"detailed":[115],"three":[118],"specific":[119],"algorithms":[120],"within":[121],"framework:":[123],"SCGD,":[124],"SCSC,":[125],"COVER,":[127],"explore":[129],"effects":[131],"different":[133],"estimator":[134,172],"strategies.":[135],"Furthermore,":[136],"in":[137,156],"context":[139],"SCO,":[141],"propose":[143],"novel":[145],"definition":[146],"stability":[148],"decomposition":[152],"excess":[154],"risk":[155],"setting.":[159],"indicates":[162],"key":[164],"findings:":[165],"(1)":[166],"eliminating":[170],"gradient":[175],"inner":[178],"function":[179],"does":[180],"not":[181],"performance":[184],"while":[185],"significantly":[186],"reducing":[187],"computational":[188],"storage":[190],"overhead.":[191],"(2)":[192],"Faster":[193],"are":[196],"consistently":[197],"associated":[198],"with":[199],"better":[200],"performance.":[202]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
