{"id":"https://openalex.org/W4392911125","doi":"https://doi.org/10.1109/icassp48485.2024.10447312","title":"Fast Test Error Rates for Gradient-Based Algorithms on Separable Data","display_name":"Fast Test Error Rates for Gradient-Based Algorithms on Separable Data","publication_year":2024,"publication_date":"2024-03-18","ids":{"openalex":"https://openalex.org/W4392911125","doi":"https://doi.org/10.1109/icassp48485.2024.10447312"},"language":"en","primary_location":{"id":"doi:10.1109/icassp48485.2024.10447312","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/icassp48485.2024.10447312","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2024 - 2024 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5053095531","display_name":"Puneesh Deora","orcid":null},"institutions":[{"id":"https://openalex.org/I141945490","display_name":"University of British Columbia","ror":"https://ror.org/03rmrcq20","country_code":"CA","type":"education","lineage":["https://openalex.org/I141945490"]}],"countries":["CA"],"is_corresponding":true,"raw_author_name":"Puneesh Deora","raw_affiliation_strings":["University of British Columbia"],"affiliations":[{"raw_affiliation_string":"University of British Columbia","institution_ids":["https://openalex.org/I141945490"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071075838","display_name":"Bhavya Vasudeva","orcid":"https://orcid.org/0000-0003-1307-3017"},"institutions":[{"id":"https://openalex.org/I1174212","display_name":"University of Southern California","ror":"https://ror.org/03taz7m60","country_code":"US","type":"education","lineage":["https://openalex.org/I1174212"]},{"id":"https://openalex.org/I2800817003","display_name":"Southern California University for Professional Studies","ror":"https://ror.org/058zz0t50","country_code":"US","type":"education","lineage":["https://openalex.org/I2800817003"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Bhavya Vasudeva","raw_affiliation_strings":["University of Southern California"],"affiliations":[{"raw_affiliation_string":"University of Southern California","institution_ids":["https://openalex.org/I2800817003","https://openalex.org/I1174212"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009088661","display_name":"Vatsal Sharan","orcid":"https://orcid.org/0009-0003-1280-5623"},"institutions":[{"id":"https://openalex.org/I1174212","display_name":"University of Southern California","ror":"https://ror.org/03taz7m60","country_code":"US","type":"education","lineage":["https://openalex.org/I1174212"]},{"id":"https://openalex.org/I2800817003","display_name":"Southern California University for Professional Studies","ror":"https://ror.org/058zz0t50","country_code":"US","type":"education","lineage":["https://openalex.org/I2800817003"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Vatsal Sharan","raw_affiliation_strings":["University of Southern California"],"affiliations":[{"raw_affiliation_string":"University of Southern California","institution_ids":["https://openalex.org/I2800817003","https://openalex.org/I1174212"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5024812488","display_name":"Christos Thrampoulidis","orcid":"https://orcid.org/0000-0001-9053-9365"},"institutions":[{"id":"https://openalex.org/I141945490","display_name":"University of British Columbia","ror":"https://ror.org/03rmrcq20","country_code":"CA","type":"education","lineage":["https://openalex.org/I141945490"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Christos Thrampoulidis","raw_affiliation_strings":["University of British Columbia"],"affiliations":[{"raw_affiliation_string":"University of British Columbia","institution_ids":["https://openalex.org/I141945490"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5053095531"],"corresponding_institution_ids":["https://openalex.org/I141945490"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.04321067,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"80","issue":null,"first_page":"7440","last_page":"7444"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10500","display_name":"Sparse and Compressive Sensing Techniques","score":0.9850999712944031,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10500","display_name":"Sparse and Compressive Sensing Techniques","score":0.9850999712944031,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10136","display_name":"Statistical Methods and Inference","score":0.9708999991416931,"subfield":{"id":"https://openalex.org/subfields/2613","display_name":"Statistics and Probability"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.9700999855995178,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6298902034759521},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.6072988510131836},{"id":"https://openalex.org/keywords/separable-space","display_name":"Separable space","score":0.5607478618621826},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.24854612350463867}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6298902034759521},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.6072988510131836},{"id":"https://openalex.org/C70710897","wikidata":"https://www.wikidata.org/wiki/Q680081","display_name":"Separable space","level":2,"score":0.5607478618621826},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.24854612350463867},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp48485.2024.10447312","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/icassp48485.2024.10447312","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2024 - 2024 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":18,"referenced_works":["https://openalex.org/W1583837637","https://openalex.org/W1607832978","https://openalex.org/W2136398689","https://openalex.org/W2790253170","https://openalex.org/W2911495555","https://openalex.org/W2914141962","https://openalex.org/W4287748599","https://openalex.org/W6745276634","https://openalex.org/W6748155593","https://openalex.org/W6748742374","https://openalex.org/W6749015878","https://openalex.org/W6752591435","https://openalex.org/W6761030284","https://openalex.org/W6768178264","https://openalex.org/W6779598207","https://openalex.org/W6780430711","https://openalex.org/W6784903187","https://openalex.org/W6796720488"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2051487156","https://openalex.org/W2073681303","https://openalex.org/W2009525028","https://openalex.org/W2390279801","https://openalex.org/W4321064619","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109"],"abstract_inverted_index":{"In":[0,81],"recent":[1,50],"research":[2,89],"aimed":[3],"at":[4],"understanding":[5],"the":[6,35,39],"strong":[7],"generalization":[8,67,94,127],"performance":[9,128],"of":[10,88,121,131],"simple":[11],"gradient-based":[12],"methods":[13],"on":[14,27],"overparameterized":[15],"models,":[16],"it":[17],"has":[18],"been":[19,70],"demonstrated":[20],"that":[21,54,111],"when":[22],"training":[23,122],"a":[24,58],"linear":[25],"predictor":[26,36],"separable":[28],"data":[29],"with":[30],"an":[31],"exponentially-tailed":[32],"loss":[33],"function,":[34],"converges":[37],"towards":[38],"max-margin":[40],"classifier":[41],"direction,":[42],"explaining":[43],"its":[44],"resistance":[45],"to":[46],"overfitting":[47,55],"asymptotically.":[48],"Moreover,":[49],"findings":[51],"have":[52,69],"shown":[53],"is":[56],"not":[57],"concern":[59],"even":[60],"in":[61,119,129],"finite-time":[62,66,93],"scenarios":[63],"(non-asymptotically),":[64],"as":[65,114],"bounds":[68,95],"derived":[71],"for":[72,96],"gradient":[73,75],"flow,":[74],"descent":[76],"(GD),":[77],"and":[78,90,104],"stochastic":[79],"GD.":[80,107],"this":[82,86],"work,":[83],"we":[84],"extend":[85],"line":[87],"obtain":[91],"new":[92],"other":[97],"popular":[98],"first-order":[99],"methods,":[100,113],"namely":[101],"normalized":[102],"GD":[103],"Nesterov\u2019s":[105],"accelerated":[106],"Our":[108],"results":[109],"reveal":[110],"these":[112],"they":[115],"converge":[116],"more":[117],"rapidly":[118],"terms":[120,130],"loss,":[123],"also":[124],"exhibit":[125],"enhanced":[126],"test":[132],"error.":[133]},"counts_by_year":[],"updated_date":"2025-12-25T23:11:45.687758","created_date":"2025-10-10T00:00:00"}
