{"id":"https://openalex.org/W4407802475","doi":"https://doi.org/10.1007/s10994-025-06738-9","title":"Empirical risk minimization in the interpolating regime with application to neural network learning","display_name":"Empirical risk minimization in the interpolating regime with application to neural network learning","publication_year":2025,"publication_date":"2025-02-21","ids":{"openalex":"https://openalex.org/W4407802475","doi":"https://doi.org/10.1007/s10994-025-06738-9"},"language":"en","primary_location":{"id":"doi:10.1007/s10994-025-06738-9","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10994-025-06738-9","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10994-025-06738-9.pdf","source":{"id":"https://openalex.org/S62148650","display_name":"Machine Learning","issn_l":"0885-6125","issn":["0885-6125","1573-0565"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Machine Learning","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/s10994-025-06738-9.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5074351427","display_name":"Nicole M\u00fccke","orcid":"https://orcid.org/0000-0002-5708-1820"},"institutions":[{"id":"https://openalex.org/I94509681","display_name":"Technische Universit\u00e4t Braunschweig","ror":"https://ror.org/010nsgg66","country_code":"DE","type":"education","lineage":["https://openalex.org/I94509681"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Nicole M\u00fccke","raw_affiliation_strings":["Institute for Mathematical Stochastics, Technical University of Braunschweig, Brunswick, Germany"],"affiliations":[{"raw_affiliation_string":"Institute for Mathematical Stochastics, Technical University of Braunschweig, Brunswick, Germany","institution_ids":["https://openalex.org/I94509681"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5001083977","display_name":"Ingo Steinwart","orcid":"https://orcid.org/0000-0002-4436-7109"},"institutions":[{"id":"https://openalex.org/I100066346","display_name":"University of Stuttgart","ror":"https://ror.org/04vnq7t77","country_code":"DE","type":"education","lineage":["https://openalex.org/I100066346"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Ingo Steinwart","raw_affiliation_strings":["Institute for Stochastics and Applications, University of Stuttgart, Stuttgart, Germany"],"affiliations":[{"raw_affiliation_string":"Institute for Stochastics and Applications, University of Stuttgart, Stuttgart, Germany","institution_ids":["https://openalex.org/I100066346"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5074351427"],"corresponding_institution_ids":["https://openalex.org/I94509681"],"apc_list":{"value":2390,"currency":"EUR","value_usd":2990},"apc_paid":{"value":2390,"currency":"EUR","value_usd":2990},"fwci":2.7855,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.89248562,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"114","issue":"4","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9958999752998352,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10057","display_name":"Face and Expression Recognition","score":0.9950000047683716,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/empirical-risk-minimization","display_name":"Empirical risk minimization","score":0.8819307088851929},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.7245607376098633},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.6445461511611938},{"id":"https://openalex.org/keywords/interpolation","display_name":"Interpolation (computer graphics)","score":0.5620715618133545},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5421304702758789},{"id":"https://openalex.org/keywords/zero","display_name":"Zero (linguistics)","score":0.5132303237915039},{"id":"https://openalex.org/keywords/minification","display_name":"Minification","score":0.5087230801582336},{"id":"https://openalex.org/keywords/empirical-research","display_name":"Empirical research","score":0.4683650732040405},{"id":"https://openalex.org/keywords/regression","display_name":"Regression","score":0.46274736523628235},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4337505102157593},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.42029309272766113},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.3947663903236389},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3902754485607147},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.39020735025405884},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.2644028961658478},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.20322883129119873}],"concepts":[{"id":"https://openalex.org/C107321475","wikidata":"https://www.wikidata.org/wiki/Q5374254","display_name":"Empirical risk minimization","level":2,"score":0.8819307088851929},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.7245607376098633},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.6445461511611938},{"id":"https://openalex.org/C137800194","wikidata":"https://www.wikidata.org/wiki/Q11713455","display_name":"Interpolation (computer graphics)","level":3,"score":0.5620715618133545},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5421304702758789},{"id":"https://openalex.org/C2780813799","wikidata":"https://www.wikidata.org/wiki/Q3274237","display_name":"Zero (linguistics)","level":2,"score":0.5132303237915039},{"id":"https://openalex.org/C147764199","wikidata":"https://www.wikidata.org/wiki/Q6865248","display_name":"Minification","level":2,"score":0.5087230801582336},{"id":"https://openalex.org/C120936955","wikidata":"https://www.wikidata.org/wiki/Q2155640","display_name":"Empirical research","level":2,"score":0.4683650732040405},{"id":"https://openalex.org/C83546350","wikidata":"https://www.wikidata.org/wiki/Q1139051","display_name":"Regression","level":2,"score":0.46274736523628235},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4337505102157593},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.42029309272766113},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.3947663903236389},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3902754485607147},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.39020735025405884},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.2644028961658478},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.20322883129119873},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/s10994-025-06738-9","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10994-025-06738-9","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10994-025-06738-9.pdf","source":{"id":"https://openalex.org/S62148650","display_name":"Machine Learning","issn_l":"0885-6125","issn":["0885-6125","1573-0565"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Machine Learning","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1007/s10994-025-06738-9","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10994-025-06738-9","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10994-025-06738-9.pdf","source":{"id":"https://openalex.org/S62148650","display_name":"Machine Learning","issn_l":"0885-6125","issn":["0885-6125","1573-0565"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Machine Learning","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"No poverty","score":0.6200000047683716,"id":"https://metadata.un.org/sdg/1"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320322958","display_name":"Technische Universit\u00e4t Braunschweig","ror":"https://ror.org/010nsgg66"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4407802475.pdf","grobid_xml":"https://content.openalex.org/works/W4407802475.grobid-xml"},"referenced_works_count":50,"referenced_works":["https://openalex.org/W335436902","https://openalex.org/W1484867920","https://openalex.org/W1489087445","https://openalex.org/W1511694993","https://openalex.org/W1564947197","https://openalex.org/W2015143722","https://openalex.org/W2109999160","https://openalex.org/W2130315424","https://openalex.org/W2148603752","https://openalex.org/W2566079294","https://openalex.org/W2776610675","https://openalex.org/W2787302432","https://openalex.org/W2807299122","https://openalex.org/W2807842867","https://openalex.org/W2886067286","https://openalex.org/W2895992958","https://openalex.org/W2899748887","https://openalex.org/W2900103278","https://openalex.org/W2914852400","https://openalex.org/W2922153390","https://openalex.org/W2946302218","https://openalex.org/W2946963372","https://openalex.org/W2950220847","https://openalex.org/W2971127900","https://openalex.org/W2975935587","https://openalex.org/W2990138404","https://openalex.org/W2992097177","https://openalex.org/W3018252856","https://openalex.org/W3034952177","https://openalex.org/W3046835365","https://openalex.org/W3093129138","https://openalex.org/W3102511045","https://openalex.org/W3135891919","https://openalex.org/W3158239976","https://openalex.org/W3169697178","https://openalex.org/W3172995164","https://openalex.org/W3180080120","https://openalex.org/W3184387346","https://openalex.org/W3186740493","https://openalex.org/W3201938571","https://openalex.org/W3210660362","https://openalex.org/W4236362309","https://openalex.org/W4388506988","https://openalex.org/W4393190247","https://openalex.org/W4400601118","https://openalex.org/W6730267373","https://openalex.org/W6763725367","https://openalex.org/W6792841710","https://openalex.org/W6797630644","https://openalex.org/W7071374342"],"related_works":["https://openalex.org/W3013650182","https://openalex.org/W2989283631","https://openalex.org/W4249605382","https://openalex.org/W4313491656","https://openalex.org/W2155195660","https://openalex.org/W2060518740","https://openalex.org/W4367626110","https://openalex.org/W2052343155","https://openalex.org/W2262246290","https://openalex.org/W2103875979"],"abstract_inverted_index":{"Abstract":[0],"A":[1],"common":[2],"strategy":[3],"to":[4,11,17,64,94,114],"train":[5,18],"deep":[6],"neural":[7],"networks":[8],"(DNNs)":[9],"is":[10,57],"use":[12],"very":[13,139],"large":[14,77,126,166],"architectures":[15],"and":[16,96,121,164],"them":[19],"until":[20],"they":[21],"(almost)":[22],"achieve":[23],"zero":[24,107,161],"training":[25,108,162],"error.":[26,109],"Empirically":[27],"observed":[28],"good":[29,140],"generalization":[30,66],"performance":[31],"on":[32],"test":[33],"data,":[34],"even":[35],"in":[36,52,69,146],"the":[37,49,147,154],"presence":[38],"of":[39,41],"lots":[40],"label":[42],"noise,":[43],"corroborate":[44],"such":[45],"a":[46],"procedure.":[47],"On":[48],"other":[50],"hand,":[51],"statistical":[53,141],"learning":[54,98],"theory":[55],"it":[56],"known":[58],"that":[59,123,153],"over-fitting":[60],"models":[61],"may":[62],"lead":[63],"poor":[65],"properties,":[67],"occurring":[68],"e.g.":[70],"empirical":[71,135],"risk":[72,136],"minimization":[73],"(ERM)":[74],"over":[75],"too":[76],"hypotheses":[78,127],"classes.":[79],"Inspired":[80],"by":[81],"this":[82,112],"contradictory":[83],"behavior,":[84],"so-called":[85],"interpolation":[86],"methods":[87,99,116],"have":[88],"recently":[89],"received":[90],"much":[91],"attention,":[92],"leading":[93],"consistent":[95],"optimally":[97],"for,":[100],"e.g.,":[101],"some":[102,133],"local":[103],"averaging":[104],"schemes":[105],"with":[106,160],"We":[110],"extend":[111],"analysis":[113],"ERM-like":[115],"for":[117,124,158],"least":[118],"squares":[119],"regression":[120],"show":[122,152],"certain,":[125],"classes":[128],"called":[129],"inflated":[130],"histograms":[131],",":[132],"interpolating":[134],"minimizers":[137],"enjoy":[138],"guarantees":[142],"while":[143],"others":[144],"fail":[145],"worst":[148],"sense.":[149],"Moreover,":[150],"we":[151],"same":[155],"phenomenon":[156],"occurs":[157],"DNNs":[159],"error":[163],"sufficiently":[165],"architectures.":[167]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-03-10T16:38:18.471706","created_date":"2025-10-10T00:00:00"}
