{"id":"https://openalex.org/W4409363922","doi":"https://doi.org/10.1609/aaai.v39i19.34269","title":"On Local Overfitting and Forgetting in Deep Neural Networks","display_name":"On Local Overfitting and Forgetting in Deep Neural Networks","publication_year":2025,"publication_date":"2025-04-11","ids":{"openalex":"https://openalex.org/W4409363922","doi":"https://doi.org/10.1609/aaai.v39i19.34269"},"language":"en","primary_location":{"id":"doi:10.1609/aaai.v39i19.34269","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v39i19.34269","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/34269/36424","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://ojs.aaai.org/index.php/AAAI/article/download/34269/36424","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5063110000","display_name":"Uri Stern","orcid":null},"institutions":[{"id":"https://openalex.org/I197251160","display_name":"Hebrew University of Jerusalem","ror":"https://ror.org/03qxff017","country_code":"IL","type":"education","lineage":["https://openalex.org/I197251160"]}],"countries":["IL"],"is_corresponding":true,"raw_author_name":"Uri Stern","raw_affiliation_strings":["Hebrew University of Jerusalem"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Hebrew University of Jerusalem","institution_ids":["https://openalex.org/I197251160"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5115539693","display_name":"Tomer Yaacoby","orcid":null},"institutions":[{"id":"https://openalex.org/I197251160","display_name":"Hebrew University of Jerusalem","ror":"https://ror.org/03qxff017","country_code":"IL","type":"education","lineage":["https://openalex.org/I197251160"]}],"countries":["IL"],"is_corresponding":false,"raw_author_name":"Tomer Yaacoby","raw_affiliation_strings":["Hebrew University of Jerusalem"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Hebrew University of Jerusalem","institution_ids":["https://openalex.org/I197251160"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5000206190","display_name":"Daphna Weinshall","orcid":null},"institutions":[{"id":"https://openalex.org/I197251160","display_name":"Hebrew University of Jerusalem","ror":"https://ror.org/03qxff017","country_code":"IL","type":"education","lineage":["https://openalex.org/I197251160"]}],"countries":["IL"],"is_corresponding":false,"raw_author_name":"Daphna Weinshall","raw_affiliation_strings":["Hebrew University of Jerusalem"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Hebrew University of Jerusalem","institution_ids":["https://openalex.org/I197251160"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5063110000"],"corresponding_institution_ids":["https://openalex.org/I197251160"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.16895604,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"39","issue":"19","first_page":"20592","last_page":"20600"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9623000025749207,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9623000025749207,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/overfitting","display_name":"Overfitting","score":0.9557924270629883},{"id":"https://openalex.org/keywords/forgetting","display_name":"Forgetting","score":0.7856259346008301},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.6459037661552429},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5756919384002686},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.47190696001052856},{"id":"https://openalex.org/keywords/deep-neural-networks","display_name":"Deep neural networks","score":0.42934128642082214},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3683333992958069},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.3068709969520569},{"id":"https://openalex.org/keywords/cognitive-psychology","display_name":"Cognitive psychology","score":0.276723176240921}],"concepts":[{"id":"https://openalex.org/C22019652","wikidata":"https://www.wikidata.org/wiki/Q331309","display_name":"Overfitting","level":3,"score":0.9557924270629883},{"id":"https://openalex.org/C7149132","wikidata":"https://www.wikidata.org/wiki/Q1377840","display_name":"Forgetting","level":2,"score":0.7856259346008301},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.6459037661552429},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5756919384002686},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.47190696001052856},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.42934128642082214},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3683333992958069},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.3068709969520569},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.276723176240921}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1609/aaai.v39i19.34269","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v39i19.34269","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/34269/36424","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1609/aaai.v39i19.34269","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v39i19.34269","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/34269/36424","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320324256","display_name":"Y\u00fcksek\u00f6\u011fretim Kurulu","ror":"https://ror.org/00j1q0b46"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4409363922.pdf","grobid_xml":"https://content.openalex.org/works/W4409363922.grobid-xml"},"referenced_works_count":20,"referenced_works":["https://openalex.org/W115006267","https://openalex.org/W1533072162","https://openalex.org/W1682403713","https://openalex.org/W2086161653","https://openalex.org/W2095705004","https://openalex.org/W2125930537","https://openalex.org/W2788800397","https://openalex.org/W2788838181","https://openalex.org/W2894972989","https://openalex.org/W2963518130","https://openalex.org/W2994081359","https://openalex.org/W2996609754","https://openalex.org/W3139424959","https://openalex.org/W4287182527","https://openalex.org/W4387799548","https://openalex.org/W6793364036","https://openalex.org/W6795229289","https://openalex.org/W6810933673","https://openalex.org/W6810938606","https://openalex.org/W6821409176"],"related_works":["https://openalex.org/W4362597605","https://openalex.org/W1574414179","https://openalex.org/W4297676672","https://openalex.org/W3009056573","https://openalex.org/W2989932438","https://openalex.org/W4387297750","https://openalex.org/W2186333919","https://openalex.org/W2786764570","https://openalex.org/W4309960894","https://openalex.org/W2728804654"],"abstract_inverted_index":{"The":[0],"infrequent":[1],"occurrence":[2],"of":[3,34,51,73,86,89,95,106,140,155,169],"overfitting":[4,26,83],"in":[5,21,67],"deep":[6,52,96,119],"neural":[7,176],"networks":[8],"is":[9],"perplexing:":[10],"contrary":[11],"to":[12,31,70,130],"theoretical":[13,104],"expectations,":[14],"increasing":[15],"model":[16,158],"size":[17],"often":[18],"enhances":[19],"performance":[20,68,154],"practice.":[22],"But":[23],"what":[24],"if":[25],"does":[27],"occur,":[28],"though":[29],"restricted":[30],"specific":[32],"sub-regions":[33],"the":[35,48,74,87,93,137,153,167],"data":[36,75],"space?":[37],"In":[38],"this":[39,60,149],"work,":[40],"we":[41,100,122],"propose":[42],"a":[43,65,102,124,141,156],"novel":[44],"score":[45,61],"that":[46,59,81,111,128],"captures":[47],"forgetting":[49],"rate":[50],"models":[53],"on":[54,136],"validation":[55],"data.":[56],"We":[57,77],"posit":[58],"quantifies":[62],"local":[63,82],"overfitting:":[64],"decline":[66],"confined":[69],"certain":[71,103],"regions":[72],"space.":[76],"then":[78],"show":[79,110],"empirically":[80],"occurs":[84],"regardless":[85],"presence":[88],"traditional":[90],"overfitting.":[91],"Using":[92],"framework":[94],"over-parametrized":[97],"linear":[98],"models,":[99],"offer":[101],"characterization":[105],"forgotten":[107,116,132],"knowledge,":[108,133],"and":[109,179],"it":[112],"correlates":[113],"with":[114,146],"knowledge":[115,147],"by":[117],"real":[118],"models.":[120],"Finally,":[121],"devise":[123],"new":[125],"ensemble":[126],"method":[127,150,171],"aims":[129],"recover":[131],"relying":[134],"solely":[135],"training":[138,180],"history":[139],"single":[142],"network.":[143],"When":[144],"combined":[145],"distillation,":[148],"will":[151],"enhance":[152],"trained":[157],"without":[159],"adding":[160],"inference":[161],"costs.":[162],"Extensive":[163],"empirical":[164],"evaluations":[165],"demonstrate":[166],"efficacy":[168],"our":[170],"across":[172],"multiple":[173],"datasets,":[174],"contemporary":[175],"network":[177],"architectures,":[178],"protocols.":[181]},"counts_by_year":[],"updated_date":"2026-05-21T06:26:12.895304","created_date":"2025-10-10T00:00:00"}
