{"id":"https://openalex.org/W4321193758","doi":"https://doi.org/10.1109/tnnls.2023.3242969","title":"Understanding Short-Range Memory Effects in Deep Neural Networks","display_name":"Understanding Short-Range Memory Effects in Deep Neural Networks","publication_year":2023,"publication_date":"2023-02-17","ids":{"openalex":"https://openalex.org/W4321193758","doi":"https://doi.org/10.1109/tnnls.2023.3242969","pmid":"https://pubmed.ncbi.nlm.nih.gov/37027555"},"language":"en","primary_location":{"id":"doi:10.1109/tnnls.2023.3242969","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2023.3242969","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5006231066","display_name":"Chengli Tan","orcid":"https://orcid.org/0000-0002-7091-898X"},"institutions":[{"id":"https://openalex.org/I87445476","display_name":"Xi'an Jiaotong University","ror":"https://ror.org/017zhmm22","country_code":"CN","type":"education","lineage":["https://openalex.org/I87445476"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Chengli Tan","raw_affiliation_strings":["School of Mathematics and Statistics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, China"],"affiliations":[{"raw_affiliation_string":"School of Mathematics and Statistics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I87445476"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024880206","display_name":"Jiangshe Zhang","orcid":"https://orcid.org/0000-0002-8395-1180"},"institutions":[{"id":"https://openalex.org/I87445476","display_name":"Xi'an Jiaotong University","ror":"https://ror.org/017zhmm22","country_code":"CN","type":"education","lineage":["https://openalex.org/I87445476"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiangshe Zhang","raw_affiliation_strings":["School of Mathematics and Statistics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, China"],"affiliations":[{"raw_affiliation_string":"School of Mathematics and Statistics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I87445476"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5014312349","display_name":"Junmin Liu","orcid":"https://orcid.org/0000-0002-1462-7248"},"institutions":[{"id":"https://openalex.org/I87445476","display_name":"Xi'an Jiaotong University","ror":"https://ror.org/017zhmm22","country_code":"CN","type":"education","lineage":["https://openalex.org/I87445476"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Junmin Liu","raw_affiliation_strings":["School of Mathematics and Statistics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, China"],"affiliations":[{"raw_affiliation_string":"School of Mathematics and Statistics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I87445476"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5006231066"],"corresponding_institution_ids":["https://openalex.org/I87445476"],"apc_list":null,"apc_paid":null,"fwci":0.3479,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.62869662,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":95},"biblio":{"volume":"35","issue":"8","first_page":"10576","last_page":"10590"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9958999752998352,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/range","display_name":"Range (aeronautics)","score":0.6207419633865356},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4474513530731201},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.40821895003318787},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.31843364238739014},{"id":"https://openalex.org/keywords/materials-science","display_name":"Materials science","score":0.13693705201148987}],"concepts":[{"id":"https://openalex.org/C204323151","wikidata":"https://www.wikidata.org/wiki/Q905424","display_name":"Range (aeronautics)","level":2,"score":0.6207419633865356},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4474513530731201},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.40821895003318787},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.31843364238739014},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.13693705201148987},{"id":"https://openalex.org/C159985019","wikidata":"https://www.wikidata.org/wiki/Q181790","display_name":"Composite material","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tnnls.2023.3242969","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2023.3242969","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},{"id":"pmid:37027555","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/37027555","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on neural networks and learning systems","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4210075541","display_name":null,"funder_award_id":"62276208","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8779856710","display_name":null,"funder_award_id":"61976174","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":65,"referenced_works":["https://openalex.org/W74712529","https://openalex.org/W157361201","https://openalex.org/W1506978447","https://openalex.org/W1512184319","https://openalex.org/W1556674487","https://openalex.org/W1677182931","https://openalex.org/W1965597743","https://openalex.org/W1969324628","https://openalex.org/W1982262355","https://openalex.org/W1994035813","https://openalex.org/W2028022601","https://openalex.org/W2031753087","https://openalex.org/W2036565370","https://openalex.org/W2047229728","https://openalex.org/W2060924910","https://openalex.org/W2062242131","https://openalex.org/W2064675550","https://openalex.org/W2088215016","https://openalex.org/W2105818147","https://openalex.org/W2112746910","https://openalex.org/W2119573964","https://openalex.org/W2119635640","https://openalex.org/W2146502635","https://openalex.org/W2217490359","https://openalex.org/W2341760625","https://openalex.org/W2552194003","https://openalex.org/W2750677477","https://openalex.org/W2768267830","https://openalex.org/W2796146910","https://openalex.org/W2912811302","https://openalex.org/W2962915600","https://openalex.org/W2963177640","https://openalex.org/W2963433607","https://openalex.org/W2981382427","https://openalex.org/W2997599645","https://openalex.org/W3084521418","https://openalex.org/W4212900503","https://openalex.org/W4237099064","https://openalex.org/W4297749952","https://openalex.org/W4300567850","https://openalex.org/W4304480522","https://openalex.org/W4385245566","https://openalex.org/W4388322985","https://openalex.org/W6631190155","https://openalex.org/W6631943919","https://openalex.org/W6681435938","https://openalex.org/W6726983090","https://openalex.org/W6733862737","https://openalex.org/W6736221594","https://openalex.org/W6736583452","https://openalex.org/W6738534199","https://openalex.org/W6739826692","https://openalex.org/W6745410505","https://openalex.org/W6747381837","https://openalex.org/W6748240843","https://openalex.org/W6751983209","https://openalex.org/W6758153731","https://openalex.org/W6763485134","https://openalex.org/W6764516180","https://openalex.org/W6767185500","https://openalex.org/W6769009116","https://openalex.org/W6771233102","https://openalex.org/W6774337062","https://openalex.org/W6778032888","https://openalex.org/W6784520297"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"Stochastic":[0],"gradient":[1,29],"descent":[2],"(SGD)":[3],"is":[4,24,42,71,115,128,177],"of":[5,22,51,98,112,122,206],"fundamental":[6],"importance":[7],"in":[8,33,84,148],"deep":[9],"learning.":[10],"Despite":[11],"its":[12,15],"simplicity,":[13],"elucidating":[14],"efficacy":[16],"remains":[17],"challenging.":[18],"Conventionally,":[19],"the":[20,27,34,48,80,85,108,118,156],"success":[21],"SGD":[23,41,91,113,145,160],"ascribed":[25],"to":[26,153,171,202],"stochastic":[28,52],"noise":[30],"(SGN)":[31],"incurred":[32],"training":[35,190],"process.":[36],"Based":[37],"on":[38],"this":[39,65],"consensus,":[40],"frequently":[43],"treated":[44],"and":[45,143,175,189,199],"analyzed":[46],"as":[47,95],"Euler-Maruyama":[49],"discretization":[50,97],"differential":[53],"equations":[54],"(SDEs)":[55],"driven":[56,101,125],"by":[57,79,102,126],"either":[58],"Brownian":[59,104],"or":[60],"L\u00e9vy":[61,75],"stable":[62],"motion.":[63],"In":[64],"study,":[66],"we":[67,88],"argue":[68],"that":[69,90,159,164,179],"SGN":[70,86],"neither":[72],"Gaussian":[73],"nor":[74],"stable.":[76],"Instead,":[77],"inspired":[78],"short-range":[81,180],"correlation":[82],"emerging":[83],"series,":[87],"propose":[89],"can":[92],"be":[93],"viewed":[94],"a":[96,134,139,196,203],"an":[99,123],"SDE":[100,124],"fractional":[103],"motion":[105],"(FBM).":[106],"Accordingly,":[107],"different":[109],"convergence":[110],"behavior":[111],"dynamics":[114],"well-grounded.":[116],"Moreover,":[117],"first":[119],"passage":[120],"time":[121],"FBM":[127],"approximately":[129],"derived.":[130],"The":[131],"result":[132],"suggests":[133],"lower":[135],"escaping":[136],"rate":[137],"for":[138],"larger":[140],"Hurst":[141],"parameter,":[142],"thus,":[144],"stays":[146],"longer":[147],"flat":[149,162],"minima.":[150],"This":[151],"happens":[152],"coincide":[154],"with":[155],"well-known":[157],"phenomenon":[158],"favors":[161],"minima":[163],"generalize":[165],"well.":[166],"Extensive":[167],"experiments":[168],"are":[169],"conducted":[170],"validate":[172],"our":[173],"conjecture,":[174],"it":[176],"demonstrated":[178],"memory":[181],"effects":[182],"persist":[183],"across":[184],"various":[185],"model":[186],"architectures,":[187],"datasets,":[188],"strategies.":[191],"Our":[192],"study":[193],"opens":[194],"up":[195],"new":[197],"perspective":[198],"may":[200],"contribute":[201],"better":[204],"understanding":[205],"SGD.":[207]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
