{"id":"https://openalex.org/W3003534552","doi":"https://doi.org/10.1109/tnnls.2019.2963066","title":"PID Controller-Based Stochastic Optimization Acceleration for Deep Neural Networks","display_name":"PID Controller-Based Stochastic Optimization Acceleration for Deep Neural Networks","publication_year":2020,"publication_date":"2020-01-28","ids":{"openalex":"https://openalex.org/W3003534552","doi":"https://doi.org/10.1109/tnnls.2019.2963066","mag":"3003534552","pmid":"https://pubmed.ncbi.nlm.nih.gov/32011265"},"language":"en","primary_location":{"id":"doi:10.1109/tnnls.2019.2963066","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2019.2963066","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5028229824","display_name":"Haoqian Wang","orcid":"https://orcid.org/0000-0003-2792-8469"},"institutions":[{"id":"https://openalex.org/I158809036","display_name":"Shenzhen Institute of Information Technology","ror":"https://ror.org/03wrf9427","country_code":"CN","type":"education","lineage":["https://openalex.org/I158809036"]},{"id":"https://openalex.org/I4210114105","display_name":"Tsinghua\u2013Berkeley Shenzhen Institute","ror":"https://ror.org/02hhwwz98","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210114105","https://openalex.org/I95457486","https://openalex.org/I99065089"]},{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Haoqian Wang","raw_affiliation_strings":["Shenzhen Institute of Future Media Technology, Shenzhen, China","Tsinghua Shenzhen International Graduate School, Tsinghua University, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Shenzhen Institute of Future Media Technology, Shenzhen, China","institution_ids":["https://openalex.org/I158809036"]},{"raw_affiliation_string":"Tsinghua Shenzhen International Graduate School, Tsinghua University, Shenzhen, China","institution_ids":["https://openalex.org/I4210114105","https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101547333","display_name":"Yi Luo","orcid":"https://orcid.org/0000-0002-3727-5679"},"institutions":[{"id":"https://openalex.org/I158809036","display_name":"Shenzhen Institute of Information Technology","ror":"https://ror.org/03wrf9427","country_code":"CN","type":"education","lineage":["https://openalex.org/I158809036"]},{"id":"https://openalex.org/I4210114105","display_name":"Tsinghua\u2013Berkeley Shenzhen Institute","ror":"https://ror.org/02hhwwz98","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210114105","https://openalex.org/I95457486","https://openalex.org/I99065089"]},{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yi Luo","raw_affiliation_strings":["Shenzhen Institute of Future Media Technology, Shenzhen, China","Tsinghua Shenzhen International Graduate School, Tsinghua University, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Shenzhen Institute of Future Media Technology, Shenzhen, China","institution_ids":["https://openalex.org/I158809036"]},{"raw_affiliation_string":"Tsinghua Shenzhen International Graduate School, Tsinghua University, Shenzhen, China","institution_ids":["https://openalex.org/I4210114105","https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059454224","display_name":"Wangpeng An","orcid":"https://orcid.org/0000-0002-1869-1837"},"institutions":[{"id":"https://openalex.org/I158809036","display_name":"Shenzhen Institute of Information Technology","ror":"https://ror.org/03wrf9427","country_code":"CN","type":"education","lineage":["https://openalex.org/I158809036"]},{"id":"https://openalex.org/I4210114105","display_name":"Tsinghua\u2013Berkeley Shenzhen Institute","ror":"https://ror.org/02hhwwz98","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210114105","https://openalex.org/I95457486","https://openalex.org/I99065089"]},{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wangpeng An","raw_affiliation_strings":["Shenzhen Institute of Future Media Technology, Shenzhen, China","Tsinghua Shenzhen International Graduate School, Tsinghua University, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Shenzhen Institute of Future Media Technology, Shenzhen, China","institution_ids":["https://openalex.org/I158809036"]},{"raw_affiliation_string":"Tsinghua Shenzhen International Graduate School, Tsinghua University, Shenzhen, China","institution_ids":["https://openalex.org/I4210114105","https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018132697","display_name":"Qingyun Sun","orcid":null},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Qingyun Sun","raw_affiliation_strings":["Stanford University, Stanford, CA, USA"],"affiliations":[{"raw_affiliation_string":"Stanford University, Stanford, CA, USA","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042967567","display_name":"Jun Xu","orcid":"https://orcid.org/0000-0002-1602-538X"},"institutions":[{"id":"https://openalex.org/I205237279","display_name":"Nankai University","ror":"https://ror.org/01y1kjr75","country_code":"CN","type":"education","lineage":["https://openalex.org/I205237279"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jun Xu","raw_affiliation_strings":["College of Computer Science, Nankai University, Tianjin, China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science, Nankai University, Tianjin, China","institution_ids":["https://openalex.org/I205237279"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100433899","display_name":"Lei Zhang","orcid":"https://orcid.org/0000-0002-2078-4215"},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]},{"id":"https://openalex.org/I45928872","display_name":"Alibaba Group (China)","ror":"https://ror.org/00k642b80","country_code":"CN","type":"company","lineage":["https://openalex.org/I45928872"]}],"countries":["CN","HK"],"is_corresponding":false,"raw_author_name":"Lei Zhang","raw_affiliation_strings":["Artificial Intelligence Center, Alibaba DAMO Academy, Hangzhou, China","The Hong Kong Polytechnic University, Hong Kong"],"affiliations":[{"raw_affiliation_string":"Artificial Intelligence Center, Alibaba DAMO Academy, Hangzhou, China","institution_ids":["https://openalex.org/I45928872"]},{"raw_affiliation_string":"The Hong Kong Polytechnic University, Hong Kong","institution_ids":["https://openalex.org/I14243506"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5028229824"],"corresponding_institution_ids":["https://openalex.org/I158809036","https://openalex.org/I4210114105","https://openalex.org/I99065089"],"apc_list":null,"apc_paid":null,"fwci":4.5133,"has_fulltext":false,"cited_by_count":82,"citation_normalized_percentile":{"value":0.95762965,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":"31","issue":"12","first_page":"5079","last_page":"5091"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12676","display_name":"Machine Learning and ELM","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pid-controller","display_name":"PID controller","score":0.8999629020690918},{"id":"https://openalex.org/keywords/overshoot","display_name":"Overshoot (microwave communication)","score":0.7746864557266235},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7240632772445679},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6728925704956055},{"id":"https://openalex.org/keywords/acceleration","display_name":"Acceleration","score":0.6446970701217651},{"id":"https://openalex.org/keywords/stochastic-gradient-descent","display_name":"Stochastic gradient descent","score":0.6241926550865173},{"id":"https://openalex.org/keywords/gradient-descent","display_name":"Gradient descent","score":0.5490744709968567},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5173661112785339},{"id":"https://openalex.org/keywords/convergence","display_name":"Convergence (economics)","score":0.500145673751831},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4545939266681671},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.42580902576446533},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.39947301149368286},{"id":"https://openalex.org/keywords/control-engineering","display_name":"Control engineering","score":0.17257347702980042},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.09571138024330139},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.06605598330497742}],"concepts":[{"id":"https://openalex.org/C47116090","wikidata":"https://www.wikidata.org/wiki/Q716829","display_name":"PID controller","level":3,"score":0.8999629020690918},{"id":"https://openalex.org/C2780323453","wikidata":"https://www.wikidata.org/wiki/Q7113957","display_name":"Overshoot (microwave communication)","level":2,"score":0.7746864557266235},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7240632772445679},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6728925704956055},{"id":"https://openalex.org/C117896860","wikidata":"https://www.wikidata.org/wiki/Q11376","display_name":"Acceleration","level":2,"score":0.6446970701217651},{"id":"https://openalex.org/C206688291","wikidata":"https://www.wikidata.org/wiki/Q7617819","display_name":"Stochastic gradient descent","level":3,"score":0.6241926550865173},{"id":"https://openalex.org/C153258448","wikidata":"https://www.wikidata.org/wiki/Q1199743","display_name":"Gradient descent","level":3,"score":0.5490744709968567},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5173661112785339},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.500145673751831},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4545939266681671},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.42580902576446533},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.39947301149368286},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.17257347702980042},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.09571138024330139},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.06605598330497742},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C74650414","wikidata":"https://www.wikidata.org/wiki/Q11397","display_name":"Classical mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C536315585","wikidata":"https://www.wikidata.org/wiki/Q7698332","display_name":"Temperature control","level":2,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C50522688","wikidata":"https://www.wikidata.org/wiki/Q189833","display_name":"Economic growth","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0}],"mesh":[{"descriptor_ui":"D000077321","descriptor_name":"Deep Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000077321","descriptor_name":"Deep Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000077321","descriptor_name":"Deep Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D009323","descriptor_name":"Natural Language Processing","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D009323","descriptor_name":"Natural Language Processing","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D009323","descriptor_name":"Natural Language Processing","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D013269","descriptor_name":"Stochastic Processes","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D013269","descriptor_name":"Stochastic Processes","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D013269","descriptor_name":"Stochastic Processes","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016208","descriptor_name":"Databases, Factual","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016208","descriptor_name":"Databases, Factual","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016208","descriptor_name":"Databases, Factual","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D057488","descriptor_name":"Visual Prosthesis","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D057488","descriptor_name":"Visual Prosthesis","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D057488","descriptor_name":"Visual Prosthesis","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false}],"locations_count":2,"locations":[{"id":"doi:10.1109/tnnls.2019.2963066","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2019.2963066","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},{"id":"pmid:32011265","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/32011265","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on neural networks and learning systems","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3967380794","display_name":null,"funder_award_id":"61531014","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4958032829","display_name":null,"funder_award_id":"61831014","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6726852810","display_name":null,"funder_award_id":"61571259","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":92,"referenced_works":["https://openalex.org/W104184427","https://openalex.org/W114517082","https://openalex.org/W639708223","https://openalex.org/W1481834144","https://openalex.org/W1492417045","https://openalex.org/W1522301498","https://openalex.org/W1552300625","https://openalex.org/W1567302070","https://openalex.org/W1690739335","https://openalex.org/W1789336918","https://openalex.org/W1978811804","https://openalex.org/W1980287119","https://openalex.org/W1988720110","https://openalex.org/W1996901117","https://openalex.org/W2022508996","https://openalex.org/W2064675550","https://openalex.org/W2067400662","https://openalex.org/W2096590200","https://openalex.org/W2097460613","https://openalex.org/W2099471712","https://openalex.org/W2104636679","https://openalex.org/W2107537851","https://openalex.org/W2112796928","https://openalex.org/W2117539524","https://openalex.org/W2119144962","https://openalex.org/W2132211083","https://openalex.org/W2140246545","https://openalex.org/W2146502635","https://openalex.org/W2165314520","https://openalex.org/W2167215970","https://openalex.org/W2171438612","https://openalex.org/W2175402905","https://openalex.org/W2183182206","https://openalex.org/W2194775991","https://openalex.org/W2212703438","https://openalex.org/W2302255633","https://openalex.org/W2319130426","https://openalex.org/W2524428287","https://openalex.org/W2528333963","https://openalex.org/W2549139847","https://openalex.org/W2551176409","https://openalex.org/W2564807118","https://openalex.org/W2798391154","https://openalex.org/W2921968712","https://openalex.org/W2928560789","https://openalex.org/W2936995161","https://openalex.org/W2947944300","https://openalex.org/W2950248853","https://openalex.org/W2950967261","https://openalex.org/W2962795635","https://openalex.org/W2962851801","https://openalex.org/W2962949994","https://openalex.org/W2962965870","https://openalex.org/W2963042606","https://openalex.org/W2963304263","https://openalex.org/W2963319203","https://openalex.org/W2963367891","https://openalex.org/W2963446712","https://openalex.org/W2964102336","https://openalex.org/W2964118293","https://openalex.org/W2964121744","https://openalex.org/W2964137095","https://openalex.org/W2964299589","https://openalex.org/W2980070341","https://openalex.org/W3118608800","https://openalex.org/W4214592884","https://openalex.org/W4285719527","https://openalex.org/W4302375066","https://openalex.org/W4320013936","https://openalex.org/W4387688680","https://openalex.org/W6604254268","https://openalex.org/W6631190155","https://openalex.org/W6637551013","https://openalex.org/W6638020065","https://openalex.org/W6649495467","https://openalex.org/W6666877243","https://openalex.org/W6677580257","https://openalex.org/W6680009829","https://openalex.org/W6681435938","https://openalex.org/W6684563725","https://openalex.org/W6685537299","https://openalex.org/W6688167117","https://openalex.org/W6698183232","https://openalex.org/W6701650085","https://openalex.org/W6713132643","https://openalex.org/W6726275242","https://openalex.org/W6727208969","https://openalex.org/W6731191353","https://openalex.org/W6761030284","https://openalex.org/W6761067243","https://openalex.org/W6763564312","https://openalex.org/W6787972765"],"related_works":["https://openalex.org/W4293868274","https://openalex.org/W4386412075","https://openalex.org/W4389515241","https://openalex.org/W2810278913","https://openalex.org/W2110981444","https://openalex.org/W2588803791","https://openalex.org/W2895097035","https://openalex.org/W4206903459","https://openalex.org/W2754816816","https://openalex.org/W4366280654"],"abstract_inverted_index":{"Deep":[0],"neural":[1],"networks":[2,26],"(DNNs)":[3],"are":[4,135],"widely":[5],"used":[6,47],"and":[7,18,55,89,112,131,170,188],"demonstrated":[8],"their":[9],"power":[10],"in":[11,62],"many":[12],"applications,":[13],"such":[14,73],"as":[15,74],"computer":[16,168],"vision":[17,169],"pattern":[19],"recognition.":[20],"However,":[21,61],"the":[22,44,63,75,82,91,105,109,124,128,143,175,193],"training":[23,83],"of":[24,43,65,93,133,177],"these":[25],"can":[27],"be":[28,35],"time":[29],"consuming.":[30],"Such":[31],"a":[32,98,118],"problem":[33,79,88,145],"could":[34],"alleviated":[36],"by":[37,147],"using":[38],"efficient":[39],"optimizers.":[40],"As":[41],"one":[42],"most":[45],"commonly":[46],"optimizers,":[48],"stochastic":[49],"gradient":[50],"descent-momentum":[51],"(SGD-M)":[52],"uses":[53],"past":[54],"present":[56],"gradients":[57,134],"for":[58],"parameter":[59],"updates.":[60],"process":[64],"network":[66,125],"training,":[67],"SGD-M":[68,113],"may":[69],"encounter":[70],"some":[71],"drawbacks,":[72],"overshoot":[76,144],"phenomenon.":[77],"This":[78],"would":[80],"slow":[81],"convergence.":[84],"To":[85],"alleviate":[86],"this":[87],"accelerate":[90],"convergence":[92],"DNN":[94,153],"optimization,":[95],"we":[96,103],"propose":[97,117],"proportional-integral-derivative":[99],"(PID)":[100],"approach.":[101],"Specifically,":[102],"investigate":[104],"intrinsic":[106],"relationships":[107],"between":[108],"PID-based":[110,119,140],"controller":[111],"first.":[114],"We":[115,190],"further":[116],"optimization":[120,141],"algorithm":[121],"to":[122,159],"update":[123],"parameters,":[126],"where":[127],"past,":[129],"current,":[130],"change":[132],"exploited.":[136],"Consequently,":[137],"our":[138,178],"proposed":[139],"alleviates":[142],"suffered":[146],"SGD-M.":[148],"When":[149],"tested":[150],"on":[151,180],"popular":[152],"architectures,":[154],"it":[155],"also":[156],"obtains":[157],"up":[158],"50%":[160],"acceleration":[161],"with":[162],"competitive":[163],"accuracy.":[164],"Extensive":[165],"experiments":[166],"about":[167],"natural":[171],"language":[172],"processing":[173],"demonstrate":[174],"effectiveness":[176],"method":[179],"benchmark":[181],"data":[182],"sets,":[183],"including":[184],"CIFAR10,":[185],"CIFAR100,":[186],"Tiny-ImageNet,":[187],"PTB.":[189],"have":[191],"released":[192],"code":[194],"at":[195],"https://github.com/tensorboy/PIDOptimizer.":[196]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":15},{"year":2024,"cited_by_count":19},{"year":2023,"cited_by_count":13},{"year":2022,"cited_by_count":17},{"year":2021,"cited_by_count":14},{"year":2020,"cited_by_count":2}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
