{"id":"https://openalex.org/W3143471131","doi":"https://doi.org/10.1109/tnnls.2021.3069883","title":"Fully Decoupled Neural Network Learning Using Delayed Gradients","display_name":"Fully Decoupled Neural Network Learning Using Delayed Gradients","publication_year":2021,"publication_date":"2021-04-09","ids":{"openalex":"https://openalex.org/W3143471131","doi":"https://doi.org/10.1109/tnnls.2021.3069883","mag":"3143471131","pmid":"https://pubmed.ncbi.nlm.nih.gov/33835926"},"language":"en","primary_location":{"id":"doi:10.1109/tnnls.2021.3069883","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2021.3069883","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://dr.ntu.edu.sg/bitstream/10356/174476/2/Fully%20Decoupled%20Neural%20Network%20Learning%20Using%20Delayed%20Gradients.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5061256037","display_name":"Huiping Zhuang","orcid":"https://orcid.org/0000-0002-4612-5445"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":true,"raw_author_name":"Huiping Zhuang","raw_affiliation_strings":["School of Electrical and Electronic Engineering, Nanyang Technological University, Singapore"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Electronic Engineering, Nanyang Technological University, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100784213","display_name":"Yi Wang","orcid":"https://orcid.org/0000-0001-8659-4724"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Yi Wang","raw_affiliation_strings":["School of Electrical and Electronic Engineering, Nanyang Technological University, Singapore"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Electronic Engineering, Nanyang Technological University, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028602831","display_name":"Qinglai Liu","orcid":"https://orcid.org/0000-0003-3869-9171"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Qinglai Liu","raw_affiliation_strings":["Temasek Laboratories, Nanyang Technological University, Singapore"],"affiliations":[{"raw_affiliation_string":"Temasek Laboratories, Nanyang Technological University, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5049506273","display_name":"Zhiping Lin","orcid":"https://orcid.org/0000-0002-1587-1226"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Zhiping Lin","raw_affiliation_strings":["School of Electrical and Electronic Engineering, Nanyang Technological University, Singapore"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Electronic Engineering, Nanyang Technological University, Singapore","institution_ids":["https://openalex.org/I172675005"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5061256037"],"corresponding_institution_ids":["https://openalex.org/I172675005"],"apc_list":null,"apc_paid":null,"fwci":1.5371,"has_fulltext":true,"cited_by_count":19,"citation_normalized_percentile":{"value":0.84647059,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":"33","issue":"10","first_page":"6013","last_page":"6020"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12676","display_name":"Machine Learning and ELM","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7564285397529602},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.7497072219848633},{"id":"https://openalex.org/keywords/backpropagation","display_name":"Backpropagation","score":0.7302159070968628},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.6740703582763672},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.6699230670928955},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.5369138121604919},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.5304580926895142},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.5099793672561646},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.47157731652259827},{"id":"https://openalex.org/keywords/train","display_name":"Train","score":0.45218557119369507},{"id":"https://openalex.org/keywords/mathematical-proof","display_name":"Mathematical proof","score":0.4194391667842865},{"id":"https://openalex.org/keywords/stack","display_name":"Stack (abstract data type)","score":0.4136337339878082},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.40385910868644714},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.12289276719093323}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7564285397529602},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.7497072219848633},{"id":"https://openalex.org/C155032097","wikidata":"https://www.wikidata.org/wiki/Q798503","display_name":"Backpropagation","level":3,"score":0.7302159070968628},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.6740703582763672},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.6699230670928955},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.5369138121604919},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.5304580926895142},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5099793672561646},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.47157731652259827},{"id":"https://openalex.org/C190839683","wikidata":"https://www.wikidata.org/wiki/Q2448197","display_name":"Train","level":2,"score":0.45218557119369507},{"id":"https://openalex.org/C108710211","wikidata":"https://www.wikidata.org/wiki/Q11538","display_name":"Mathematical proof","level":2,"score":0.4194391667842865},{"id":"https://openalex.org/C9395851","wikidata":"https://www.wikidata.org/wiki/Q177929","display_name":"Stack (abstract data type)","level":2,"score":0.4136337339878082},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.40385910868644714},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.12289276719093323},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C58640448","wikidata":"https://www.wikidata.org/wiki/Q42515","display_name":"Cartography","level":1,"score":0.0}],"mesh":[{"descriptor_ui":"D000069550","descriptor_name":"Machine Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000069550","descriptor_name":"Machine Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000069550","descriptor_name":"Machine Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D019788","descriptor_name":"Fluorodeoxyglucose F18","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D019788","descriptor_name":"Fluorodeoxyglucose F18","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D019788","descriptor_name":"Fluorodeoxyglucose F18","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true}],"locations_count":3,"locations":[{"id":"doi:10.1109/tnnls.2021.3069883","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2021.3069883","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},{"id":"pmid:33835926","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/33835926","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on neural networks and learning systems","raw_type":null},{"id":"pmh:oai:dr.ntu.edu.sg:10356/174476","is_oa":true,"landing_page_url":"https://hdl.handle.net/10356/174476","pdf_url":"https://dr.ntu.edu.sg/bitstream/10356/174476/2/Fully%20Decoupled%20Neural%20Network%20Learning%20Using%20Delayed%20Gradients.pdf","source":{"id":"https://openalex.org/S4306402609","display_name":"DR-NTU (Nanyang Technological University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I172675005","host_organization_name":"Nanyang Technological University","host_organization_lineage":["https://openalex.org/I172675005"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Journal Article"}],"best_oa_location":{"id":"pmh:oai:dr.ntu.edu.sg:10356/174476","is_oa":true,"landing_page_url":"https://hdl.handle.net/10356/174476","pdf_url":"https://dr.ntu.edu.sg/bitstream/10356/174476/2/Fully%20Decoupled%20Neural%20Network%20Learning%20Using%20Delayed%20Gradients.pdf","source":{"id":"https://openalex.org/S4306402609","display_name":"DR-NTU (Nanyang Technological University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I172675005","host_organization_name":"Nanyang Technological University","host_organization_lineage":["https://openalex.org/I172675005"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Journal Article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4140448528","display_name":null,"funder_award_id":"1922500054","funder_id":"https://openalex.org/F4320334971","funder_display_name":"Science and Engineering Research Council"}],"funders":[{"id":"https://openalex.org/F4320334971","display_name":"Science and Engineering Research Council","ror":"https://ror.org/00zgdb249"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3143471131.pdf","grobid_xml":"https://content.openalex.org/works/W3143471131.grobid-xml"},"referenced_works_count":31,"referenced_works":["https://openalex.org/W1573503290","https://openalex.org/W1677182931","https://openalex.org/W2064675550","https://openalex.org/W2112796928","https://openalex.org/W2117539524","https://openalex.org/W2194775991","https://openalex.org/W2507556850","https://openalex.org/W2552737632","https://openalex.org/W2766752287","https://openalex.org/W2911586496","https://openalex.org/W2920582597","https://openalex.org/W2949933418","https://openalex.org/W2963433607","https://openalex.org/W2964137095","https://openalex.org/W2964319207","https://openalex.org/W2998045710","https://openalex.org/W3118608800","https://openalex.org/W4297781872","https://openalex.org/W4301239768","https://openalex.org/W6634288218","https://openalex.org/W6681151457","https://openalex.org/W6692956712","https://openalex.org/W6726238325","https://openalex.org/W6739554518","https://openalex.org/W6748424917","https://openalex.org/W6748645090","https://openalex.org/W6750269818","https://openalex.org/W6753115359","https://openalex.org/W6756718674","https://openalex.org/W6759063983","https://openalex.org/W6787972765"],"related_works":["https://openalex.org/W618248309","https://openalex.org/W2377336366","https://openalex.org/W4394650907","https://openalex.org/W154364797","https://openalex.org/W4254119641","https://openalex.org/W3196207352","https://openalex.org/W2951724202","https://openalex.org/W1568097102","https://openalex.org/W3084261076","https://openalex.org/W4390419160"],"abstract_inverted_index":{"Training":[0],"neural":[1,64,120],"networks":[2,121],"with":[3,142],"backpropagation":[4],"(BP)":[5],"requires":[6],"a":[7,33,46,63,83,171],"sequential":[8],"passing":[9],"of":[10,35,138,148],"activations":[11],"and":[12,25,69,73,150],"gradients.":[13,97],"This":[14],"has":[15],"been":[16],"recognized":[17],"as":[18],"the":[19,22,39,89,95,103,143,156],"lockings":[20],"(i.e.,":[21],"forward,":[23],"backward,":[24],"update":[26],"lockings)":[27],"among":[28],"modules":[29,68],"(each":[30],"module":[31],"contains":[32],"stack":[34],"layers)":[36],"inherited":[37],"from":[38],"BP.":[40],"In":[41],"this":[42],"brief,":[43],"we":[44],"propose":[45],"fully":[47],"decoupled":[48,172],"training":[49,117],"scheme":[50],"using":[51,75],"delayed":[52,96],"gradients":[53],"(FDG)":[54],"to":[55,87,107,122,160],"break":[56],"all":[57],"these":[58],"lockings.":[59],"The":[60],"FDG":[61,104,157],"splits":[62],"network":[65],"into":[66],"multiple":[67],"trains":[70],"them":[71],"independently":[72],"asynchronously":[74],"different":[76],"workers":[77],"(e.g.,":[78,168],"GPUs).":[79],"We":[80,152],"also":[81,153],"introduce":[82],"gradient":[84,91],"shrinking":[85],"process":[86],"reduce":[88],"stale":[90],"effect":[92],"caused":[93],"by":[94,116],"Our":[98],"theoretical":[99],"proofs":[100],"show":[101,133,154],"that":[102,155],"can":[105],"converge":[106],"critical":[108],"points":[109],"under":[110],"certain":[111],"conditions.":[112],"Experiments":[113],"are":[114],"conducted":[115],"deep":[118,166],"convolutional":[119],"perform":[123],"classification":[124],"tasks":[125],"on":[126],"several":[127],"benchmark":[128],"data":[129],"sets.":[130],"These":[131],"experiments":[132],"comparable":[134],"or":[135],"better":[136],"results":[137],"our":[139],"approach":[140],"compared":[141],"state-of-the-art":[144],"methods":[145],"in":[146,170],"terms":[147],"generalization":[149],"acceleration.":[151],"is":[158],"able":[159],"train":[161],"various":[162],"networks,":[163],"including":[164],"extremely":[165],"ones":[167],"ResNet-1202),":[169],"fashion.":[173]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":6},{"year":2022,"cited_by_count":5},{"year":2021,"cited_by_count":2},{"year":2019,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
