{"id":"https://openalex.org/W4393902888","doi":"https://doi.org/10.1117/12.3023413","title":"A data parallel approach for distributed neural networks to achieve faster convergence","display_name":"A data parallel approach for distributed neural networks to achieve faster convergence","publication_year":2024,"publication_date":"2024-04-03","ids":{"openalex":"https://openalex.org/W4393902888","doi":"https://doi.org/10.1117/12.3023413"},"language":"en","primary_location":{"id":"doi:10.1117/12.3023413","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1117/12.3023413","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Sixteenth International Conference on Machine Vision (ICMV 2023)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5050233273","display_name":"C. Nagaraju","orcid":"https://orcid.org/0000-0003-1617-6011"},"institutions":[{"id":"https://openalex.org/I65181880","display_name":"Indian Institute of Technology Hyderabad","ror":"https://ror.org/01j4v3x97","country_code":"IN","type":"education","lineage":["https://openalex.org/I65181880"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"Nagaraju C","raw_affiliation_strings":["Indian Institute of Technology Hyderabad (India)"],"affiliations":[{"raw_affiliation_string":"Indian Institute of Technology Hyderabad (India)","institution_ids":["https://openalex.org/I65181880"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049663270","display_name":"Yenda Ramesh","orcid":"https://orcid.org/0000-0001-8232-8269"},"institutions":[{"id":"https://openalex.org/I65181880","display_name":"Indian Institute of Technology Hyderabad","ror":"https://ror.org/01j4v3x97","country_code":"IN","type":"education","lineage":["https://openalex.org/I65181880"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"YENDA RAMESH","raw_affiliation_strings":["Indian Institute of Technology Hyderabad (India)"],"affiliations":[{"raw_affiliation_string":"Indian Institute of Technology Hyderabad (India)","institution_ids":["https://openalex.org/I65181880"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5012566120","display_name":"C. Krishna Mohan","orcid":"https://orcid.org/0000-0002-7316-0836"},"institutions":[{"id":"https://openalex.org/I65181880","display_name":"Indian Institute of Technology Hyderabad","ror":"https://ror.org/01j4v3x97","country_code":"IN","type":"education","lineage":["https://openalex.org/I65181880"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Krishna Mohan C","raw_affiliation_strings":["Indian Institute of Technology Hyderabad (India)"],"affiliations":[{"raw_affiliation_string":"Indian Institute of Technology Hyderabad (India)","institution_ids":["https://openalex.org/I65181880"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5050233273"],"corresponding_institution_ids":["https://openalex.org/I65181880"],"apc_list":null,"apc_paid":null,"fwci":5.7519,"has_fulltext":false,"cited_by_count":23,"citation_normalized_percentile":{"value":0.97004465,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":95,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"29","last_page":"29"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9969000220298767,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8345699310302734},{"id":"https://openalex.org/keywords/data-parallelism","display_name":"Data parallelism","score":0.675195574760437},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.5631550550460815},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.5613110661506653},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.5564238429069519},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.5119379758834839},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.4988877773284912},{"id":"https://openalex.org/keywords/partition","display_name":"Partition (number theory)","score":0.4546038508415222},{"id":"https://openalex.org/keywords/convergence","display_name":"Convergence (economics)","score":0.4501030445098877},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.44083619117736816},{"id":"https://openalex.org/keywords/data-modeling","display_name":"Data modeling","score":0.4212581515312195},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.39495915174484253},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.3902779221534729},{"id":"https://openalex.org/keywords/parallelism","display_name":"Parallelism (grammar)","score":0.38754546642303467},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.3748919367790222},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.37353143095970154},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.20911157131195068}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8345699310302734},{"id":"https://openalex.org/C61483411","wikidata":"https://www.wikidata.org/wiki/Q3124522","display_name":"Data parallelism","level":3,"score":0.675195574760437},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.5631550550460815},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.5613110661506653},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.5564238429069519},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.5119379758834839},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.4988877773284912},{"id":"https://openalex.org/C42812","wikidata":"https://www.wikidata.org/wiki/Q1082910","display_name":"Partition (number theory)","level":2,"score":0.4546038508415222},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.4501030445098877},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.44083619117736816},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.4212581515312195},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.39495915174484253},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.3902779221534729},{"id":"https://openalex.org/C2781172179","wikidata":"https://www.wikidata.org/wiki/Q853109","display_name":"Parallelism (grammar)","level":2,"score":0.38754546642303467},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.3748919367790222},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.37353143095970154},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.20911157131195068},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C50522688","wikidata":"https://www.wikidata.org/wiki/Q189833","display_name":"Economic growth","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1117/12.3023413","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1117/12.3023413","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Sixteenth International Conference on Machine Vision (ICMV 2023)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":28,"referenced_works":["https://openalex.org/W2107469355","https://openalex.org/W2469490737","https://openalex.org/W2563424502","https://openalex.org/W2612690371","https://openalex.org/W2617766261","https://openalex.org/W2734775742","https://openalex.org/W2788193959","https://openalex.org/W2912500072","https://openalex.org/W2950346378","https://openalex.org/W2951781666","https://openalex.org/W2966527647","https://openalex.org/W3093502740","https://openalex.org/W4205502579","https://openalex.org/W4237040408","https://openalex.org/W6638783484","https://openalex.org/W6676133050","https://openalex.org/W6684191040","https://openalex.org/W6720242923","https://openalex.org/W6728975057","https://openalex.org/W6738460352","https://openalex.org/W6741131401","https://openalex.org/W6741986022","https://openalex.org/W6746200960","https://openalex.org/W6748425271","https://openalex.org/W6753469380","https://openalex.org/W6766249961","https://openalex.org/W6784072064","https://openalex.org/W6785294077"],"related_works":["https://openalex.org/W2950520577","https://openalex.org/W1554644772","https://openalex.org/W2003935582","https://openalex.org/W2494130044","https://openalex.org/W3170887803","https://openalex.org/W2963831937","https://openalex.org/W74409296","https://openalex.org/W3209384898","https://openalex.org/W4400951174","https://openalex.org/W1595834484"],"abstract_inverted_index":{"The":[0,291],"availability":[1],"of":[2,41,82,122,135,155,160,194,207,211,249,277],"large":[3,21],"datasets":[4,26,327],"has":[5,33,145],"significantly":[6],"contributed":[7],"to":[8,51,73,147,162,168,190,263,270,309,314],"recent":[9],"advancements":[10],"in":[11,198,299],"deep":[12,54,201,301],"Convolutional":[13],"Neural":[14],"Network":[15],"(CNN)":[16],"models.":[17],"However,":[18],"training":[19,45],"a":[20,28,205,222],"CNN":[22],"model":[23,60],"using":[24],"such":[25,328],"is":[27,115],"time-consuming":[29],"task.":[30],"This":[31,233],"issue":[32],"been":[34],"addressed":[35],"by":[36,126,267,281],"the":[37,44,66,80,97,103,118,133,153,158,173,192,199,209,212,216,256,259],"parallelization":[38],"and":[39,59,157,175,225,230,261,307,332],"distribution":[40,137,210],"data/model":[42],"during":[43],"process.":[46],"There":[47],"are":[48],"two":[49,128,186],"ways":[50],"implement":[52],"distributed":[53,200,246,300],"learning":[55,202,302],"processes:":[56],"data":[57,123,195,213,247,319],"parallelism":[58,63],"parallelism.":[61],"Data":[62],"involves":[64],"distributing":[65],"dataset":[67,136],"across":[68,138,325],"multiple":[69,326],"workers,":[70,140,176],"allowing":[71],"them":[72],"process":[74],"different":[75],"portions":[76],"simultaneously.":[77],"While":[78],"increasing":[79],"number":[81],"workers":[83,181,262],"can":[84,101],"reduce":[85,169],"computation":[86,108,120,279],"time,":[87],"it":[88],"also":[89],"introduces":[90],"additional":[91],"communication":[92,99,170,257,305],"time.":[93,109],"In":[94,110],"some":[95],"cases,":[96],"increased":[98],"time":[100,121,280],"outweigh":[102],"benefits":[104],"gained":[105],"from":[106],"reduced":[107],"this":[111],"paper,":[112],"our":[113,275],"focus":[114],"on":[116,244],"reducing":[117,278],"overall":[119],"parallel":[124,196],"approach":[125,197,234],"employing":[127,296],"strategies.":[129],"First,":[130],"we":[131,151,188,272],"emphasize":[132],"preservation":[134],"all":[139,237],"ensuring":[141],"that":[142,236,295,316],"each":[143,219],"worker":[144,238],"access":[146],"representative":[148],"data.":[149],"Second,":[150],"explore":[152],"localization":[154],"parameters":[156,254],"quantization":[159],"gradients":[161,264,269],"three":[163],"levels:":[164],"{-1,":[165],"0,":[166],"1}":[167],"delays":[171],"between":[172,180,258],"server":[174,260],"as":[177,179,329],"well":[178],"themselves.":[182],"By":[183],"adopting":[184],"these":[185,297],"strategies,":[187],"aim":[189],"enhance":[191],"performance":[193],"processes.":[203],"As":[204],"result":[206],"preserving":[208],"while":[214],"sampling":[215],"entire":[217],"data,":[218],"partition":[220],"retains":[221],"similar":[223],"mean":[224],"variance":[226],"(capturing":[227],"important":[228],"first":[229],"second-order":[231],"statistics).":[232],"guarantees":[235],"machines":[239],"train":[240],"their":[241],"local":[242],"models":[243],"uniformly":[245],"instead":[248],"random":[250,318],"distribution.":[251],"Additionally,":[252],"localizing":[253],"limits":[255],"only.":[265],"Furthermore,":[266],"quantizing":[268],"2-bits,":[271],"successfully":[273],"achieve":[274],"objective":[276],"enabling":[282],"faster":[283,310],"convergence":[284,311],"without":[285],"compromising":[286],"test":[287],"or":[288],"validation":[289],"accuracy.":[290],"experimental":[292],"results":[293],"demonstrate":[294],"strategies":[298],"effectively":[303],"reduces":[304],"overhead":[306],"leads":[308],"when":[312],"compared":[313],"methods":[315],"utilize":[317],"sampling.":[320],"These":[321],"improvements":[322],"were":[323],"observed":[324],"MNIST,":[330],"CIFAR-10,":[331],"Tiny":[333],"ImageNet.":[334]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":20}],"updated_date":"2026-03-25T13:04:00.132906","created_date":"2025-10-10T00:00:00"}
