{"id":"https://openalex.org/W3108109508","doi":"https://doi.org/10.1109/tpds.2020.3041474","title":"Model Parallelism Optimization for Distributed Inference via Decoupled CNN Structure","display_name":"Model Parallelism Optimization for Distributed Inference via Decoupled CNN Structure","publication_year":2020,"publication_date":"2020-01-01","ids":{"openalex":"https://openalex.org/W3108109508","doi":"https://doi.org/10.1109/tpds.2020.3041474","mag":"3108109508"},"language":"en","primary_location":{"id":"doi:10.1109/tpds.2020.3041474","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpds.2020.3041474","pdf_url":null,"source":{"id":"https://openalex.org/S97130795","display_name":"IEEE Transactions on Parallel and Distributed Systems","issn_l":"1045-9219","issn":["1045-9219","1558-2183","2161-9883"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Parallel and Distributed Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5024085713","display_name":"Jiangsu Du","orcid":"https://orcid.org/0000-0003-4707-9492"},"institutions":[{"id":"https://openalex.org/I4210112812","display_name":"National Supercomputing Center in Shenzhen","ror":"https://ror.org/02291hh73","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210112812"]},{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jiangsu Du","raw_affiliation_strings":["National Supercomputer Center in Guangzhou, Guangzhou, China","School of Computer Science and Engineering, Sun Yat-sen University, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"National Supercomputer Center in Guangzhou, Guangzhou, China","institution_ids":["https://openalex.org/I4210112812"]},{"raw_affiliation_string":"School of Computer Science and Engineering, Sun Yat-sen University, Guangzhou, China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5105923667","display_name":"Xin Zhu","orcid":"https://orcid.org/0000-0002-4376-0806"},"institutions":[{"id":"https://openalex.org/I4210112812","display_name":"National Supercomputing Center in Shenzhen","ror":"https://ror.org/02291hh73","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210112812"]},{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xin Zhu","raw_affiliation_strings":["National Supercomputer Center in Guangzhou, Guangzhou, China","School of Computer Science and Engineering, Sun Yat-sen University, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"National Supercomputer Center in Guangzhou, Guangzhou, China","institution_ids":["https://openalex.org/I4210112812"]},{"raw_affiliation_string":"School of Computer Science and Engineering, Sun Yat-sen University, Guangzhou, China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002840650","display_name":"Minghua Shen","orcid":"https://orcid.org/0000-0003-4747-8020"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]},{"id":"https://openalex.org/I4210112812","display_name":"National Supercomputing Center in Shenzhen","ror":"https://ror.org/02291hh73","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210112812"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Minghua Shen","raw_affiliation_strings":["National Supercomputer Center in Guangzhou, Guangzhou, China","School of Computer Science and Engineering, Sun Yat-sen University, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"National Supercomputer Center in Guangzhou, Guangzhou, China","institution_ids":["https://openalex.org/I4210112812"]},{"raw_affiliation_string":"School of Computer Science and Engineering, Sun Yat-sen University, Guangzhou, China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069366771","display_name":"Yunfei Du","orcid":"https://orcid.org/0000-0001-6832-0519"},"institutions":[{"id":"https://openalex.org/I4210112812","display_name":"National Supercomputing Center in Shenzhen","ror":"https://ror.org/02291hh73","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210112812"]},{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yunfei Du","raw_affiliation_strings":["National Supercomputer Center in Guangzhou, Guangzhou, China","School of Computer Science and Engineering, Sun Yat-sen University, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"National Supercomputer Center in Guangzhou, Guangzhou, China","institution_ids":["https://openalex.org/I4210112812"]},{"raw_affiliation_string":"School of Computer Science and Engineering, Sun Yat-sen University, Guangzhou, China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101633465","display_name":"Yutong Lu","orcid":"https://orcid.org/0000-0001-5315-3375"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]},{"id":"https://openalex.org/I4210112812","display_name":"National Supercomputing Center in Shenzhen","ror":"https://ror.org/02291hh73","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210112812"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yutong Lu","raw_affiliation_strings":["National Supercomputer Center in Guangzhou, Guangzhou, China","School of Computer Science and Engineering, Sun Yat-sen University, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"National Supercomputer Center in Guangzhou, Guangzhou, China","institution_ids":["https://openalex.org/I4210112812"]},{"raw_affiliation_string":"School of Computer Science and Engineering, Sun Yat-sen University, Guangzhou, China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023506057","display_name":"Nong Xiao","orcid":"https://orcid.org/0000-0002-2166-977X"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]},{"id":"https://openalex.org/I4210112812","display_name":"National Supercomputing Center in Shenzhen","ror":"https://ror.org/02291hh73","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210112812"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Nong Xiao","raw_affiliation_strings":["National Supercomputer Center in Guangzhou, Guangzhou, China","School of Computer Science and Engineering, Sun Yat-sen University, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"National Supercomputer Center in Guangzhou, Guangzhou, China","institution_ids":["https://openalex.org/I4210112812"]},{"raw_affiliation_string":"School of Computer Science and Engineering, Sun Yat-sen University, Guangzhou, China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5056096237","display_name":"Xiangke Liao","orcid":null},"institutions":[{"id":"https://openalex.org/I4210112812","display_name":"National Supercomputing Center in Shenzhen","ror":"https://ror.org/02291hh73","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210112812"]},{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiangke Liao","raw_affiliation_strings":["National Supercomputer Center in Guangzhou, Guangzhou, China","School of Computer Science and Engineering, Sun Yat-sen University, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"National Supercomputer Center in Guangzhou, Guangzhou, China","institution_ids":["https://openalex.org/I4210112812"]},{"raw_affiliation_string":"School of Computer Science and Engineering, Sun Yat-sen University, Guangzhou, China","institution_ids":["https://openalex.org/I157773358"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5024085713"],"corresponding_institution_ids":["https://openalex.org/I157773358","https://openalex.org/I4210112812"],"apc_list":null,"apc_paid":null,"fwci":2.0517,"has_fulltext":false,"cited_by_count":36,"citation_normalized_percentile":{"value":0.89246824,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"1"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12702","display_name":"Brain Tumor Detection and Classification","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/2808","display_name":"Neurology"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8724501729011536},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.735812783241272},{"id":"https://openalex.org/keywords/data-parallelism","display_name":"Data parallelism","score":0.6389921307563782},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.6263208389282227},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.5875139832496643},{"id":"https://openalex.org/keywords/task-parallelism","display_name":"Task parallelism","score":0.5247367024421692},{"id":"https://openalex.org/keywords/partition","display_name":"Partition (number theory)","score":0.46788209676742554},{"id":"https://openalex.org/keywords/parallelism","display_name":"Parallelism (grammar)","score":0.3602333962917328},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.23378372192382812}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8724501729011536},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.735812783241272},{"id":"https://openalex.org/C61483411","wikidata":"https://www.wikidata.org/wiki/Q3124522","display_name":"Data parallelism","level":3,"score":0.6389921307563782},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6263208389282227},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.5875139832496643},{"id":"https://openalex.org/C42992933","wikidata":"https://www.wikidata.org/wiki/Q691169","display_name":"Task parallelism","level":3,"score":0.5247367024421692},{"id":"https://openalex.org/C42812","wikidata":"https://www.wikidata.org/wiki/Q1082910","display_name":"Partition (number theory)","level":2,"score":0.46788209676742554},{"id":"https://openalex.org/C2781172179","wikidata":"https://www.wikidata.org/wiki/Q853109","display_name":"Parallelism (grammar)","level":2,"score":0.3602333962917328},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.23378372192382812},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tpds.2020.3041474","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpds.2020.3041474","pdf_url":null,"source":{"id":"https://openalex.org/S97130795","display_name":"IEEE Transactions on Parallel and Distributed Systems","issn_l":"1045-9219","issn":["1045-9219","1558-2183","2161-9883"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Parallel and Distributed Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G115388578","display_name":null,"funder_award_id":"61802446","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":48,"referenced_works":["https://openalex.org/W1598866093","https://openalex.org/W1686810756","https://openalex.org/W1977295820","https://openalex.org/W2011501918","https://openalex.org/W2108598243","https://openalex.org/W2162390675","https://openalex.org/W2194775991","https://openalex.org/W2465324213","https://openalex.org/W2612193523","https://openalex.org/W2707890836","https://openalex.org/W2745269232","https://openalex.org/W2774405331","https://openalex.org/W2794478957","https://openalex.org/W2799197246","https://openalex.org/W2802615216","https://openalex.org/W2804032941","https://openalex.org/W2883780447","https://openalex.org/W2889647155","https://openalex.org/W2911382970","https://openalex.org/W2915478146","https://openalex.org/W2922395136","https://openalex.org/W2931092525","https://openalex.org/W2962711501","https://openalex.org/W2962747323","https://openalex.org/W2962835968","https://openalex.org/W2963125010","https://openalex.org/W2963287528","https://openalex.org/W2963363373","https://openalex.org/W2963947383","https://openalex.org/W2963993763","https://openalex.org/W2964264300","https://openalex.org/W2969388332","https://openalex.org/W2970838493","https://openalex.org/W2970971581","https://openalex.org/W2971383048","https://openalex.org/W2972087877","https://openalex.org/W2991040477","https://openalex.org/W3101426332","https://openalex.org/W4295312788","https://openalex.org/W6635810480","https://openalex.org/W6637373629","https://openalex.org/W6683722107","https://openalex.org/W6739917289","https://openalex.org/W6751349269","https://openalex.org/W6754777574","https://openalex.org/W6756718674","https://openalex.org/W6759144272","https://openalex.org/W6766978945"],"related_works":["https://openalex.org/W2950520577","https://openalex.org/W1501159154","https://openalex.org/W2003935582","https://openalex.org/W74409296","https://openalex.org/W1554644772","https://openalex.org/W2494130044","https://openalex.org/W2468095077","https://openalex.org/W29548032","https://openalex.org/W2593878938","https://openalex.org/W305742777"],"abstract_inverted_index":{"It":[0,86,106,138],"is":[1,34,45,76,83,103,107,135],"promising":[2],"to":[3,21,36,65,93,112,122,142,161,181],"deploy":[4],"CNN":[5,30,43,63,97],"inference":[6,58,71,187],"on":[7,72,109,167],"local":[8],"end-user":[9,73],"devices":[10,178],"for":[11,69,99,145],"high-accuracy":[12],"and":[13,25,90,117,148,193],"time-sensitive":[14],"applications.":[15],"Model":[16],"parallelism":[17,39,68,141],"has":[18],"the":[19,41,95,114,124,152,163,175,186],"potential":[20],"provide":[22],"high":[23,130],"throughput":[24],"low":[26],"latency":[27],"in":[28,151],"distributed":[29,70,169],"inference.":[31],"However,":[32],"it":[33],"non-trivial":[35],"use":[37,157],"model":[38,44,67,100],"as":[40],"original":[42,96],"inherently":[46],"tightly-coupled":[47],"structure.":[48],"In":[49],"this":[50],"article,":[51],"we":[52],"propose":[53],"DeCNN,":[54],"a":[55,168],"more":[56],"effective":[57],"approach":[59],"that":[60],"uses":[61,139],"decoupled":[62],"structure":[64,98],"optimize":[66],"devices.":[74],"DeCNN":[75,166,183],"novel":[77],"consisting":[78],"of":[79,132,165,177,188],"three":[80],"schemes.":[81],"Scheme-1":[82],"structure-level":[84],"optimization.":[85,105,137],"exploits":[87],"group":[88,111],"convolution":[89],"channel":[91,110],"shuffle":[92],"decouple":[94],"parallelism.":[101,133],"Scheme-2":[102],"partition-level":[104],"based":[108],"partition":[113,123],"convolutional":[115],"layers,":[116,127],"then":[118],"leverages":[119],"input-based":[120],"method":[121],"fully":[125],"connected":[126],"further":[128],"exposing":[129],"degree":[131],"Scheme-3":[134],"communication-level":[136],"inter-sample":[140],"hide":[143],"communications":[144],"better":[146],"performance":[147],"robustness,":[149],"especially":[150],"weak":[153],"network":[154],"connections.":[155],"We":[156],"ImageNet":[158],"classification":[159],"task":[160],"evaluate":[162],"effectiveness":[164],"multi-ARM":[170],"platform.":[171],"Notably,":[172],"when":[173],"using":[174],"number":[176],"from":[179],"1":[180],"4,":[182],"can":[184],"accelerate":[185],"large-scale":[189],"ResNet-50":[190],"by":[191],"3.21\u00d7,":[192],"reduce":[194],"65.3":[195],"percent":[196,201],"memory":[197],"footprint,":[198],"with":[199],"1.29":[200],"accuracy":[202],"improvement.":[203]},"counts_by_year":[{"year":2025,"cited_by_count":5},{"year":2024,"cited_by_count":10},{"year":2023,"cited_by_count":11},{"year":2022,"cited_by_count":5},{"year":2021,"cited_by_count":5}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
