{"id":"https://openalex.org/W2946408574","doi":"https://doi.org/10.1109/access.2019.2916550","title":"Iteration Time Prediction for CNN in Multi-GPU Platform: Modeling and Analysis","display_name":"Iteration Time Prediction for CNN in Multi-GPU Platform: Modeling and Analysis","publication_year":2019,"publication_date":"2019-01-01","ids":{"openalex":"https://openalex.org/W2946408574","doi":"https://doi.org/10.1109/access.2019.2916550","mag":"2946408574"},"language":"en","primary_location":{"id":"doi:10.1109/access.2019.2916550","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2019.2916550","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/8600701/08713989.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://ieeexplore.ieee.org/ielx7/6287639/8600701/08713989.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5020297948","display_name":"Ziqian Pei","orcid":"https://orcid.org/0000-0003-0443-9582"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Ziqian Pei","raw_affiliation_strings":["CAS Key Laboratory of Wireless-Optical Communications, University of Science and Technology of China, Hefei, China"],"raw_orcid":"https://orcid.org/0000-0003-0443-9582","affiliations":[{"raw_affiliation_string":"CAS Key Laboratory of Wireless-Optical Communications, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088579899","display_name":"Chensheng Li","orcid":"https://orcid.org/0000-0002-8902-6594"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chensheng Li","raw_affiliation_strings":["CAS Key Laboratory of Wireless-Optical Communications, University of Science and Technology of China, Hefei, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"CAS Key Laboratory of Wireless-Optical Communications, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089544297","display_name":"Xiaowei Qin","orcid":"https://orcid.org/0000-0001-7296-3461"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaowei Qin","raw_affiliation_strings":["CAS Key Laboratory of Wireless-Optical Communications, University of Science and Technology of China, Hefei, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"CAS Key Laboratory of Wireless-Optical Communications, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100375178","display_name":"Xiaohui Chen","orcid":"https://orcid.org/0000-0003-3239-2558"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaohui Chen","raw_affiliation_strings":["CAS Key Laboratory of Wireless-Optical Communications, University of Science and Technology of China, Hefei, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"CAS Key Laboratory of Wireless-Optical Communications, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101398113","display_name":"Guo Wei","orcid":"https://orcid.org/0000-0001-9888-2408"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guo Wei","raw_affiliation_strings":["CAS Key Laboratory of Wireless-Optical Communications, University of Science and Technology of China, Hefei, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"CAS Key Laboratory of Wireless-Optical Communications, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5020297948"],"corresponding_institution_ids":["https://openalex.org/I126520041"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":2.1432,"has_fulltext":true,"cited_by_count":40,"citation_normalized_percentile":{"value":0.90188293,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"7","issue":null,"first_page":"64788","last_page":"64797"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9945999979972839,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9940999746322632,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8966621160507202},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.687245786190033},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.546583354473114},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.5118700861930847},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4803958237171173},{"id":"https://openalex.org/keywords/cuda","display_name":"CUDA","score":0.4795638918876648},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.47330036759376526},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.45487532019615173},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.42750269174575806},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.42515626549720764},{"id":"https://openalex.org/keywords/computer-engineering","display_name":"Computer engineering","score":0.3203049302101135},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.22228622436523438}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8966621160507202},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.687245786190033},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.546583354473114},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.5118700861930847},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4803958237171173},{"id":"https://openalex.org/C2778119891","wikidata":"https://www.wikidata.org/wiki/Q477690","display_name":"CUDA","level":2,"score":0.4795638918876648},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.47330036759376526},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.45487532019615173},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.42750269174575806},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.42515626549720764},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.3203049302101135},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.22228622436523438},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2019.2916550","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2019.2916550","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/8600701/08713989.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:47741b82a5a246eaa6b67b07fff9c3a1","is_oa":true,"landing_page_url":"https://doaj.org/article/47741b82a5a246eaa6b67b07fff9c3a1","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 7, Pp 64788-64797 (2019)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2019.2916550","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2019.2916550","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/8600701/08713989.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G6833731009","display_name":null,"funder_award_id":"2018ZX03001001","funder_id":"https://openalex.org/F4320323970","funder_display_name":"Ministry of Industry and Information Technology of the People's Republic of China"}],"funders":[{"id":"https://openalex.org/F4320323970","display_name":"Ministry of Industry and Information Technology of the People's Republic of China","ror":"https://ror.org/0385nmy68"},{"id":"https://openalex.org/F4320329860","display_name":"National Science and Technology Major Project","ror":null},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2946408574.pdf","grobid_xml":"https://content.openalex.org/works/W2946408574.grobid-xml"},"referenced_works_count":34,"referenced_works":["https://openalex.org/W1598866093","https://openalex.org/W1686810756","https://openalex.org/W1836465849","https://openalex.org/W2018162709","https://openalex.org/W2060393849","https://openalex.org/W2097117768","https://openalex.org/W2112796928","https://openalex.org/W2155893237","https://openalex.org/W2163605009","https://openalex.org/W2186615578","https://openalex.org/W2194775991","https://openalex.org/W2442974303","https://openalex.org/W2585029434","https://openalex.org/W2592417500","https://openalex.org/W2619500264","https://openalex.org/W2752512710","https://openalex.org/W2766975872","https://openalex.org/W2788193959","https://openalex.org/W2949634898","https://openalex.org/W2953384591","https://openalex.org/W2962747323","https://openalex.org/W2963340555","https://openalex.org/W2963674387","https://openalex.org/W2963918968","https://openalex.org/W2964324519","https://openalex.org/W4250981202","https://openalex.org/W4297699616","https://openalex.org/W4302296459","https://openalex.org/W6665801690","https://openalex.org/W6684191040","https://openalex.org/W6713134421","https://openalex.org/W6743955621","https://openalex.org/W6744307745","https://openalex.org/W6764199483"],"related_works":["https://openalex.org/W3062287","https://openalex.org/W2380390332","https://openalex.org/W2742145873","https://openalex.org/W4245975140","https://openalex.org/W4312417841","https://openalex.org/W3193565141","https://openalex.org/W3133861977","https://openalex.org/W3167935049","https://openalex.org/W3029198973","https://openalex.org/W4390846322"],"abstract_inverted_index":{"Neural":[0],"networks,":[1],"as":[2],"powerful":[3],"models":[4,46],"for":[5,59,92,223],"many":[6],"difficult":[7],"learning":[8],"tasks,":[9],"have":[10,47],"created":[11],"an":[12,220],"increasingly":[13],"heavy":[14],"computational":[15],"burden.":[16],"More":[17],"and":[18,29,54,76,108,118,141,157,167,189,209],"more":[19],"researchers":[20],"focus":[21],"on":[22,97,101,182],"how":[23],"to":[24,35,87,138,148],"optimize":[25],"the":[26,32,44,89,102,116,164,199,211],"training":[27,90,125,172],"time,":[28],"one":[30],"of":[31,70,104,171,185],"difficulties":[33],"is":[34,56,66,73,180,205],"establish":[36],"a":[37,74,85],"general":[38],"iteration":[39],"time":[40,91,173],"prediction":[41,62,121,165],"model.":[42],"However,":[43],"existing":[45],"high":[48],"complexity":[49],"or":[50,126],"tedious":[51],"build":[52],"processes,":[53],"there":[55,65],"still":[57],"space":[58],"improvement":[60],"in":[61],"accuracy.":[63],"Moreover,":[64],"little":[67],"systematic":[68],"analysis":[69,103,169],"multi-GPU":[71,98],"which":[72,216],"special":[75,110],"widely":[77],"used":[78],"scenario.":[79],"In":[80],"this":[81],"paper,":[82],"we":[83,144,162],"introduce":[84],"framework":[86,114],"analyze":[88],"convolutional":[93],"neural":[94],"networks":[95],"(CNNs)":[96],"platforms.":[99],"Based":[100],"GPU":[105,153,187],"calculation":[106],"principles":[107],"its":[109],"transmission":[111],"mode,":[112],"our":[113,218],"decomposes":[115],"model":[117,166,179,219],"obtain":[119],"accurate":[120],"results":[122,170,196,213],"without":[123],"long-term":[124],"complex":[127],"data":[128],"collection.":[129],"We":[130],"start":[131],"by":[132,214],"extracting":[133],"key":[134],"feature":[135],"parameters":[136],"related":[137],"GPUs,":[139],"CNNs,":[140],"networks.":[142],"Then,":[143],"map":[145],"CNN":[146,192],"architectures":[147],"constraints,":[149],"including":[150],"software":[151],"platforms,":[152,154],"parallel":[155],"strategies,":[156],"communication":[158],"strategies.":[159],"At":[160],"last,":[161],"provide":[163],"give":[168],"from":[174],"multiple":[175],"perspectives.":[176],"The":[177,194],"proposed":[178],"verified":[181],"four":[183],"types":[184],"NVIDIA":[186],"platforms":[188],"six":[190],"different":[191],"architectures.":[193],"experiment":[195],"show":[197],"that":[198],"average":[200],"error":[201],"across":[202],"varies":[203],"scenarios":[204],"less":[206],"than":[207],"15%":[208],"outperform":[210],"state-of-the-art":[212],"5%-30%,":[215],"corroborate":[217],"effective":[221],"tool":[222],"artificial":[224],"intelligence":[225],"(AI)":[226],"researchers.":[227]},"counts_by_year":[{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":7},{"year":2023,"cited_by_count":8},{"year":2022,"cited_by_count":7},{"year":2021,"cited_by_count":7},{"year":2020,"cited_by_count":6},{"year":2019,"cited_by_count":1}],"updated_date":"2026-05-06T08:25:59.206177","created_date":"2025-10-10T00:00:00"}
