{"id":"https://openalex.org/W3189259198","doi":"https://doi.org/10.1109/tpds.2022.3219819","title":"Parallel Training of Pre-Trained Models via Chunk-Based Dynamic Memory Management","display_name":"Parallel Training of Pre-Trained Models via Chunk-Based Dynamic Memory Management","publication_year":2022,"publication_date":"2022-11-07","ids":{"openalex":"https://openalex.org/W3189259198","doi":"https://doi.org/10.1109/tpds.2022.3219819","mag":"3189259198"},"language":"en","primary_location":{"id":"doi:10.1109/tpds.2022.3219819","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpds.2022.3219819","pdf_url":null,"source":{"id":"https://openalex.org/S97130795","display_name":"IEEE Transactions on Parallel and Distributed Systems","issn_l":"1045-9219","issn":["1045-9219","1558-2183","2161-9883"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Parallel and Distributed Systems","raw_type":"journal-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2108.05818","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5069911612","display_name":"Jiarui Fang","orcid":"https://orcid.org/0000-0002-6724-2763"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jiarui Fang","raw_affiliation_strings":["Tencent Inc., Shenzhen, Guangdong, China"],"raw_orcid":"https://orcid.org/0000-0002-6724-2763","affiliations":[{"raw_affiliation_string":"Tencent Inc., Shenzhen, Guangdong, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108726790","display_name":"Zilin Zhu","orcid":null},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zilin Zhu","raw_affiliation_strings":["Tencent Inc., Shenzhen, Guangdong, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Tencent Inc., Shenzhen, Guangdong, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052416030","display_name":"Shenggui Li","orcid":null},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Shenggui Li","raw_affiliation_strings":["National Singapore University, Singapore"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National Singapore University, Singapore","institution_ids":["https://openalex.org/I165932596"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064445567","display_name":"Hui Su","orcid":"https://orcid.org/0000-0003-0340-1128"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hui Su","raw_affiliation_strings":["Tencent Inc., Shenzhen, Guangdong, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Tencent Inc., Shenzhen, Guangdong, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111336367","display_name":"Yang Yu","orcid":null},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yang Yu","raw_affiliation_strings":["Tencent Inc., Shenzhen, Guangdong, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Tencent Inc., Shenzhen, Guangdong, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024102664","display_name":"Jie Zhou","orcid":"https://orcid.org/0000-0002-3371-6780"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jie Zhou","raw_affiliation_strings":["Tencent Inc., Shenzhen, Guangdong, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Tencent Inc., Shenzhen, Guangdong, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100658705","display_name":"Yang You","orcid":"https://orcid.org/0000-0003-2816-4384"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Yang You","raw_affiliation_strings":["National Singapore University, Singapore"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National Singapore University, Singapore","institution_ids":["https://openalex.org/I165932596"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5069911612"],"corresponding_institution_ids":["https://openalex.org/I2250653659"],"apc_list":null,"apc_paid":null,"fwci":2.943,"has_fulltext":false,"cited_by_count":32,"citation_normalized_percentile":{"value":0.92214946,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":100},"biblio":{"volume":"34","issue":"1","first_page":"304","last_page":"315"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9957000017166138,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8971927165985107},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.5373875498771667},{"id":"https://openalex.org/keywords/redundancy","display_name":"Redundancy (engineering)","score":0.4559406340122223},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.44164949655532837},{"id":"https://openalex.org/keywords/memory-management","display_name":"Memory management","score":0.4381803274154663},{"id":"https://openalex.org/keywords/bandwidth","display_name":"Bandwidth (computing)","score":0.42393866181373596},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.4215662479400635},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.22730746865272522},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.20059484243392944},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.1349402666091919},{"id":"https://openalex.org/keywords/semiconductor-memory","display_name":"Semiconductor memory","score":0.10663145780563354},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.09466612339019775}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8971927165985107},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.5373875498771667},{"id":"https://openalex.org/C152124472","wikidata":"https://www.wikidata.org/wiki/Q1204361","display_name":"Redundancy (engineering)","level":2,"score":0.4559406340122223},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.44164949655532837},{"id":"https://openalex.org/C176649486","wikidata":"https://www.wikidata.org/wiki/Q2308807","display_name":"Memory management","level":3,"score":0.4381803274154663},{"id":"https://openalex.org/C2776257435","wikidata":"https://www.wikidata.org/wiki/Q1576430","display_name":"Bandwidth (computing)","level":2,"score":0.42393866181373596},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.4215662479400635},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.22730746865272522},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.20059484243392944},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.1349402666091919},{"id":"https://openalex.org/C98986596","wikidata":"https://www.wikidata.org/wiki/Q1143031","display_name":"Semiconductor memory","level":2,"score":0.10663145780563354},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.09466612339019775},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tpds.2022.3219819","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpds.2022.3219819","pdf_url":null,"source":{"id":"https://openalex.org/S97130795","display_name":"IEEE Transactions on Parallel and Distributed Systems","issn_l":"1045-9219","issn":["1045-9219","1558-2183","2161-9883"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Parallel and Distributed Systems","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:2108.05818","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2108.05818","pdf_url":"https://arxiv.org/pdf/2108.05818","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2108.05818","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2108.05818","pdf_url":"https://arxiv.org/pdf/2108.05818","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":70,"referenced_works":["https://openalex.org/W1522301498","https://openalex.org/W1963831729","https://openalex.org/W1976316975","https://openalex.org/W1987225815","https://openalex.org/W2131613942","https://openalex.org/W2164705534","https://openalex.org/W2168231600","https://openalex.org/W2338908902","https://openalex.org/W2489529491","https://openalex.org/W2763421725","https://openalex.org/W2896457183","https://openalex.org/W2899771611","https://openalex.org/W2900096133","https://openalex.org/W2926767350","https://openalex.org/W2955715866","https://openalex.org/W2962776038","https://openalex.org/W2963341956","https://openalex.org/W2963351145","https://openalex.org/W2963403868","https://openalex.org/W2964174152","https://openalex.org/W2969388332","https://openalex.org/W2970971581","https://openalex.org/W2971843695","https://openalex.org/W2973727699","https://openalex.org/W2979044977","https://openalex.org/W2981237538","https://openalex.org/W2990896553","https://openalex.org/W2991040477","https://openalex.org/W3006131567","https://openalex.org/W3012514909","https://openalex.org/W3030163527","https://openalex.org/W3035078899","https://openalex.org/W3086105743","https://openalex.org/W3094502228","https://openalex.org/W3101708369","https://openalex.org/W3129831491","https://openalex.org/W3130395060","https://openalex.org/W3130716829","https://openalex.org/W3156643189","https://openalex.org/W3159351344","https://openalex.org/W3164253193","https://openalex.org/W3166243953","https://openalex.org/W3167220634","https://openalex.org/W3174394143","https://openalex.org/W3204105967","https://openalex.org/W3205803342","https://openalex.org/W3209444800","https://openalex.org/W4292779060","https://openalex.org/W4293404878","https://openalex.org/W4295312788","https://openalex.org/W4385245566","https://openalex.org/W6684859321","https://openalex.org/W6703652217","https://openalex.org/W6717768942","https://openalex.org/W6739901393","https://openalex.org/W6745245109","https://openalex.org/W6755207826","https://openalex.org/W6756379755","https://openalex.org/W6756718674","https://openalex.org/W6765438313","https://openalex.org/W6766978945","https://openalex.org/W6767997687","https://openalex.org/W6774125022","https://openalex.org/W6778883912","https://openalex.org/W6784333009","https://openalex.org/W6787953186","https://openalex.org/W6790665546","https://openalex.org/W6802310216","https://openalex.org/W6843113163","https://openalex.org/W6856795522"],"related_works":["https://openalex.org/W2122678784","https://openalex.org/W1495042958","https://openalex.org/W2282510344","https://openalex.org/W2183994405","https://openalex.org/W4234013965","https://openalex.org/W2349023125","https://openalex.org/W1872497593","https://openalex.org/W2171409224","https://openalex.org/W1976807322","https://openalex.org/W2056396287"],"abstract_inverted_index":{"The":[0,123],"pre-trained":[1],"model":[2,58,67,148],"(PTM)":[3],"is":[4,17,178],"revolutionizing":[5],"Artificial":[6],"Intelligence":[7],"(AI)":[8],"technology.":[9],"However,":[10],"the":[11,37,50,57,66,77,82,111,166],"hardware":[12,38],"requirement":[13],"of":[14,28,40,154],"PTM":[15],"training":[16,169],"prohibitively":[18],"high,":[19],"making":[20],"it":[21],"a":[22,25,88,172],"game":[23],"for":[24],"small":[26],"proportion":[27],"people.":[29],"Therefore,":[30],"we":[31,64],"proposed":[32],"PatrickStar":[33,48,115,146],"system":[34,124],"to":[35,46,55,117],"lower":[36,100],"requirements":[39],"PTMs":[41],"and":[42,72,98,105,131,151,156],"make":[43],"them":[44,75],"accessible":[45],"everyone.":[47],"uses":[49],"CPU-GPU":[51,101],"heterogeneous":[52,78,96],"memory":[53,70,84,97],"space":[54],"store":[56],"data.":[59],"Different":[60],"from":[61],"existing":[62,140],"works,":[63],"organize":[65],"data":[68,102],"in":[69,76,87,95],"chunks":[71,91],"dynamically":[73],"distribute":[74],"memory.":[79],"Guided":[80],"by":[81,139],"runtime":[83],"statistics":[85],"collected":[86],"warm-up":[89],"iteration,":[90],"are":[92],"orchestrated":[93],"efficiently":[94],"generate":[99],"transmission":[103],"volume":[104],"higher":[106,159],"bandwidth":[107],"utilization.":[108],"Symbiosis":[109],"with":[110],"Zero":[112],"Redundancy":[113],"Optimizer,":[114],"scales":[116,149],"multiple":[118,121],"GPUs":[119],"on":[120,128,171],"nodes.":[122],"can":[125],"train":[126],"tasks":[127],"bigger":[129],"models":[130],"larger":[132],"batch":[133],"sizes,":[134],"which":[135],"cannot":[136],"be":[137],"accomplished":[138],"works.":[141],"Experimental":[142],"results":[143],"show":[144],"that":[145],"extends":[147],"2.27":[150],"2.5":[152],"times":[153],"DeepSpeed,":[155],"exhibits":[157],"significantly":[158],"execution":[160],"speed.":[161],"PatricStar":[162],"also":[163],"successfully":[164],"runs":[165],"175B":[167],"GPT3":[168],"task":[170],"32":[173],"GPU":[174],"cluster.":[175],"Our":[176],"code":[177],"available":[179],"at":[180],"<uri":[181],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[182],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">https://github.com/Tencent/PatrickStar</uri>":[183],".":[184]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":14},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":11}],"updated_date":"2026-05-28T09:10:13.091523","created_date":"2021-08-16T00:00:00"}
