{"id":"https://openalex.org/W4377231507","doi":"https://doi.org/10.1109/tc.2023.3278530","title":"Waterwave: A GPU Memory Flow Engine for Concurrent DNN Training","display_name":"Waterwave: A GPU Memory Flow Engine for Concurrent DNN Training","publication_year":2023,"publication_date":"2023-05-22","ids":{"openalex":"https://openalex.org/W4377231507","doi":"https://doi.org/10.1109/tc.2023.3278530"},"language":"en","primary_location":{"id":"doi:10.1109/tc.2023.3278530","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/tc.2023.3278530","pdf_url":null,"source":{"id":"https://openalex.org/S157670870","display_name":"IEEE Transactions on Computers","issn_l":"0018-9340","issn":["0018-9340","1557-9956","2326-3814"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Computers","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5016486553","display_name":"Xuanhua Shi","orcid":"https://orcid.org/0000-0001-8451-8656"},"institutions":[{"id":"https://openalex.org/I47720641","display_name":"Huazhong University of Science and Technology","ror":"https://ror.org/00p991c53","country_code":"CN","type":"education","lineage":["https://openalex.org/I47720641"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xuanhua Shi","raw_affiliation_strings":["National Engineering Research Center for Big Data Technology and System, Services Computing Technology and System Lab, Huazhong University of Science and Technology, Wuhan, China"],"affiliations":[{"raw_affiliation_string":"National Engineering Research Center for Big Data Technology and System, Services Computing Technology and System Lab, Huazhong University of Science and Technology, Wuhan, China","institution_ids":["https://openalex.org/I47720641"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101793348","display_name":"Xuan Peng","orcid":"https://orcid.org/0009-0000-6885-1168"},"institutions":[{"id":"https://openalex.org/I47720641","display_name":"Huazhong University of Science and Technology","ror":"https://ror.org/00p991c53","country_code":"CN","type":"education","lineage":["https://openalex.org/I47720641"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xuan Peng","raw_affiliation_strings":["National Engineering Research Center for Big Data Technology and System, Services Computing Technology and System Lab, Huazhong University of Science and Technology, Wuhan, China"],"affiliations":[{"raw_affiliation_string":"National Engineering Research Center for Big Data Technology and System, Services Computing Technology and System Lab, Huazhong University of Science and Technology, Wuhan, China","institution_ids":["https://openalex.org/I47720641"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064596191","display_name":"Ligang He","orcid":"https://orcid.org/0000-0002-5671-0576"},"institutions":[{"id":"https://openalex.org/I39555362","display_name":"University of Warwick","ror":"https://ror.org/01a77tt86","country_code":"GB","type":"education","lineage":["https://openalex.org/I39555362"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Ligang He","raw_affiliation_strings":["University of Warwick, Coventry, U.K"],"affiliations":[{"raw_affiliation_string":"University of Warwick, Coventry, U.K","institution_ids":["https://openalex.org/I39555362"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101584327","display_name":"Yunfei Zhao","orcid":"https://orcid.org/0009-0002-7929-8825"},"institutions":[{"id":"https://openalex.org/I47720641","display_name":"Huazhong University of Science and Technology","ror":"https://ror.org/00p991c53","country_code":"CN","type":"education","lineage":["https://openalex.org/I47720641"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yunfei Zhao","raw_affiliation_strings":["National Engineering Research Center for Big Data Technology and System, Services Computing Technology and System Lab, Huazhong University of Science and Technology, Wuhan, China"],"affiliations":[{"raw_affiliation_string":"National Engineering Research Center for Big Data Technology and System, Services Computing Technology and System Lab, Huazhong University of Science and Technology, Wuhan, China","institution_ids":["https://openalex.org/I47720641"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5022262922","display_name":"Hai Jin","orcid":"https://orcid.org/0000-0002-3934-7605"},"institutions":[{"id":"https://openalex.org/I47720641","display_name":"Huazhong University of Science and Technology","ror":"https://ror.org/00p991c53","country_code":"CN","type":"education","lineage":["https://openalex.org/I47720641"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hai Jin","raw_affiliation_strings":["National Engineering Research Center for Big Data Technology and System, Services Computing Technology and System Lab, Huazhong University of Science and Technology, Wuhan, China"],"affiliations":[{"raw_affiliation_string":"National Engineering Research Center for Big Data Technology and System, Services Computing Technology and System Lab, Huazhong University of Science and Technology, Wuhan, China","institution_ids":["https://openalex.org/I47720641"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5016486553"],"corresponding_institution_ids":["https://openalex.org/I47720641"],"apc_list":null,"apc_paid":null,"fwci":0.369,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.58107445,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":95},"biblio":{"volume":"72","issue":"10","first_page":"2938","last_page":"2950"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7219539880752563},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5239080190658569},{"id":"https://openalex.org/keywords/allocator","display_name":"Allocator","score":0.5016365051269531},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.3703381419181824}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7219539880752563},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5239080190658569},{"id":"https://openalex.org/C162262903","wikidata":"https://www.wikidata.org/wiki/Q343527","display_name":"Allocator","level":2,"score":0.5016365051269531},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.3703381419181824}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tc.2023.3278530","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/tc.2023.3278530","pdf_url":null,"source":{"id":"https://openalex.org/S157670870","display_name":"IEEE Transactions on Computers","issn_l":"0018-9340","issn":["0018-9340","1557-9956","2326-3814"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Computers","raw_type":"journal-article"},{"id":"pmh:oai:wrap.warwick.ac.uk:176103","is_oa":false,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4306400665","display_name":"Warwick Research Archive Portal (University of Warwick)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I39555362","host_organization_name":"University of Warwick","host_organization_lineage":["https://openalex.org/I39555362"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":"","raw_type":"Journal Article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":59,"referenced_works":["https://openalex.org/W1522301498","https://openalex.org/W2097998348","https://openalex.org/W2113207845","https://openalex.org/W2133796939","https://openalex.org/W2183341477","https://openalex.org/W2194775991","https://openalex.org/W2489529491","https://openalex.org/W2525778437","https://openalex.org/W2553303224","https://openalex.org/W2556522401","https://openalex.org/W2606722458","https://openalex.org/W2772678505","https://openalex.org/W2788853733","https://openalex.org/W2883283076","https://openalex.org/W2893114493","https://openalex.org/W2896457183","https://openalex.org/W2899071864","https://openalex.org/W2899771611","https://openalex.org/W2953384591","https://openalex.org/W2962821792","https://openalex.org/W2964081807","https://openalex.org/W2964243274","https://openalex.org/W2969388332","https://openalex.org/W2973727699","https://openalex.org/W2991040477","https://openalex.org/W3012479151","https://openalex.org/W3012514909","https://openalex.org/W3096956001","https://openalex.org/W3138303811","https://openalex.org/W3138327474","https://openalex.org/W3175161462","https://openalex.org/W3182301081","https://openalex.org/W4200282803","https://openalex.org/W4247353671","https://openalex.org/W4288289123","https://openalex.org/W4289244325","https://openalex.org/W4292779060","https://openalex.org/W6631190155","https://openalex.org/W6674385629","https://openalex.org/W6677088747","https://openalex.org/W6713134421","https://openalex.org/W6727690538","https://openalex.org/W6729956949","https://openalex.org/W6730169791","https://openalex.org/W6741414320","https://openalex.org/W6748587240","https://openalex.org/W6755207826","https://openalex.org/W6756009870","https://openalex.org/W6756040250","https://openalex.org/W6756285791","https://openalex.org/W6756718674","https://openalex.org/W6767997687","https://openalex.org/W6769424276","https://openalex.org/W6778883912","https://openalex.org/W6780671031","https://openalex.org/W6784871562","https://openalex.org/W6791891499","https://openalex.org/W6797242466","https://openalex.org/W6799023841"],"related_works":["https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W4252124899","https://openalex.org/W4250204977","https://openalex.org/W2043640140","https://openalex.org/W2122690624","https://openalex.org/W4361194010","https://openalex.org/W4312676584","https://openalex.org/W4376862083","https://openalex.org/W2016931788"],"abstract_inverted_index":{"Training":[0],"Deep":[1],"Neural":[2],"Networks":[3],"(DNN)":[4],"concurrently":[5],"is":[6,31,110],"becoming":[7],"increasingly":[8],"important":[9],"for":[10,66,94],"deep":[11,68],"learning":[12,69],"practitioners,":[13],"e.g.,":[14],"<italic":[15,21,58,106,116,140,152,161,173,196],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[16,22,59,107,117,141,153,162,174,197],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">hyperparameter":[17],"optimization":[18],"(HPO)</i>":[19],"and":[20,86,156,204,211],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">neural":[23],"architecture":[24],"search":[25],"(NAS)</i>.":[26],"The":[27],"GPU":[28,44,62,137],"memory":[29,49,63,75,84,125,170,194],"capacity":[30],"the":[32,42,47,74,79,98,102,114,144,182],"impediment":[33],"that":[34],"prohibits":[35],"multiple":[36],"DNNs":[37],"from":[38],"being":[39],"trained":[40],"on":[41,113],"same":[43],"due":[45],"to":[46,72,122,132,147,166,179,209],"large":[48],"usage":[50],"during":[51],"training.":[52,70,188],"In":[53],"this":[54],"paper,":[55],"we":[56,89],"propose":[57],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">Waterwave</i>,":[60],"a":[61,105,148,168],"flow":[64],"engine":[65],"concurrent":[67],"First,":[71],"address":[73],"explosion":[76],"brought":[77],"by":[78,207],"long":[80],"time":[81],"lag":[82],"between":[83],"allocation":[85],"deallocation":[87],"time,":[88],"develop":[90],"an":[91],"allocator":[92,99],"tailored":[93],"multi-streams.":[95],"By":[96],"making":[97],"aware":[100],"of":[101,150,181,186],"stream":[103],"information,":[104],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">prioritized":[108],"allocation</i>":[109],"conducted":[111],"based":[112],"chunk's":[115],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">synchronization</i>":[118],"attributes,":[119],"allowing":[120],"us":[121],"provide":[123],"useable":[124],"after":[126,136],"scheduling":[127],"rather":[128],"than":[129],"waiting":[130],"it":[131],"be":[133],"really":[134],"released":[135],"computation.":[138],"Second,":[139],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">Waterwave</i>":[142,175,198],"partitions":[143],"compute":[145],"graph":[146],"set":[149],"continuous":[151],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">node":[154],"groups</i>":[155],"then":[157],"performs":[158],"finer-grained":[159],"scheduling:":[160],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">NodeGroup":[163],"pipeline":[164],"execution</i>,":[165],"guarantee":[167],"proper":[169],"requests":[171],"order.":[172],"can":[176,199],"accomplish":[177],"up":[178,208],"96.8%":[180],"maximum":[183],"batch":[184],"size":[185],"solo":[187],"Additionally,":[189],"in":[190],"scenarios":[191],"with":[192],"high":[193],"demand,":[195],"outperform":[200],"existing":[201],"spatial":[202],"sharing":[203,206],"temporal":[205],"12x":[210],"1.49x,":[212],"respectively.":[213]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1}],"updated_date":"2025-12-21T23:12:01.093139","created_date":"2025-10-10T00:00:00"}
