{"id":"https://openalex.org/W4381328689","doi":"https://doi.org/10.1145/3589311","title":"DUCATI: A Dual-Cache Training System for Graph Neural Networks on Giant Graphs with the GPU","display_name":"DUCATI: A Dual-Cache Training System for Graph Neural Networks on Giant Graphs with the GPU","publication_year":2023,"publication_date":"2023-06-13","ids":{"openalex":"https://openalex.org/W4381328689","doi":"https://doi.org/10.1145/3589311"},"language":"en","primary_location":{"id":"doi:10.1145/3589311","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3589311","pdf_url":null,"source":{"id":"https://openalex.org/S4387289859","display_name":"Proceedings of the ACM on Management of Data","issn_l":"2836-6573","issn":["2836-6573"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM on Management of Data","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100327368","display_name":"Xin Zhang","orcid":"https://orcid.org/0000-0001-8560-5006"},"institutions":[{"id":"https://openalex.org/I200769079","display_name":"Hong Kong University of Science and Technology","ror":"https://ror.org/00q4vv597","country_code":"HK","type":"education","lineage":["https://openalex.org/I200769079"]}],"countries":["HK"],"is_corresponding":true,"raw_author_name":"Xin Zhang","raw_affiliation_strings":["The Hong Kong University of Science and Technology, Hong Kong SAR, China"],"affiliations":[{"raw_affiliation_string":"The Hong Kong University of Science and Technology, Hong Kong SAR, China","institution_ids":["https://openalex.org/I200769079"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053338416","display_name":"Yanyan Shen","orcid":"https://orcid.org/0000-0001-8364-3674"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yanyan Shen","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014615052","display_name":"Yingxia Shao","orcid":"https://orcid.org/0000-0002-8559-2628"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yingxia Shao","raw_affiliation_strings":["Beijing University of Posts and Telecommunications, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Beijing University of Posts and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100333516","display_name":"Lei Chen","orcid":"https://orcid.org/0000-0002-8257-5806"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lei Chen","raw_affiliation_strings":["The Hong Kong University of Science and Technology (Guangzhou), Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"The Hong Kong University of Science and Technology (Guangzhou), Guangzhou, China","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5100327368"],"corresponding_institution_ids":["https://openalex.org/I200769079"],"apc_list":null,"apc_paid":null,"fwci":4.6104,"has_fulltext":false,"cited_by_count":38,"citation_normalized_percentile":{"value":0.9607961,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":"1","issue":"2","first_page":"1","last_page":"24"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12292","display_name":"Graph Theory and Algorithms","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12292","display_name":"Graph Theory and Algorithms","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9889000058174133,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8769869804382324},{"id":"https://openalex.org/keywords/cache","display_name":"Cache","score":0.7858253717422485},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.7285804748535156},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.6022052764892578},{"id":"https://openalex.org/keywords/cache-oblivious-algorithm","display_name":"Cache-oblivious algorithm","score":0.5626158714294434},{"id":"https://openalex.org/keywords/cache-algorithms","display_name":"Cache algorithms","score":0.523574709892273},{"id":"https://openalex.org/keywords/cache-coloring","display_name":"Cache coloring","score":0.46636733412742615},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.46597573161125183},{"id":"https://openalex.org/keywords/workload","display_name":"Workload","score":0.4657469689846039},{"id":"https://openalex.org/keywords/locality","display_name":"Locality","score":0.45585593581199646},{"id":"https://openalex.org/keywords/cache-pollution","display_name":"Cache pollution","score":0.4389810562133789},{"id":"https://openalex.org/keywords/cpu-cache","display_name":"CPU cache","score":0.29108381271362305},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.2122897505760193}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8769869804382324},{"id":"https://openalex.org/C115537543","wikidata":"https://www.wikidata.org/wiki/Q165596","display_name":"Cache","level":2,"score":0.7858253717422485},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.7285804748535156},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6022052764892578},{"id":"https://openalex.org/C59687516","wikidata":"https://www.wikidata.org/wiki/Q5015938","display_name":"Cache-oblivious algorithm","level":5,"score":0.5626158714294434},{"id":"https://openalex.org/C38556500","wikidata":"https://www.wikidata.org/wiki/Q13404475","display_name":"Cache algorithms","level":4,"score":0.523574709892273},{"id":"https://openalex.org/C201148951","wikidata":"https://www.wikidata.org/wiki/Q5015976","display_name":"Cache coloring","level":4,"score":0.46636733412742615},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.46597573161125183},{"id":"https://openalex.org/C2778476105","wikidata":"https://www.wikidata.org/wiki/Q628539","display_name":"Workload","level":2,"score":0.4657469689846039},{"id":"https://openalex.org/C2779808786","wikidata":"https://www.wikidata.org/wiki/Q6664603","display_name":"Locality","level":2,"score":0.45585593581199646},{"id":"https://openalex.org/C113166858","wikidata":"https://www.wikidata.org/wiki/Q5015981","display_name":"Cache pollution","level":5,"score":0.4389810562133789},{"id":"https://openalex.org/C189783530","wikidata":"https://www.wikidata.org/wiki/Q352090","display_name":"CPU cache","level":3,"score":0.29108381271362305},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.2122897505760193},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3589311","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3589311","pdf_url":null,"source":{"id":"https://openalex.org/S4387289859","display_name":"Proceedings of the ACM on Management of Data","issn_l":"2836-6573","issn":["2836-6573"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM on Management of Data","raw_type":"journal-article"},{"id":"pmh:oai:repository.hkust.edu.hk:1783.1-148622","is_oa":false,"landing_page_url":"http://repository.hkust.edu.hk/ir/Record/1783.1-148622","pdf_url":null,"source":{"id":"https://openalex.org/S4306401796","display_name":"Rare & Special e-Zone (The Hong Kong University of Science and Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I200769079","host_organization_name":"Hong Kong University of Science and Technology","host_organization_lineage":["https://openalex.org/I200769079"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":12,"referenced_works":["https://openalex.org/W1994727615","https://openalex.org/W2101196063","https://openalex.org/W2296407087","https://openalex.org/W2914721378","https://openalex.org/W2926767350","https://openalex.org/W3096566397","https://openalex.org/W3101708369","https://openalex.org/W3159894882","https://openalex.org/W4220807331","https://openalex.org/W4233963176","https://openalex.org/W4288070868","https://openalex.org/W6600291067"],"related_works":["https://openalex.org/W2098406302","https://openalex.org/W2121191383","https://openalex.org/W2538519144","https://openalex.org/W2546991807","https://openalex.org/W1584415117","https://openalex.org/W2076114130","https://openalex.org/W1505654810","https://openalex.org/W4252570104","https://openalex.org/W2734782074","https://openalex.org/W2109265242"],"abstract_inverted_index":{"Recently":[0],"Graph":[1],"Neural":[2],"Networks":[3],"(GNNs)":[4],"have":[5,42],"achieved":[6],"great":[7],"success":[8],"in":[9,149],"many":[10],"applications.":[11],"The":[12,144,198],"mini-batch":[13,28,49,105],"training":[14,39,134,152,196],"has":[15],"become":[16],"the":[17,27,37,48,57,60,67,74,95,104,120,181,187],"de-facto":[18],"way":[19],"to":[20,46,55,77,88,94,101,158,167,171,180],"train":[21],"GNNs":[22],"on":[23,136,164,177,205],"giant":[24],"graphs.":[25],"However,":[26],"generation":[29,106],"task":[30],"is":[31],"extremely":[32],"expensive":[33],"which":[34,117],"slows":[35],"down":[36],"whole":[38],"process.":[40],"Researchers":[41],"proposed":[43],"several":[44],"solutions":[45],"accelerate":[47,103],"generation,":[50],"however,":[51],"they":[52],"(1)":[53],"fail":[54],"exploit":[56],"locality":[58],"of":[59,151,190],"adjacency":[61],"matrix,":[62],"(2)":[63],"cannot":[64],"fully":[65],"utilize":[66,109],"GPU":[68,110],"memory,":[69],"and":[70,107,169,192,212],"(3)":[71],"suffer":[72],"from":[73],"poor":[75],"adaptability":[76],"diverse":[78,141],"workloads.":[79],"In":[80,92],"this":[81],"work,":[82],"we":[83],"propose":[84],"DUCATI,":[85],"aDual-Cache":[86],"system":[87,206],"overcome":[89],"these":[90],"drawbacks.":[91],"addition":[93],"traditionalNfeat-Cache,":[96],"DUCATI":[97,112,130,154,191],"introduces":[98],"a":[99,114],"newAdj-Cache":[100],"further":[102],"better":[108],"memory.":[111],"develops":[113],"workload-awareDual-Cache":[115],"Allocator":[116],"adaptively":[118],"finds":[119],"best":[121],"cache":[122],"allocation":[123],"plan":[124],"under":[125,140],"different":[126,209],"settings.":[127,143],"We":[128,184],"compare":[129],"with":[131],"various":[132],"GNN":[133,195],"systems":[135],"four":[137,193],"billion-scale":[138],"graphs":[139],"workload":[142],"experimental":[145],"results":[146,200],"show":[147],"that":[148],"terms":[150],"time,":[153],"can":[155],"achieve":[156],"up":[157,170],"3.33":[159],"times":[160,163,173,176],"speedup":[161,174],"(2.07":[162],"average)":[165,178],"compared":[166,179],"DGL":[168],"1.54":[172],"(1.32":[175],"state-of-the-artSingle-Cache":[182],"systems.":[183,197],"also":[185],"analyze":[186],"time-accuracy":[188],"trade-offs":[189],"state-of-the-art":[194],"analysis":[199],"offer":[201],"users":[202],"some":[203],"guidelines":[204],"selection":[207],"regarding":[208],"input":[210],"sizes":[211],"hardware":[213],"resources.":[214]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":20},{"year":2024,"cited_by_count":14},{"year":2023,"cited_by_count":2}],"updated_date":"2026-03-23T07:41:27.035349","created_date":"2025-10-10T00:00:00"}
