{"id":"https://openalex.org/W4407357390","doi":"https://doi.org/10.1145/3709738","title":"DiskGNN: Bridging I/O Efficiency and Model Accuracy for Out-of-Core GNN Training","display_name":"DiskGNN: Bridging I/O Efficiency and Model Accuracy for Out-of-Core GNN Training","publication_year":2025,"publication_date":"2025-02-10","ids":{"openalex":"https://openalex.org/W4407357390","doi":"https://doi.org/10.1145/3709738"},"language":"en","primary_location":{"id":"doi:10.1145/3709738","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3709738","pdf_url":null,"source":{"id":"https://openalex.org/S4387289859","display_name":"Proceedings of the ACM on Management of Data","issn_l":"2836-6573","issn":["2836-6573"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM on Management of Data","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5038657520","display_name":"Renjie Liu","orcid":"https://orcid.org/0009-0007-4332-2762"},"institutions":[{"id":"https://openalex.org/I3045169105","display_name":"Southern University of Science and Technology","ror":"https://ror.org/049tv2d57","country_code":"CN","type":"education","lineage":["https://openalex.org/I3045169105"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Renjie Liu","raw_affiliation_strings":["Southern University of Science and Technology, Shenzhen, China"],"raw_orcid":"https://orcid.org/0009-0007-4332-2762","affiliations":[{"raw_affiliation_string":"Southern University of Science and Technology, Shenzhen, China","institution_ids":["https://openalex.org/I3045169105"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031704840","display_name":"Y Z Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I134446601","display_name":"Berkeley College","ror":"https://ror.org/02xewxa75","country_code":"US","type":"education","lineage":["https://openalex.org/I134446601"]},{"id":"https://openalex.org/I95457486","display_name":"University of California, Berkeley","ror":"https://ror.org/01an7q238","country_code":"US","type":"education","lineage":["https://openalex.org/I95457486"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yichuan Wang","raw_affiliation_strings":["UC Berkeley, Berkeley, USA"],"raw_orcid":"https://orcid.org/0009-0007-3714-9326","affiliations":[{"raw_affiliation_string":"UC Berkeley, Berkeley, USA","institution_ids":["https://openalex.org/I134446601","https://openalex.org/I95457486"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100367774","display_name":"Xiao Yan","orcid":"https://orcid.org/0000-0002-2122-915X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiao Yan","raw_affiliation_strings":["Centre for Perceptual and Interactive Intelligence, Hong Kong, Hong Kong"],"raw_orcid":"https://orcid.org/0000-0002-2122-915X","affiliations":[{"raw_affiliation_string":"Centre for Perceptual and Interactive Intelligence, Hong Kong, Hong Kong","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102663229","display_name":"Haitian Jiang","orcid":null},"institutions":[{"id":"https://openalex.org/I57206974","display_name":"New York University","ror":"https://ror.org/0190ak572","country_code":"US","type":"education","lineage":["https://openalex.org/I57206974"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Haitian Jiang","raw_affiliation_strings":["New York University, New York, USA"],"raw_orcid":"https://orcid.org/0009-0009-0350-1058","affiliations":[{"raw_affiliation_string":"New York University, New York, USA","institution_ids":["https://openalex.org/I57206974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000220537","display_name":"Zhenkun Cai","orcid":"https://orcid.org/0000-0002-0199-4866"},"institutions":[{"id":"https://openalex.org/I1311688040","display_name":"Amazon (United States)","ror":"https://ror.org/04mv4n011","country_code":"US","type":"company","lineage":["https://openalex.org/I1311688040"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zhenkun Cai","raw_affiliation_strings":["Amazon, Santa Clara, USA"],"raw_orcid":"https://orcid.org/0000-0002-0199-4866","affiliations":[{"raw_affiliation_string":"Amazon, Santa Clara, USA","institution_ids":["https://openalex.org/I1311688040"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057909000","display_name":"Minjie Wang","orcid":"https://orcid.org/0009-0009-8156-1179"},"institutions":[{"id":"https://openalex.org/I3132425485","display_name":"Shanghai American School","ror":"https://ror.org/03xzda142","country_code":"CN","type":"education","lineage":["https://openalex.org/I3132425485"]},{"id":"https://openalex.org/I4391012619","display_name":"Shanghai Artificial Intelligence Laboratory","ror":"https://ror.org/03wkvpx79","country_code":null,"type":"facility","lineage":["https://openalex.org/I4391012619"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Minjie Wang","raw_affiliation_strings":["AWS Shanghai AI Lab, Shanghai, China"],"raw_orcid":"https://orcid.org/0009-0009-8156-1179","affiliations":[{"raw_affiliation_string":"AWS Shanghai AI Lab, Shanghai, China","institution_ids":["https://openalex.org/I3132425485","https://openalex.org/I4391012619"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101455930","display_name":"Bo Tang","orcid":"https://orcid.org/0000-0001-8424-0092"},"institutions":[{"id":"https://openalex.org/I3045169105","display_name":"Southern University of Science and Technology","ror":"https://ror.org/049tv2d57","country_code":"CN","type":"education","lineage":["https://openalex.org/I3045169105"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bo Tang","raw_affiliation_strings":["Southern University of Science and Technology, Shenzhen, China"],"raw_orcid":"https://orcid.org/0000-0001-8424-0092","affiliations":[{"raw_affiliation_string":"Southern University of Science and Technology, Shenzhen, China","institution_ids":["https://openalex.org/I3045169105"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5073978798","display_name":"Jinyang Li","orcid":"https://orcid.org/0000-0002-9574-1746"},"institutions":[{"id":"https://openalex.org/I57206974","display_name":"New York University","ror":"https://ror.org/0190ak572","country_code":"US","type":"education","lineage":["https://openalex.org/I57206974"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jinyang Li","raw_affiliation_strings":["New York University, New York, USA"],"raw_orcid":"https://orcid.org/0000-0002-9574-1746","affiliations":[{"raw_affiliation_string":"New York University, New York, USA","institution_ids":["https://openalex.org/I57206974"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5038657520"],"corresponding_institution_ids":["https://openalex.org/I3045169105"],"apc_list":null,"apc_paid":null,"fwci":12.9278,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.98437018,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":"3","issue":"1","first_page":"1","last_page":"27"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.996399998664856,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.996399998664856,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9955999851226807,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9932000041007996,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/bridging","display_name":"Bridging (networking)","score":0.9008567929267883},{"id":"https://openalex.org/keywords/core","display_name":"Core (optical fiber)","score":0.5656862854957581},{"id":"https://openalex.org/keywords/training","display_name":"Training (meteorology)","score":0.4785745441913605},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.4587751626968384},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.11474007368087769},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.051915258169174194}],"concepts":[{"id":"https://openalex.org/C174348530","wikidata":"https://www.wikidata.org/wiki/Q188635","display_name":"Bridging (networking)","level":2,"score":0.9008567929267883},{"id":"https://openalex.org/C2164484","wikidata":"https://www.wikidata.org/wiki/Q5170150","display_name":"Core (optical fiber)","level":2,"score":0.5656862854957581},{"id":"https://openalex.org/C2777211547","wikidata":"https://www.wikidata.org/wiki/Q17141490","display_name":"Training (meteorology)","level":2,"score":0.4785745441913605},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4587751626968384},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.11474007368087769},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.051915258169174194},{"id":"https://openalex.org/C153294291","wikidata":"https://www.wikidata.org/wiki/Q25261","display_name":"Meteorology","level":1,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3709738","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3709738","pdf_url":null,"source":{"id":"https://openalex.org/S4387289859","display_name":"Proceedings of the ACM on Management of Data","issn_l":"2836-6573","issn":["2836-6573"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM on Management of Data","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":15,"referenced_works":["https://openalex.org/W2068739275","https://openalex.org/W2070232376","https://openalex.org/W2893230400","https://openalex.org/W2963601856","https://openalex.org/W2964236544","https://openalex.org/W3009901425","https://openalex.org/W3099064659","https://openalex.org/W3123329971","https://openalex.org/W3159109662","https://openalex.org/W3167523712","https://openalex.org/W4220807331","https://openalex.org/W4221106024","https://openalex.org/W4321466207","https://openalex.org/W4387321131","https://openalex.org/W4399174525"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W4388870064","https://openalex.org/W2210139803","https://openalex.org/W4235186151","https://openalex.org/W2054685365","https://openalex.org/W2056057048","https://openalex.org/W2667588871","https://openalex.org/W2272354214"],"abstract_inverted_index":{"Graph":[0],"neural":[1],"networks":[2],"(GNNs)":[3],"are":[4,55],"models":[5],"specialized":[6],"for":[7,51,79,112,145],"graph":[8,68,99,109],"data":[9,32],"and":[10,35,83,127,172,179,191],"widely":[11],"used":[12],"in":[13],"applications.":[14],"To":[15,72],"train":[16],"GNNs":[17],"on":[18,33,139],"large":[19],"graphs":[20],"that":[21,54,120,213],"exceed":[22],"CPU":[23,173],"memory,":[24],"several":[25],"systems":[26,41,222],"have":[27],"been":[28],"designed":[29],"to":[30,130,141,164,174,185,194],"store":[31,163],"disk":[34,59,140,181,196],"conduct":[36],"out-of-core":[37,206],"processing.":[38],"However,":[39],"these":[40],"suffer":[42],"from":[43,101],"either":[44],"read":[45,143],"amplification":[46,144],"when":[47],"conducting":[48,108],"random":[49],"reads":[50],"node":[52,118,133,177],"features":[53,119,134,178],"smaller":[56],"than":[57,217],"a":[58],"page,":[60],"or":[61],"degraded":[62],"model":[63,87,102,125,227],"accuracy":[64,88],"by":[65,107,153],"treating":[66],"the":[67,117,132,148,167],"as":[69],"disconnected":[70],"partitions.":[71],"close":[73],"this":[74],"gap,":[75],"we":[76],"build":[77],"DiskGNN":[78,115,156,203,214,229],"high":[80],"I/O":[81],"efficiency":[82],"fast":[84],"training":[85,193,208],"without":[86],"degradation.":[89],"The":[90,210],"key":[91],"technique":[92],"is":[93,230],"offline":[94,154],"sampling":[95,100,110],",":[96],"which":[97],"decouples":[98],"computation":[103,126],".":[104],"In":[105],"particular,":[106],"beforehand":[111],"multiple":[113],"mini-batches,":[114],"acquires":[116],"will":[121],"be":[122],"accessed":[123],"during":[124,189],"conducts":[128],"pre-processing":[129],"pack":[131],"of":[135,170],"each":[136],"mini-batch":[137],"contiguously":[138],"avoid":[142],"computation.":[146],"Given":[147],"feature":[149,162,187],"access":[150,197],"information":[151],"acquired":[152],"sampling,":[155],"also":[157],"adopts":[158],"designs":[159],"including":[160],"four-level":[161],"fully":[165],"utilize":[166],"memory":[168],"hierarchy":[169],"GPU":[171],"cache":[175],"hot":[176],"reduce":[180],"access,":[182],"batched":[183],"packing":[184,188],"accelerate":[186],"pre-processing,":[190],"pipelined":[192],"overlap":[195],"with":[198,204],"other":[199],"operations.":[200],"We":[201],"compare":[202],"state-of-the-art":[205],"GNN":[207],"systems.":[209],"results":[211],"show":[212],"has":[215],"more":[216],"8x":[218],"speedup":[219],"over":[220],"existing":[221],"while":[223],"matching":[224],"their":[225],"best":[226],"accuracy.":[228],"open-source":[231],"at":[232],"https://github.com/Liu-rj/DiskGNN.":[233]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":5}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
