{"id":"https://openalex.org/W2971709192","doi":"https://doi.org/10.1109/hpec.2019.8916498","title":"Accelerating DNN Inference with GraphBLAS and the GPU","display_name":"Accelerating DNN Inference with GraphBLAS and the GPU","publication_year":2019,"publication_date":"2019-09-01","ids":{"openalex":"https://openalex.org/W2971709192","doi":"https://doi.org/10.1109/hpec.2019.8916498","mag":"2971709192"},"language":"en","primary_location":{"id":"doi:10.1109/hpec.2019.8916498","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hpec.2019.8916498","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE High Performance Extreme Computing Conference (HPEC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://escholarship.org/content/qt1fg335kd/qt1fg335kd.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100447919","display_name":"Xiaoyun Wang","orcid":"https://orcid.org/0000-0002-7846-269X"},"institutions":[{"id":"https://openalex.org/I84218800","display_name":"University of California, Davis","ror":"https://ror.org/05rrcem69","country_code":"US","type":"education","lineage":["https://openalex.org/I84218800"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Xiaoyun Wang","raw_affiliation_strings":["Department of Computer Science, University of California, Davis, Davis, California"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of California, Davis, Davis, California","institution_ids":["https://openalex.org/I84218800"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082748769","display_name":"Zhongyi Lin","orcid":"https://orcid.org/0000-0002-5992-3913"},"institutions":[{"id":"https://openalex.org/I84218800","display_name":"University of California, Davis","ror":"https://ror.org/05rrcem69","country_code":"US","type":"education","lineage":["https://openalex.org/I84218800"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zhongyi Lin","raw_affiliation_strings":["Department of Electrical & Computer Engineering, University of California, Davis, Davis, California"],"affiliations":[{"raw_affiliation_string":"Department of Electrical & Computer Engineering, University of California, Davis, Davis, California","institution_ids":["https://openalex.org/I84218800"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006897094","display_name":"Carl Yang","orcid":"https://orcid.org/0000-0001-9145-4531"},"institutions":[{"id":"https://openalex.org/I84218800","display_name":"University of California, Davis","ror":"https://ror.org/05rrcem69","country_code":"US","type":"education","lineage":["https://openalex.org/I84218800"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Carl Yang","raw_affiliation_strings":["Department of Electrical & Computer Engineering, University of California, Davis, Davis, California"],"affiliations":[{"raw_affiliation_string":"Department of Electrical & Computer Engineering, University of California, Davis, Davis, California","institution_ids":["https://openalex.org/I84218800"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5028662746","display_name":"John D. Owens","orcid":"https://orcid.org/0000-0001-6582-8237"},"institutions":[{"id":"https://openalex.org/I84218800","display_name":"University of California, Davis","ror":"https://ror.org/05rrcem69","country_code":"US","type":"education","lineage":["https://openalex.org/I84218800"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"John D. Owens","raw_affiliation_strings":["Department of Electrical & Computer Engineering, University of California, Davis, Davis, California"],"affiliations":[{"raw_affiliation_string":"Department of Electrical & Computer Engineering, University of California, Davis, Davis, California","institution_ids":["https://openalex.org/I84218800"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5100447919"],"corresponding_institution_ids":["https://openalex.org/I84218800"],"apc_list":null,"apc_paid":null,"fwci":1.1559,"has_fulltext":true,"cited_by_count":8,"citation_normalized_percentile":{"value":0.84506135,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12292","display_name":"Graph Theory and Algorithms","score":0.996399998664856,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12808","display_name":"Ferroelectric and Negative Capacitance Devices","score":0.9825999736785889,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7446683049201965},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.6658785343170166},{"id":"https://openalex.org/keywords/general-purpose-computing-on-graphics-processing-units","display_name":"General-purpose computing on graphics processing units","score":0.47263047099113464},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.45118409395217896},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.38551270961761475},{"id":"https://openalex.org/keywords/computer-graphics","display_name":"Computer graphics (images)","score":0.3352035880088806},{"id":"https://openalex.org/keywords/graphics","display_name":"Graphics","score":0.128745436668396}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7446683049201965},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.6658785343170166},{"id":"https://openalex.org/C50630238","wikidata":"https://www.wikidata.org/wiki/Q971505","display_name":"General-purpose computing on graphics processing units","level":3,"score":0.47263047099113464},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.45118409395217896},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.38551270961761475},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.3352035880088806},{"id":"https://openalex.org/C21442007","wikidata":"https://www.wikidata.org/wiki/Q1027879","display_name":"Graphics","level":2,"score":0.128745436668396}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/hpec.2019.8916498","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hpec.2019.8916498","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE High Performance Extreme Computing Conference (HPEC)","raw_type":"proceedings-article"},{"id":"pmh:oai:escholarship.org/ark:/13030/qt1fg335kd","is_oa":true,"landing_page_url":"https://escholarship.org/uc/item/1fg335kd","pdf_url":"https://escholarship.org/content/qt1fg335kd/qt1fg335kd.pdf","source":{"id":"https://openalex.org/S4306400115","display_name":"eScholarship (California Digital Library)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I2801248553","host_organization_name":"California Digital Library","host_organization_lineage":["https://openalex.org/I2801248553"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:escholarship.org/ark:/13030/qt1fg335kd","is_oa":true,"landing_page_url":"https://escholarship.org/uc/item/1fg335kd","pdf_url":"https://escholarship.org/content/qt1fg335kd/qt1fg335kd.pdf","source":{"id":"https://openalex.org/S4306400115","display_name":"eScholarship (California Digital Library)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I2801248553","host_organization_name":"California Digital Library","host_organization_lineage":["https://openalex.org/I2801248553"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"article"},"sustainable_development_goals":[{"score":0.41999998688697815,"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2971709192.pdf","grobid_xml":"https://content.openalex.org/works/W2971709192.grobid-xml"},"referenced_works_count":16,"referenced_works":["https://openalex.org/W2089437293","https://openalex.org/W2095249664","https://openalex.org/W2146292423","https://openalex.org/W2461193710","https://openalex.org/W2743799610","https://openalex.org/W2751658790","https://openalex.org/W2762661956","https://openalex.org/W2785452945","https://openalex.org/W2811247723","https://openalex.org/W2883830791","https://openalex.org/W2965423625","https://openalex.org/W2995872593","https://openalex.org/W3098650335","https://openalex.org/W3099786550","https://openalex.org/W3101104221","https://openalex.org/W4294761111"],"related_works":["https://openalex.org/W2306641587","https://openalex.org/W2137218050","https://openalex.org/W2982613029","https://openalex.org/W1997955449","https://openalex.org/W2080914619","https://openalex.org/W3045822024","https://openalex.org/W4251483198","https://openalex.org/W2073045545","https://openalex.org/W3214851784","https://openalex.org/W4250047567"],"abstract_inverted_index":{"This":[0],"work":[1],"addresses":[2],"the":[3,18,35,46,58,65],"2019":[4],"Sparse":[5],"Deep":[6],"Neural":[7],"Network":[8],"Graph":[9],"Challenge":[10],"with":[11,29],"an":[12],"implementation":[13,33,44,50],"of":[14],"this":[15,27],"challenge":[16,28],"using":[17],"GraphBLAS":[19,32,43],"programming":[20],"model.":[21],"We":[22],"demonstrate":[23],"our":[24],"solution":[25],"to":[26,40,61],"GraphBLAST,":[30],"a":[31,42,68],"on":[34,45,64],"GPU,":[36],"and":[37],"compare":[38],"it":[39],"SuiteSparse,":[41],"CPU.":[47],"The":[48],"GraphBLAST":[49],"is":[51,67],"$1.94":[52],"\\times":[53],"$":[54],"faster":[55],"than":[56],"Suite-Sparse;":[57],"primary":[59],"opportunity":[60],"increase":[62],"performance":[63],"GPU":[66],"higher-performance":[69],"sparse-matrix-times-sparse-matrix":[70],"(SpGEMM)":[71],"kernel.":[72]},"counts_by_year":[{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":4}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
