{"id":"https://openalex.org/W3139142452","doi":"https://doi.org/10.1109/cgo51591.2021.9370326","title":"Efficient Execution of Graph Algorithms on CPU with SIMD Extensions","display_name":"Efficient Execution of Graph Algorithms on CPU with SIMD Extensions","publication_year":2021,"publication_date":"2021-02-27","ids":{"openalex":"https://openalex.org/W3139142452","doi":"https://doi.org/10.1109/cgo51591.2021.9370326","mag":"3139142452"},"language":"en","primary_location":{"id":"doi:10.1109/cgo51591.2021.9370326","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cgo51591.2021.9370326","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE/ACM International Symposium on Code Generation and Optimization (CGO)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.5281/zenodo.4279811","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5049128051","display_name":"Ruohuang Zheng","orcid":null},"institutions":[{"id":"https://openalex.org/I5388228","display_name":"University of Rochester","ror":"https://ror.org/022kthw22","country_code":"US","type":"education","lineage":["https://openalex.org/I5388228"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Ruohuang Zheng","raw_affiliation_strings":["University of Rochester,Department of Computer Science,Rochester,New York,USA"],"affiliations":[{"raw_affiliation_string":"University of Rochester,Department of Computer Science,Rochester,New York,USA","institution_ids":["https://openalex.org/I5388228"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5006053754","display_name":"Sreepathi Pai","orcid":"https://orcid.org/0000-0002-3691-7238"},"institutions":[{"id":"https://openalex.org/I5388228","display_name":"University of Rochester","ror":"https://ror.org/022kthw22","country_code":"US","type":"education","lineage":["https://openalex.org/I5388228"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sreepathi Pai","raw_affiliation_strings":["University of Rochester,Department of Computer Science,Rochester,New York,USA"],"affiliations":[{"raw_affiliation_string":"University of Rochester,Department of Computer Science,Rochester,New York,USA","institution_ids":["https://openalex.org/I5388228"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5049128051"],"corresponding_institution_ids":["https://openalex.org/I5388228"],"apc_list":null,"apc_paid":null,"fwci":0.9692,"has_fulltext":false,"cited_by_count":13,"citation_normalized_percentile":{"value":0.76936038,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"262","last_page":"276"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12292","display_name":"Graph Theory and Algorithms","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12292","display_name":"Graph Theory and Algorithms","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.993399977684021,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9778000116348267,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/simd","display_name":"SIMD","score":0.928770899772644},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.870149552822113},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.7686119079589844},{"id":"https://openalex.org/keywords/compiler","display_name":"Compiler","score":0.6857684254646301},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.5596854090690613},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.5284735560417175},{"id":"https://openalex.org/keywords/multi-core-processor","display_name":"Multi-core processor","score":0.5229713916778564},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.16818493604660034},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.1190849244594574}],"concepts":[{"id":"https://openalex.org/C150552126","wikidata":"https://www.wikidata.org/wiki/Q339387","display_name":"SIMD","level":2,"score":0.928770899772644},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.870149552822113},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.7686119079589844},{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.6857684254646301},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.5596854090690613},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.5284735560417175},{"id":"https://openalex.org/C78766204","wikidata":"https://www.wikidata.org/wiki/Q555032","display_name":"Multi-core processor","level":2,"score":0.5229713916778564},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.16818493604660034},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.1190849244594574}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/cgo51591.2021.9370326","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cgo51591.2021.9370326","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE/ACM International Symposium on Code Generation and Optimization (CGO)","raw_type":"proceedings-article"},{"id":"doi:10.5281/zenodo.4279811","is_oa":true,"landing_page_url":"https://doi.org/10.5281/zenodo.4279811","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.5281/zenodo.4279811","is_oa":true,"landing_page_url":"https://doi.org/10.5281/zenodo.4279811","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Affordable and clean energy","score":0.550000011920929,"id":"https://metadata.un.org/sdg/7"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":82,"referenced_works":["https://openalex.org/W78077100","https://openalex.org/W1502558230","https://openalex.org/W1526813343","https://openalex.org/W1533802931","https://openalex.org/W1536852470","https://openalex.org/W1543897857","https://openalex.org/W1593868476","https://openalex.org/W1783256592","https://openalex.org/W1788180225","https://openalex.org/W1850405760","https://openalex.org/W1964876237","https://openalex.org/W1969970763","https://openalex.org/W1972663160","https://openalex.org/W1985291160","https://openalex.org/W1986647922","https://openalex.org/W1988888548","https://openalex.org/W2000041758","https://openalex.org/W2003168947","https://openalex.org/W2021211271","https://openalex.org/W2034102265","https://openalex.org/W2038497593","https://openalex.org/W2041470524","https://openalex.org/W2049487370","https://openalex.org/W2050487400","https://openalex.org/W2067479799","https://openalex.org/W2067635581","https://openalex.org/W2095223744","https://openalex.org/W2097717378","https://openalex.org/W2104329103","https://openalex.org/W2107173440","https://openalex.org/W2128653745","https://openalex.org/W2135063076","https://openalex.org/W2157427457","https://openalex.org/W2170616854","https://openalex.org/W2186129770","https://openalex.org/W2249320699","https://openalex.org/W2271498114","https://openalex.org/W2295258302","https://openalex.org/W2295329047","https://openalex.org/W2339410347","https://openalex.org/W2399032974","https://openalex.org/W2399701057","https://openalex.org/W2409247164","https://openalex.org/W2479334570","https://openalex.org/W2523378841","https://openalex.org/W2524623326","https://openalex.org/W2566870951","https://openalex.org/W2739409954","https://openalex.org/W2788443250","https://openalex.org/W2788981395","https://openalex.org/W2798525482","https://openalex.org/W2799267250","https://openalex.org/W2898231337","https://openalex.org/W2915012400","https://openalex.org/W2931071418","https://openalex.org/W2951113132","https://openalex.org/W2951135776","https://openalex.org/W2953944188","https://openalex.org/W2954219808","https://openalex.org/W2962740062","https://openalex.org/W2962865652","https://openalex.org/W2991447257","https://openalex.org/W3006582303","https://openalex.org/W3007195951","https://openalex.org/W3007641860","https://openalex.org/W3008451639","https://openalex.org/W3011163152","https://openalex.org/W3013652274","https://openalex.org/W3021182071","https://openalex.org/W3030829407","https://openalex.org/W3034302216","https://openalex.org/W3098245953","https://openalex.org/W3139142452","https://openalex.org/W4241140669","https://openalex.org/W4242887260","https://openalex.org/W4245643018","https://openalex.org/W4297789040","https://openalex.org/W6603201521","https://openalex.org/W6635451513","https://openalex.org/W6638233953","https://openalex.org/W6712590890","https://openalex.org/W6727469013"],"related_works":["https://openalex.org/W2778498407","https://openalex.org/W2317245370","https://openalex.org/W2099629705","https://openalex.org/W4249323025","https://openalex.org/W2111180768","https://openalex.org/W198851386","https://openalex.org/W2030310580","https://openalex.org/W947442053","https://openalex.org/W1980160788","https://openalex.org/W2148915962"],"abstract_inverted_index":{"Existing":[0],"state-of-the-art":[1,120],"CPU":[2,140,147],"graph":[3,26,33,44,121],"frameworks":[4],"take":[5],"advantage":[6],"of":[7],"multiple":[8],"cores,":[9],"but":[10,145],"not":[11],"the":[12,31,64,98,112,119,136,139,146],"SIMD":[13,37,75,100,115,131],"capability":[14],"within":[15],"each":[16],"core.":[17],"In":[18],"this":[19,48],"work,":[20],"we":[21],"retarget":[22],"an":[23,82],"existing":[24],"GPU":[25,142],"algorithm":[27],"compiler":[28,49],"to":[29,41,63,143],"obtain":[30],"first":[32],"framework":[34],"that":[35,69],"uses":[36],"extensions":[38],"on":[39,50,56,70,76,133],"CPUs":[40,59,134],"efficiently":[42],"execute":[43],"algorithms.":[45],"We":[46],"evaluate":[47],"10":[51,88],"benchmarks":[52,89],"and":[53,60,90,141],"3":[54,57,91],"graphs":[55,153],"different":[58],"also":[61,117],"compare":[62],"GPU.":[65],"Evaluation":[66],"results":[67],"show":[68],"a":[71,77,105],"8-core":[72],"machine,":[73],"enabling":[74],"naive":[78],"multi-core":[79,114],"implementation":[80,101,107],"achieves":[81],"additional":[83],"7.48x":[84],"speedup,":[85],"averaged":[86,126],"across":[87,127],"inputs.":[92],"Applying":[93],"our":[94],"SIMD-targeted":[95],"optimizations":[96],"improves":[97],"plain":[99],"by":[102,108,124],"1.67x,":[103],"outperforming":[104],"serial":[106],"12.46x.":[109],"On":[110],"average,":[111],"optimized":[113],"version":[116],"outperforms":[118],"framework,":[122],"GraphIt,":[123],"1.53x,":[125],"5":[128],"(common)":[129],"benchmarks.":[130],"execution":[132],"closes":[135],"gap":[137],"between":[138],"1.76x,":[144],"virtual":[148],"memory":[149],"performs":[150],"better":[151],"when":[152],"are":[154],"much":[155],"bigger":[156],"than":[157],"available":[158],"physical":[159],"memory.":[160]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":4}],"updated_date":"2026-03-31T07:56:22.981413","created_date":"2025-10-10T00:00:00"}
