{"id":"https://openalex.org/W2895821746","doi":"https://doi.org/10.1109/access.2018.2876201","title":"Accelerating BFS via Data Structure-Aware Prefetching on GPU","display_name":"Accelerating BFS via Data Structure-Aware Prefetching on GPU","publication_year":2018,"publication_date":"2018-01-01","ids":{"openalex":"https://openalex.org/W2895821746","doi":"https://doi.org/10.1109/access.2018.2876201","mag":"2895821746"},"language":"en","primary_location":{"id":"doi:10.1109/access.2018.2876201","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2018.2876201","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1109/access.2018.2876201","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101617974","display_name":"Hui Guo","orcid":null},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Hui Guo","raw_affiliation_strings":["1National University of Defense Technology, Changsha, China"],"affiliations":[{"raw_affiliation_string":"1National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044840341","display_name":"Libo Huang","orcid":"https://orcid.org/0000-0001-7878-3998"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Libo Huang","raw_affiliation_strings":["1National University of Defense Technology, Changsha, China"],"affiliations":[{"raw_affiliation_string":"1National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086487289","display_name":"Yashuai L\u00fc","orcid":null},"institutions":[{"id":"https://openalex.org/I4210148107","display_name":"Space Engineering University","ror":"https://ror.org/04rj1td02","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210148107"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yashuai Lu","raw_affiliation_strings":["Space Engineering University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Space Engineering University, Beijing, China","institution_ids":["https://openalex.org/I4210148107"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009164671","display_name":"Jianqiao Ma","orcid":null},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jianqiao Ma","raw_affiliation_strings":["1National University of Defense Technology, Changsha, China"],"affiliations":[{"raw_affiliation_string":"1National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100769507","display_name":"Cheng Qian","orcid":"https://orcid.org/0000-0002-1999-387X"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Cheng Qian","raw_affiliation_strings":["1National University of Defense Technology, Changsha, China"],"affiliations":[{"raw_affiliation_string":"1National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100760813","display_name":"Sheng Ma","orcid":"https://orcid.org/0000-0003-1710-4060"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Sheng Ma","raw_affiliation_strings":["1National University of Defense Technology, Changsha, China"],"affiliations":[{"raw_affiliation_string":"1National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5047295889","display_name":"Zhiying Wang","orcid":"https://orcid.org/0000-0003-3339-3085"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhiying Wang","raw_affiliation_strings":["1National University of Defense Technology, Changsha, China"],"affiliations":[{"raw_affiliation_string":"1National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5101617974"],"corresponding_institution_ids":["https://openalex.org/I170215575"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":0.7574,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.70092887,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":"6","issue":null,"first_page":"60234","last_page":"60248"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12292","display_name":"Graph Theory and Algorithms","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10829","display_name":"Interconnection Networks and Systems","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.9062517881393433},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.7327916622161865},{"id":"https://openalex.org/keywords/cache","display_name":"Cache","score":0.5519949793815613},{"id":"https://openalex.org/keywords/data-structure","display_name":"Data structure","score":0.5261461138725281},{"id":"https://openalex.org/keywords/granularity","display_name":"Granularity","score":0.5127533674240112},{"id":"https://openalex.org/keywords/general-purpose-computing-on-graphics-processing-units","display_name":"General-purpose computing on graphics processing units","score":0.5087419152259827},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.5081930160522461},{"id":"https://openalex.org/keywords/data-access","display_name":"Data access","score":0.48366984724998474},{"id":"https://openalex.org/keywords/traverse","display_name":"Traverse","score":0.45683926343917847},{"id":"https://openalex.org/keywords/latency","display_name":"Latency (audio)","score":0.4377667009830475},{"id":"https://openalex.org/keywords/instruction-prefetch","display_name":"Instruction prefetch","score":0.418127179145813},{"id":"https://openalex.org/keywords/performance-improvement","display_name":"Performance improvement","score":0.4112907350063324},{"id":"https://openalex.org/keywords/cas-latency","display_name":"CAS latency","score":0.4105337858200073},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.23018789291381836},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.16474124789237976},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.15141448378562927}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.9062517881393433},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.7327916622161865},{"id":"https://openalex.org/C115537543","wikidata":"https://www.wikidata.org/wiki/Q165596","display_name":"Cache","level":2,"score":0.5519949793815613},{"id":"https://openalex.org/C162319229","wikidata":"https://www.wikidata.org/wiki/Q175263","display_name":"Data structure","level":2,"score":0.5261461138725281},{"id":"https://openalex.org/C177774035","wikidata":"https://www.wikidata.org/wiki/Q1246948","display_name":"Granularity","level":2,"score":0.5127533674240112},{"id":"https://openalex.org/C50630238","wikidata":"https://www.wikidata.org/wiki/Q971505","display_name":"General-purpose computing on graphics processing units","level":3,"score":0.5087419152259827},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.5081930160522461},{"id":"https://openalex.org/C47487241","wikidata":"https://www.wikidata.org/wiki/Q5227230","display_name":"Data access","level":2,"score":0.48366984724998474},{"id":"https://openalex.org/C176809094","wikidata":"https://www.wikidata.org/wiki/Q15401496","display_name":"Traverse","level":2,"score":0.45683926343917847},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.4377667009830475},{"id":"https://openalex.org/C133588205","wikidata":"https://www.wikidata.org/wiki/Q28455645","display_name":"Instruction prefetch","level":3,"score":0.418127179145813},{"id":"https://openalex.org/C2778915421","wikidata":"https://www.wikidata.org/wiki/Q3643177","display_name":"Performance improvement","level":2,"score":0.4112907350063324},{"id":"https://openalex.org/C189930140","wikidata":"https://www.wikidata.org/wiki/Q1112878","display_name":"CAS latency","level":4,"score":0.4105337858200073},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.23018789291381836},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.16474124789237976},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.15141448378562927},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C100800780","wikidata":"https://www.wikidata.org/wiki/Q1175867","display_name":"Memory controller","level":3,"score":0.0},{"id":"https://openalex.org/C21442007","wikidata":"https://www.wikidata.org/wiki/Q1027879","display_name":"Graphics","level":2,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C98986596","wikidata":"https://www.wikidata.org/wiki/Q1143031","display_name":"Semiconductor memory","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2018.2876201","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2018.2876201","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:72747cd207e14dc8a25a142ed0ebf335","is_oa":true,"landing_page_url":"https://doaj.org/article/72747cd207e14dc8a25a142ed0ebf335","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 6, Pp 60234-60248 (2018)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2018.2876201","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2018.2876201","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Affordable and clean energy","id":"https://metadata.un.org/sdg/7","score":0.7799999713897705}],"awards":[{"id":"https://openalex.org/G2187338242","display_name":null,"funder_award_id":"61672526","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2341129714","display_name":null,"funder_award_id":"61472435","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3582114861","display_name":null,"funder_award_id":"61433019","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5419710353","display_name":null,"funder_award_id":"61572058","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8213023024","display_name":null,"funder_award_id":"61202129","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8838893027","display_name":null,"funder_award_id":"U14352217","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":46,"referenced_works":["https://openalex.org/W1975274780","https://openalex.org/W1979527452","https://openalex.org/W1983235612","https://openalex.org/W2009946006","https://openalex.org/W2023925637","https://openalex.org/W2027806965","https://openalex.org/W2050710108","https://openalex.org/W2056160756","https://openalex.org/W2065562952","https://openalex.org/W2093043622","https://openalex.org/W2099912705","https://openalex.org/W2102409597","https://openalex.org/W2103330947","https://openalex.org/W2107251158","https://openalex.org/W2125305952","https://openalex.org/W2129232868","https://openalex.org/W2142444503","https://openalex.org/W2143285027","https://openalex.org/W2152659795","https://openalex.org/W2153492376","https://openalex.org/W2159767828","https://openalex.org/W2165284728","https://openalex.org/W2166620913","https://openalex.org/W2166918318","https://openalex.org/W2168887341","https://openalex.org/W2169190816","https://openalex.org/W2170382128","https://openalex.org/W2315868086","https://openalex.org/W2333944373","https://openalex.org/W2518607193","https://openalex.org/W2537450429","https://openalex.org/W2755088640","https://openalex.org/W2769389493","https://openalex.org/W2785460572","https://openalex.org/W2789977517","https://openalex.org/W2790040252","https://openalex.org/W2886858179","https://openalex.org/W3030752614","https://openalex.org/W3138340923","https://openalex.org/W3204389768","https://openalex.org/W4231523139","https://openalex.org/W4234833047","https://openalex.org/W4235870392","https://openalex.org/W4237150160","https://openalex.org/W4249082578","https://openalex.org/W6792253866"],"related_works":["https://openalex.org/W2075500488","https://openalex.org/W1530597339","https://openalex.org/W2336226224","https://openalex.org/W134340165","https://openalex.org/W2068131691","https://openalex.org/W1557286738","https://openalex.org/W2546695182","https://openalex.org/W2101018784","https://openalex.org/W3113336200","https://openalex.org/W4360765372"],"abstract_inverted_index":{"Breadth":[0],"First":[1],"Search":[2],"(BFS)":[3],"is":[4],"a":[5,52,132,190,207,229],"key":[6],"graph":[7,12,23,38,123],"traversing":[8,39],"algorithm":[9],"for":[10,104,243],"many":[11,34],"analytics":[13,24],"applications.":[14,203],"In":[15,126],"recent":[16],"decades,":[17],"as":[18],"the":[19,22,45,56,61,73,80,84,118,122,144,162,165,171,180,183,250,254,258,269],"scale":[20],"of":[21,50,55,63,82,121,150,164,182,202,212,220],"problem":[25],"has":[26,32],"become":[27],"larger":[28],"and":[29,175,193,257,264],"larger,":[30],"it":[31],"raised":[33],"interests":[35],"to":[36,44,78,110,160,169,215,252,266],"accelerate":[37],"on":[40,91,136,143,179,189,239],"GPU.":[41],"However,":[42,87],"due":[43],"irregular":[46,96],"memory":[47,57,75,97],"access":[48,148],"pattern":[49,149],"BFS,":[51],"great":[53],"number":[54],"divergent":[58],"accesses":[59,98],"harm":[60],"efficiency":[62],"GPU":[64,92,137,221],"dramatically.":[65],"Data":[66],"prefetching":[67,89,114,140,158,166,177,224,234],"can":[68,205],"fetch":[69],"useful":[70],"data":[71,124,133,146,176,196,245],"into":[72],"on-chip":[74],"in":[76,227,262,275],"advance":[77],"reduce":[79],"latency":[81],"accessing":[83],"off-chip":[85],"memory.":[86],"traditional":[88],"techniques":[90],"cannot":[93],"deal":[94],"with":[95,218,222],"efficiently.":[99],"By":[100],"analyzing":[101],"BFS":[102,241],"algorithms":[103],"GPU,":[105],"we":[106,129,153,248],"find":[107],"an":[108,112,155],"opportunity":[109],"design":[111],"efficient":[113],"mechanism":[115,235],"by":[116],"using":[117],"explicit":[119],"information":[120],"structure.":[125],"this":[127],"paper,":[128],"propose":[130],"DSAP,":[131],"structure-aware":[134],"prefetcher":[135],"that":[138,219],"generates":[139],"requests":[141],"based":[142,178],"well-defined":[145],"structure":[147],"BFS.":[151],"Also,":[152,247],"introduce":[154],"adaptive":[156],"fine-grain":[157],"management":[159],"adjust":[161],"status":[163],"granularity":[167],"dynamically":[168],"balance":[170],"cache":[172],"resource":[173],"contention":[174],"utilization":[181],"prefetched":[184],"data.":[185],"We":[186],"implement":[187],"DSAP":[188,204],"GPGPU-sim":[191],"simulator":[192],"evaluate":[194],"six":[195],"sets":[197],"from":[198],"three":[199],"different":[200],"kinds":[201],"achieve":[206],"geometrical":[208],"mean":[209],"IPC":[210],"improvement":[211],"28%,":[213],"up":[214,265],"48.4%,":[216],"compared":[217],"no":[223,237],"technique,":[225],"while":[226],"contrast,":[228],"stride-based":[230],"global":[231],"history":[232],"buffer":[233],"makes":[236],"effects":[238],"improving":[240],"performance":[242],"these":[244],"sets.":[246],"use":[249],"GPUWattch":[251],"estimate":[253],"power":[255,259],"consumption,":[256],"increases":[260],"8.3%":[261],"average":[263],"11.8%,":[267],"but":[268],"total":[270],"energy":[271],"cost":[272],"drops":[273],"15.1%":[274],"average.":[276]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2023,"cited_by_count":2},{"year":2021,"cited_by_count":1},{"year":2019,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
