{"id":"https://openalex.org/W2529597500","doi":"https://doi.org/10.1109/iiswc.2016.7581278","title":"GPU concurrency choices in graph analytics","display_name":"GPU concurrency choices in graph analytics","publication_year":2016,"publication_date":"2016-09-01","ids":{"openalex":"https://openalex.org/W2529597500","doi":"https://doi.org/10.1109/iiswc.2016.7581278","mag":"2529597500"},"language":"en","primary_location":{"id":"doi:10.1109/iiswc.2016.7581278","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iiswc.2016.7581278","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 IEEE International Symposium on Workload Characterization (IISWC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5023088436","display_name":"Masab Ahmad","orcid":"https://orcid.org/0000-0001-7786-3558"},"institutions":[{"id":"https://openalex.org/I140172145","display_name":"University of Connecticut","ror":"https://ror.org/02der9h97","country_code":"US","type":"education","lineage":["https://openalex.org/I140172145"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Masab Ahmad","raw_affiliation_strings":["University of Connecticut, Storrs, CT, USA"],"affiliations":[{"raw_affiliation_string":"University of Connecticut, Storrs, CT, USA","institution_ids":["https://openalex.org/I140172145"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5048129220","display_name":"Omer Khan","orcid":"https://orcid.org/0000-0001-6293-7403"},"institutions":[{"id":"https://openalex.org/I140172145","display_name":"University of Connecticut","ror":"https://ror.org/02der9h97","country_code":"US","type":"education","lineage":["https://openalex.org/I140172145"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Omer Khan","raw_affiliation_strings":["University of Connecticut, Storrs, CT, USA"],"affiliations":[{"raw_affiliation_string":"University of Connecticut, Storrs, CT, USA","institution_ids":["https://openalex.org/I140172145"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5023088436"],"corresponding_institution_ids":["https://openalex.org/I140172145"],"apc_list":null,"apc_paid":null,"fwci":1.002,"has_fulltext":false,"cited_by_count":14,"citation_normalized_percentile":{"value":0.83412211,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":"11","issue":null,"first_page":"1","last_page":"10"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12292","display_name":"Graph Theory and Algorithms","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12292","display_name":"Graph Theory and Algorithms","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.9958000183105469,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8815230131149292},{"id":"https://openalex.org/keywords/concurrency","display_name":"Concurrency","score":0.6630824208259583},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.6577866077423096},{"id":"https://openalex.org/keywords/bulk-synchronous-parallel","display_name":"Bulk synchronous parallel","score":0.5388581156730652},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.5148417353630066},{"id":"https://openalex.org/keywords/thread","display_name":"Thread (computing)","score":0.4976241886615753},{"id":"https://openalex.org/keywords/analytics","display_name":"Analytics","score":0.42876097559928894},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.42560523748397827},{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.4171290993690491},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.4118473529815674},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.4083763062953949},{"id":"https://openalex.org/keywords/parallel-algorithm","display_name":"Parallel algorithm","score":0.2037428319454193},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.14541873335838318},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.11309829354286194},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.10587042570114136}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8815230131149292},{"id":"https://openalex.org/C193702766","wikidata":"https://www.wikidata.org/wiki/Q1414548","display_name":"Concurrency","level":2,"score":0.6630824208259583},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6577866077423096},{"id":"https://openalex.org/C156891508","wikidata":"https://www.wikidata.org/wiki/Q1004114","display_name":"Bulk synchronous parallel","level":3,"score":0.5388581156730652},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.5148417353630066},{"id":"https://openalex.org/C138101251","wikidata":"https://www.wikidata.org/wiki/Q213092","display_name":"Thread (computing)","level":2,"score":0.4976241886615753},{"id":"https://openalex.org/C79158427","wikidata":"https://www.wikidata.org/wiki/Q485396","display_name":"Analytics","level":2,"score":0.42876097559928894},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.42560523748397827},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.4171290993690491},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.4118473529815674},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.4083763062953949},{"id":"https://openalex.org/C120373497","wikidata":"https://www.wikidata.org/wiki/Q1087987","display_name":"Parallel algorithm","level":2,"score":0.2037428319454193},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.14541873335838318},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.11309829354286194},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.10587042570114136}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iiswc.2016.7581278","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iiswc.2016.7581278","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 IEEE International Symposium on Workload Characterization (IISWC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Sustainable cities and communities","id":"https://metadata.un.org/sdg/11","score":0.44999998807907104}],"awards":[],"funders":[{"id":"https://openalex.org/F4320337628","display_name":"U.S. Naval Research Laboratory","ror":"https://ror.org/04d23a975"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":41,"referenced_works":["https://openalex.org/W164384110","https://openalex.org/W208012252","https://openalex.org/W1541729506","https://openalex.org/W1593868476","https://openalex.org/W1717365219","https://openalex.org/W1896298204","https://openalex.org/W1955235267","https://openalex.org/W1983005303","https://openalex.org/W1997162567","https://openalex.org/W2000041758","https://openalex.org/W2000873501","https://openalex.org/W2018658595","https://openalex.org/W2021211271","https://openalex.org/W2026354831","https://openalex.org/W2035080386","https://openalex.org/W2041470524","https://openalex.org/W2043135347","https://openalex.org/W2062140606","https://openalex.org/W2080592089","https://openalex.org/W2090278477","https://openalex.org/W2096544401","https://openalex.org/W2100218206","https://openalex.org/W2107173440","https://openalex.org/W2112681514","https://openalex.org/W2115148068","https://openalex.org/W2146591355","https://openalex.org/W2147370410","https://openalex.org/W2158908968","https://openalex.org/W2160276892","https://openalex.org/W2160428323","https://openalex.org/W2169049902","https://openalex.org/W2169880332","https://openalex.org/W2274190190","https://openalex.org/W2319071579","https://openalex.org/W2474844316","https://openalex.org/W2951135776","https://openalex.org/W3004555699","https://openalex.org/W3006138624","https://openalex.org/W6608435233","https://openalex.org/W6635451513","https://openalex.org/W6677111876"],"related_works":["https://openalex.org/W4390608645","https://openalex.org/W4247566972","https://openalex.org/W2960264696","https://openalex.org/W3090563135","https://openalex.org/W2497432351","https://openalex.org/W4206777497","https://openalex.org/W4233347783","https://openalex.org/W2910064364","https://openalex.org/W4255224757","https://openalex.org/W2499527417"],"abstract_inverted_index":{"Graph":[0],"analytics":[1],"is":[2,69,154,165,176],"becoming":[3],"ever":[4],"more":[5],"ubiquitous":[6],"in":[7,14,20,28,54,93],"today's":[8],"world.":[9],"However,":[10,83],"situational":[11],"dynamic":[12],"changes":[13,19],"input":[15,117],"graphs,":[16],"such":[17,62],"as":[18,63],"traffic":[21],"and":[22,40],"weather":[23],"patterns,":[24],"lead":[25],"to":[26,35,47,73,88,140,167],"variations":[27,85],"concurrency.":[29,174],"Moreover,":[30,149],"graph":[31,76,109],"algorithms":[32,77],"are":[33,86,134],"known":[34],"have":[36],"data":[37],"dependent":[38],"loops":[39],"fine-grain":[41],"synchronization":[42],"that":[43,122,144,170,179],"makes":[44],"them":[45],"hard":[46],"scale":[48],"on":[49,79,112,136],"parallel":[50],"machines.":[51,82],"Recent":[52],"trends":[53],"computing":[55],"indicate":[56],"the":[57,157,184],"rise":[58],"of":[59,70,104,116,129,159],"massively-threaded":[60],"machines,":[61],"Graphic":[64],"Processing":[65],"Units":[66],"(GPUs).":[67],"It":[68,175],"paramount":[71],"importance":[72],"adopt":[74],"these":[75,80],"efficiently":[78],"GPU":[81,96,105,138,162,189],"concurrency":[84],"expected":[87],"play":[89],"a":[90,113,126,137,141,168],"formidable":[91],"role":[92],"achieving":[94],"good":[95],"performance.":[97,190],"This":[98],"paper":[99],"performs":[100],"an":[101,150],"in-depth":[102],"characterization":[103],"architectural":[106,186],"choices":[107,187],"for":[108],"benchmarks":[110],"executing":[111],"diverse":[114],"set":[115],"graphs.":[118],"The":[119],"analysis":[120],"shows":[121],"performance":[123,153],"improves":[124],"by":[125],"geometric":[127],"mean":[128],"40%":[130],"when":[131,156],"optimal":[132],"threads":[133,160],"spawned":[135],"relative":[139],"naive":[142],"choice":[143],"maximizes":[145],"total":[146],"thread":[147],"count.":[148],"additional":[151],"41%":[152],"achieved":[155],"number":[158],"per":[161],"work":[163],"group":[164],"reduced":[166],"setting":[169],"optimizes":[171],"exploitable":[172],"hardware":[173],"also":[177],"shown":[178],"algorithmic":[180],"auto-tuning":[181],"coupled":[182],"with":[183],"right":[185],"co-optimize":[188]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":2},{"year":2018,"cited_by_count":2},{"year":2017,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
