{"id":"https://openalex.org/W1968723134","doi":"https://doi.org/10.1145/1188455.1188672","title":"S07---GPGPU","display_name":"S07---GPGPU","publication_year":2006,"publication_date":"2006-01-01","ids":{"openalex":"https://openalex.org/W1968723134","doi":"https://doi.org/10.1145/1188455.1188672","mag":"1968723134"},"language":"en","primary_location":{"id":"doi:10.1145/1188455.1188672","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1188455.1188672","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2006 ACM/IEEE conference on Supercomputing  - SC '06","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5039425451","display_name":"David Luebke","orcid":"https://orcid.org/0000-0002-8206-5785"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"David Luebke","raw_affiliation_strings":[""],"affiliations":[{"raw_affiliation_string":"","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021480559","display_name":"Mark Harris","orcid":"https://orcid.org/0000-0003-3537-6211"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mark Harris","raw_affiliation_strings":[""],"affiliations":[{"raw_affiliation_string":"","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049041008","display_name":"Naga K. Govindaraju","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Naga Govindaraju","raw_affiliation_strings":[""],"affiliations":[{"raw_affiliation_string":"","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087647732","display_name":"Aaron Lefohn","orcid":"https://orcid.org/0009-0002-6526-0922"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Aaron Lefohn","raw_affiliation_strings":[""],"affiliations":[{"raw_affiliation_string":"","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108461485","display_name":"Mike Houston","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mike Houston","raw_affiliation_strings":[""],"affiliations":[{"raw_affiliation_string":"","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028662746","display_name":"John D. Owens","orcid":"https://orcid.org/0000-0001-6582-8237"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"John Owens","raw_affiliation_strings":[""],"affiliations":[{"raw_affiliation_string":"","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112106776","display_name":"Mark Segal","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mark Segal","raw_affiliation_strings":[""],"affiliations":[{"raw_affiliation_string":"","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038314088","display_name":"Matthew Papakipos","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Matthew Papakipos","raw_affiliation_strings":[""],"affiliations":[{"raw_affiliation_string":"","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5020493351","display_name":"Ian Buck","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ian Buck","raw_affiliation_strings":[""],"affiliations":[{"raw_affiliation_string":"","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5039425451"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":7.78650591,"has_fulltext":false,"cited_by_count":147,"citation_normalized_percentile":{"value":0.97993311,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"208","last_page":"208"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9969000220298767,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9969000220298767,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12292","display_name":"Graph Theory and Algorithms","score":0.9921000003814697,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9787999987602234,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/general-purpose-computing-on-graphics-processing-units","display_name":"General-purpose computing on graphics processing units","score":0.8703254461288452},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8571764826774597},{"id":"https://openalex.org/keywords/graphics","display_name":"Graphics","score":0.7078257203102112},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.6604098081588745},{"id":"https://openalex.org/keywords/real-time-computer-graphics","display_name":"Real-time computer graphics","score":0.5666748285293579},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.5569682121276855},{"id":"https://openalex.org/keywords/graphics-hardware","display_name":"Graphics hardware","score":0.47499194741249084},{"id":"https://openalex.org/keywords/memory-bandwidth","display_name":"Memory bandwidth","score":0.4537017047405243},{"id":"https://openalex.org/keywords/cuda","display_name":"CUDA","score":0.42433395981788635},{"id":"https://openalex.org/keywords/instruction-set","display_name":"Instruction set","score":0.4196156859397888},{"id":"https://openalex.org/keywords/simd","display_name":"SIMD","score":0.4184392988681793},{"id":"https://openalex.org/keywords/coprocessor","display_name":"Coprocessor","score":0.41304126381874084},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.34258270263671875},{"id":"https://openalex.org/keywords/computer-graphics","display_name":"Computer graphics (images)","score":0.3068638741970062},{"id":"https://openalex.org/keywords/3d-computer-graphics","display_name":"3D computer graphics","score":0.22931483387947083}],"concepts":[{"id":"https://openalex.org/C50630238","wikidata":"https://www.wikidata.org/wiki/Q971505","display_name":"General-purpose computing on graphics processing units","level":3,"score":0.8703254461288452},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8571764826774597},{"id":"https://openalex.org/C21442007","wikidata":"https://www.wikidata.org/wiki/Q1027879","display_name":"Graphics","level":2,"score":0.7078257203102112},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.6604098081588745},{"id":"https://openalex.org/C537207887","wikidata":"https://www.wikidata.org/wiki/Q2816483","display_name":"Real-time computer graphics","level":4,"score":0.5666748285293579},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.5569682121276855},{"id":"https://openalex.org/C18945957","wikidata":"https://www.wikidata.org/wiki/Q5597193","display_name":"Graphics hardware","level":3,"score":0.47499194741249084},{"id":"https://openalex.org/C188045654","wikidata":"https://www.wikidata.org/wiki/Q17148339","display_name":"Memory bandwidth","level":2,"score":0.4537017047405243},{"id":"https://openalex.org/C2778119891","wikidata":"https://www.wikidata.org/wiki/Q477690","display_name":"CUDA","level":2,"score":0.42433395981788635},{"id":"https://openalex.org/C202491316","wikidata":"https://www.wikidata.org/wiki/Q272683","display_name":"Instruction set","level":2,"score":0.4196156859397888},{"id":"https://openalex.org/C150552126","wikidata":"https://www.wikidata.org/wiki/Q339387","display_name":"SIMD","level":2,"score":0.4184392988681793},{"id":"https://openalex.org/C86111242","wikidata":"https://www.wikidata.org/wiki/Q859595","display_name":"Coprocessor","level":2,"score":0.41304126381874084},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.34258270263671875},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.3068638741970062},{"id":"https://openalex.org/C66629338","wikidata":"https://www.wikidata.org/wiki/Q189177","display_name":"3D computer graphics","level":3,"score":0.22931483387947083}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/1188455.1188672","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1188455.1188672","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2006 ACM/IEEE conference on Supercomputing  - SC '06","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2393747601","https://openalex.org/W2796337470","https://openalex.org/W2120385681","https://openalex.org/W2171605838","https://openalex.org/W1509422975","https://openalex.org/W82742382","https://openalex.org/W4249671011","https://openalex.org/W2763192925","https://openalex.org/W2046434380","https://openalex.org/W2141194949"],"abstract_inverted_index":{"The":[0],"graphics":[1,19,49,88,146],"processor":[2],"(GPU)":[3],"on":[4,61,76,87,142],"today's":[5],"commodity":[6],"video":[7],"cards":[8],"has":[9],"evolved":[10],"into":[11,127],"an":[12,68],"extremely":[13],"powerful":[14],"and":[15,25,39,103,108,120],"flexible":[16],"processor.":[17],"Modern":[18],"architectures":[20],"provide":[21,125],"tremendous":[22],"memory":[23],"bandwidth":[24],"computational":[26,53,93],"horsepower,":[27],"with":[28],"dozens":[29],"of":[30,70,84,116,139,145],"fully":[31],"programmable":[32],"shading":[33],"units":[34],"that":[35],"support":[36],"vector":[37],"operations":[38],"IEEE":[40],"floating":[41],"point":[42],"precision.":[43],"High-level":[44],"languages":[45],"have":[46,65],"emerged":[47],"for":[48,58],"hardware,":[50],"making":[51],"this":[52,122],"power":[54],"accessible.":[55],"GPGPU":[56,63,132],"stands":[57],"\"General-Purpose":[59],"Computation":[60],"GPUs\".":[62],"researchers":[64],"achieved":[66],"over":[67,73],"order":[69],"magnitude":[71],"speedup":[72],"modern":[74],"CPUs":[75],"some":[77],"non-graphics":[78],"problems.This":[79],"course":[80],"provides":[81],"detailed":[82],"coverage":[83],"general-purpose":[85,143],"computation":[86],"hardware.":[89,147],"We":[90,113],"emphasize":[91],"core":[92],"building":[94],"blocks,":[95],"ranging":[96],"from":[97],"linear":[98],"algebra":[99],"to":[100,124,129],"database":[101],"queries,":[102],"review":[104],"the":[105],"tools,":[106],"perils,":[107],"strategies":[109],"in":[110],"GPU":[111,117],"programming.":[112],"present":[114,136],"analysis":[115,123],"performance":[118],"characteristics,":[119],"use":[121],"insight":[126],"how":[128],"build":[130],"efficient":[131],"algorithms.":[133],"Finally":[134],"we":[135],"a":[137],"set":[138],"case":[140],"studies":[141],"applications":[144]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":4},{"year":2020,"cited_by_count":6},{"year":2019,"cited_by_count":3},{"year":2017,"cited_by_count":4},{"year":2016,"cited_by_count":9},{"year":2015,"cited_by_count":16},{"year":2014,"cited_by_count":14},{"year":2013,"cited_by_count":8},{"year":2012,"cited_by_count":11}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2016-06-24T00:00:00"}
