{"id":"https://openalex.org/W2613196900","doi":"https://doi.org/10.1145/3078155.3078178","title":"Modeling Explicit SIMD Programming With Subgroup Functions","display_name":"Modeling Explicit SIMD Programming With Subgroup Functions","publication_year":2017,"publication_date":"2017-05-10","ids":{"openalex":"https://openalex.org/W2613196900","doi":"https://doi.org/10.1145/3078155.3078178","mag":"2613196900"},"language":"en","primary_location":{"id":"doi:10.1145/3078155.3078178","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3078155.3078178","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 5th International Workshop on OpenCL","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5016139025","display_name":"Ben Ashbaugh","orcid":"https://orcid.org/0009-0003-1511-2021"},"institutions":[{"id":"https://openalex.org/I4210158342","display_name":"Intel (United Kingdom)","ror":"https://ror.org/058cxws58","country_code":"GB","type":"company","lineage":["https://openalex.org/I1343180700","https://openalex.org/I4210158342"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Ben Ashbaugh","raw_affiliation_strings":["Intel Corporation"],"affiliations":[{"raw_affiliation_string":"Intel Corporation","institution_ids":["https://openalex.org/I4210158342"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5046136666","display_name":"Biju George","orcid":null},"institutions":[{"id":"https://openalex.org/I4210158342","display_name":"Intel (United Kingdom)","ror":"https://ror.org/058cxws58","country_code":"GB","type":"company","lineage":["https://openalex.org/I1343180700","https://openalex.org/I4210158342"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Biju George","raw_affiliation_strings":["Intel Corporation"],"affiliations":[{"raw_affiliation_string":"Intel Corporation","institution_ids":["https://openalex.org/I4210158342"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5016139025"],"corresponding_institution_ids":["https://openalex.org/I4210158342"],"apc_list":null,"apc_paid":null,"fwci":0.2253,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.46707941,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"4"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10904","display_name":"Embedded Systems Design Techniques","score":0.9926999807357788,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11522","display_name":"VLSI and FPGA Design Techniques","score":0.9886000156402588,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6765509843826294},{"id":"https://openalex.org/keywords/simd","display_name":"SIMD","score":0.5314815044403076},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.4505782425403595},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.37939703464508057}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6765509843826294},{"id":"https://openalex.org/C150552126","wikidata":"https://www.wikidata.org/wiki/Q339387","display_name":"SIMD","level":2,"score":0.5314815044403076},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.4505782425403595},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.37939703464508057}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3078155.3078178","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3078155.3078178","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 5th International Workshop on OpenCL","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","score":0.44999998807907104,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":1,"referenced_works":["https://openalex.org/W2124993854"],"related_works":["https://openalex.org/W1439745913","https://openalex.org/W1584265037","https://openalex.org/W2009882312","https://openalex.org/W1515082385","https://openalex.org/W1585350690","https://openalex.org/W3096209535","https://openalex.org/W2008876287","https://openalex.org/W1496703677","https://openalex.org/W3005521981","https://openalex.org/W4245302940"],"abstract_inverted_index":{"Traditionally,":[0],"programs":[1],"that":[2,31],"run":[3],"on":[4,65],"an":[5],"OpenCL\u2122":[6],"device":[7],"are":[8],"written":[9],"as":[10],"\"implicit":[11,96],"SIMD\"":[12,78,97],"(Single":[13,19],"Instruction,":[14,20],"Multiple":[15,21],"Data)":[16],"or":[17],"\"SIMT\"":[18],"Thread)":[22],"kernels.":[23,110],"This":[24,81],"is":[25,45],"a":[26,61,66,75],"convenient":[27],"and":[28,104],"powerful":[29],"representation":[30],"can":[32],"target":[33],"massively":[34],"parallel":[35,41],"OpenCL":[36,54,98,109],"devices":[37],"without":[38],"writing":[39],"tricky":[40],"code,":[42],"but":[43],"it":[44],"insufficient":[46],"to":[47,90,100,108],"optimally":[48],"represent":[49,91],"some":[50,53],"features":[51],"of":[52,68,74],"devices.":[55],"In":[56],"particular,":[57],"\"block":[58],"operations\",":[59],"where":[60],"single":[62],"operation":[63],"works":[64],"collection":[67],"data":[69],"items,":[70],"have":[71],"required":[72],"use":[73],"trickier":[76],"\"explicit":[77],"programming":[79],"paradigm.":[80],"paper":[82],"describes":[83],"how":[84],"subgroup":[85],"built-in":[86],"functions":[87],"were":[88],"used":[89],"block":[92],"operations":[93],"in":[94],"traditional":[95],"kernels,":[99],"improve":[101],"kernel":[102],"efficiency":[103],"add":[105],"new":[106],"capabilities":[107]},"counts_by_year":[{"year":2019,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
