{"id":"https://openalex.org/W3149591378","doi":"https://doi.org/10.1109/cgo.2011.5764682","title":"Whole-function vectorization","display_name":"Whole-function vectorization","publication_year":2011,"publication_date":"2011-04-01","ids":{"openalex":"https://openalex.org/W3149591378","doi":"https://doi.org/10.1109/cgo.2011.5764682","mag":"3149591378"},"language":"en","primary_location":{"id":"doi:10.1109/cgo.2011.5764682","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cgo.2011.5764682","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Symposium on Code Generation and Optimization (CGO 2011)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5039836242","display_name":"Ralf Karrenberg","orcid":null},"institutions":[{"id":"https://openalex.org/I91712215","display_name":"Saarland University","ror":"https://ror.org/01jdpyv68","country_code":"DE","type":"education","lineage":["https://openalex.org/I91712215"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Ralf Karrenberg","raw_affiliation_strings":["University of Saarland, Germany"],"affiliations":[{"raw_affiliation_string":"University of Saarland, Germany","institution_ids":["https://openalex.org/I91712215"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5018809145","display_name":"Sebastian Hack","orcid":"https://orcid.org/0000-0002-3387-2134"},"institutions":[{"id":"https://openalex.org/I91712215","display_name":"Saarland University","ror":"https://ror.org/01jdpyv68","country_code":"DE","type":"education","lineage":["https://openalex.org/I91712215"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Sebastian Hack","raw_affiliation_strings":["University of Saarland, Germany"],"affiliations":[{"raw_affiliation_string":"University of Saarland, Germany","institution_ids":["https://openalex.org/I91712215"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5039836242"],"corresponding_institution_ids":["https://openalex.org/I91712215"],"apc_list":null,"apc_paid":null,"fwci":5.4114,"has_fulltext":false,"cited_by_count":64,"citation_normalized_percentile":{"value":0.96317098,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"141","last_page":"150"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10743","display_name":"Software Testing and Debugging Techniques","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.9958000183105469,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.9055955410003662},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.8074593544006348},{"id":"https://openalex.org/keywords/compiler","display_name":"Compiler","score":0.7080004215240479},{"id":"https://openalex.org/keywords/simd","display_name":"SIMD","score":0.7038627862930298},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.6059730052947998},{"id":"https://openalex.org/keywords/instruction-set","display_name":"Instruction set","score":0.546760618686676},{"id":"https://openalex.org/keywords/vectorization","display_name":"Vectorization (mathematics)","score":0.5433330535888672},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.46920910477638245},{"id":"https://openalex.org/keywords/cuda","display_name":"CUDA","score":0.45261886715888977},{"id":"https://openalex.org/keywords/just-in-time-compilation","display_name":"Just-in-time compilation","score":0.43949267268180847},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.41146671772003174},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.2258395254611969}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.9055955410003662},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.8074593544006348},{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.7080004215240479},{"id":"https://openalex.org/C150552126","wikidata":"https://www.wikidata.org/wiki/Q339387","display_name":"SIMD","level":2,"score":0.7038627862930298},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.6059730052947998},{"id":"https://openalex.org/C202491316","wikidata":"https://www.wikidata.org/wiki/Q272683","display_name":"Instruction set","level":2,"score":0.546760618686676},{"id":"https://openalex.org/C41681595","wikidata":"https://www.wikidata.org/wiki/Q7917855","display_name":"Vectorization (mathematics)","level":2,"score":0.5433330535888672},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.46920910477638245},{"id":"https://openalex.org/C2778119891","wikidata":"https://www.wikidata.org/wiki/Q477690","display_name":"CUDA","level":2,"score":0.45261886715888977},{"id":"https://openalex.org/C76782552","wikidata":"https://www.wikidata.org/wiki/Q110546","display_name":"Just-in-time compilation","level":3,"score":0.43949267268180847},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.41146671772003174},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.2258395254611969}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cgo.2011.5764682","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cgo.2011.5764682","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Symposium on Code Generation and Optimization (CGO 2011)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320323322","display_name":"Universit\u00e4t des Saarlandes","ror":"https://ror.org/01jdpyv68"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":30,"referenced_works":["https://openalex.org/W127897580","https://openalex.org/W1591319746","https://openalex.org/W1593435500","https://openalex.org/W1966324811","https://openalex.org/W1975166067","https://openalex.org/W1976470975","https://openalex.org/W2064810595","https://openalex.org/W2078508340","https://openalex.org/W2078862445","https://openalex.org/W2083804777","https://openalex.org/W2099455734","https://openalex.org/W2101811680","https://openalex.org/W2105256472","https://openalex.org/W2112482891","https://openalex.org/W2118031182","https://openalex.org/W2127324789","https://openalex.org/W2135736783","https://openalex.org/W2140311411","https://openalex.org/W2147423491","https://openalex.org/W2524681034","https://openalex.org/W3016220765","https://openalex.org/W4213172915","https://openalex.org/W4246166885","https://openalex.org/W4247913514","https://openalex.org/W4248145683","https://openalex.org/W6605292869","https://openalex.org/W6635567801","https://openalex.org/W6641587366","https://openalex.org/W6675526518","https://openalex.org/W6727534126"],"related_works":["https://openalex.org/W2566637483","https://openalex.org/W2127324789","https://openalex.org/W3024308452","https://openalex.org/W4244894488","https://openalex.org/W4285390450","https://openalex.org/W2366442643","https://openalex.org/W2090268225","https://openalex.org/W2021715972","https://openalex.org/W2766828645","https://openalex.org/W2761732860"],"abstract_inverted_index":{"Data-parallel":[0],"programming":[1],"languages":[2,16,19,28,37,83],"are":[3,14],"an":[4],"important":[5],"component":[6],"in":[7,20,114,121,126,134,139],"today's":[8],"parallel":[9],"computing":[10],"landscape.":[11],"Among":[12],"those":[13,36,60],"domain-specific":[15,131],"like":[17,29],"shading":[18],"graphics":[21],"(HLSL,":[22],"GLSL,":[23],"RenderMan,":[24],"etc.)":[25],"and":[26,47,65,96,155,159],"\u201cgeneral-purpose\u201d":[27],"CUDA":[30],"or":[31,69],"OpenCL.":[32],"Current":[33],"implementations":[34],"of":[35,59,80,149],"on":[38,42,84,104],"CPUs":[39],"solely":[40],"rely":[41],"multi-threading":[43],"to":[44],"implement":[45],"parallelism":[46,52],"ignore":[48],"the":[49,55,66,152],"additional":[50],"intra-core":[51],"provided":[53],"by":[54,109],"SIMD":[56,87],"instruction":[57,71,88],"set":[58],"processors":[61],"(like":[62],"Intel's":[63],"SSE":[64],"upcoming":[67],"AVX":[68],"Larrabee":[70],"sets).":[72],"In":[73],"this":[74],"paper,":[75],"we":[76],"discuss":[77],"several":[78],"aspects":[79],"implementing":[81],"dataparallel":[82],"machines":[85],"with":[86],"sets.":[89],"Our":[90],"main":[91],"contribution":[92],"is":[93],"a":[94,110,127,130,140],"language-":[95],"platform-independent":[97],"code":[98,107],"transformation":[99],"that":[100],"performs":[101],"whole-function":[102],"vectorization":[103],"low-level":[105],"intermediate":[106],"given":[108],"control":[111],"flow":[112],"graph":[113],"SSA":[115],"form.":[116],"We":[117,144],"evaluate":[118],"our":[119],"technique":[120],"two":[122],"scenarios:":[123],"First,":[124],"incorporated":[125],"compiler":[128],"for":[129,151,161],"language":[132],"used":[133],"realtime":[135],"ray":[136,153],"tracing.":[137],"Second,":[138],"stand-alone":[141],"OpenCL":[142,163],"driver.":[143],"observe":[145],"average":[146],"speedup":[147],"factors":[148,156],"3.9":[150],"tracer":[154],"between":[157],"0.6":[158],"5.2":[160],"different":[162],"kernels.":[164]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":2},{"year":2018,"cited_by_count":4},{"year":2017,"cited_by_count":6},{"year":2016,"cited_by_count":6},{"year":2015,"cited_by_count":14},{"year":2014,"cited_by_count":6},{"year":2013,"cited_by_count":8},{"year":2012,"cited_by_count":7}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
