{"id":"https://openalex.org/W2791759077","doi":"https://doi.org/10.1145/3168810","title":"SIMD intrinsics on managed language runtimes","display_name":"SIMD intrinsics on managed language runtimes","publication_year":2018,"publication_date":"2018-02-24","ids":{"openalex":"https://openalex.org/W2791759077","doi":"https://doi.org/10.1145/3168810","mag":"2791759077"},"language":"en","primary_location":{"id":"doi:10.1145/3168810","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3168810","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2018 International Symposium on Code Generation and Optimization","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5027784711","display_name":"Alen Stojanov","orcid":null},"institutions":[{"id":"https://openalex.org/I35440088","display_name":"ETH Zurich","ror":"https://ror.org/05a28rw58","country_code":"CH","type":"education","lineage":["https://openalex.org/I2799323385","https://openalex.org/I35440088"]}],"countries":["CH"],"is_corresponding":true,"raw_author_name":"Alen Stojanov","raw_affiliation_strings":["ETH Zurich, Switzerland"],"affiliations":[{"raw_affiliation_string":"ETH Zurich, Switzerland","institution_ids":["https://openalex.org/I35440088"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034625139","display_name":"Ivaylo Toskov","orcid":null},"institutions":[{"id":"https://openalex.org/I35440088","display_name":"ETH Zurich","ror":"https://ror.org/05a28rw58","country_code":"CH","type":"education","lineage":["https://openalex.org/I2799323385","https://openalex.org/I35440088"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Ivaylo Toskov","raw_affiliation_strings":["ETH Zurich, Switzerland"],"affiliations":[{"raw_affiliation_string":"ETH Zurich, Switzerland","institution_ids":["https://openalex.org/I35440088"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003153354","display_name":"Tiark Rompf","orcid":"https://orcid.org/0000-0002-2068-3238"},"institutions":[{"id":"https://openalex.org/I219193219","display_name":"Purdue University West Lafayette","ror":"https://ror.org/02dqehb95","country_code":"US","type":"education","lineage":["https://openalex.org/I219193219"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Tiark Rompf","raw_affiliation_strings":["Purdue University, USA"],"affiliations":[{"raw_affiliation_string":"Purdue University, USA","institution_ids":["https://openalex.org/I219193219"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5076407181","display_name":"Markus P\u00fcschel","orcid":"https://orcid.org/0000-0001-8834-8551"},"institutions":[{"id":"https://openalex.org/I35440088","display_name":"ETH Zurich","ror":"https://ror.org/05a28rw58","country_code":"CH","type":"education","lineage":["https://openalex.org/I2799323385","https://openalex.org/I35440088"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Markus P\u00fcschel","raw_affiliation_strings":["ETH Zurich, Switzerland"],"affiliations":[{"raw_affiliation_string":"ETH Zurich, Switzerland","institution_ids":["https://openalex.org/I35440088"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5027784711"],"corresponding_institution_ids":["https://openalex.org/I35440088"],"apc_list":null,"apc_paid":null,"fwci":2.0197,"has_fulltext":false,"cited_by_count":14,"citation_normalized_percentile":{"value":0.85798093,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"2","last_page":"15"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10715","display_name":"Distributed and Parallel Computing Systems","score":0.9973000288009644,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12127","display_name":"Software System Performance and Reliability","score":0.996999979019165,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.9114830493927002},{"id":"https://openalex.org/keywords/intrinsics","display_name":"Intrinsics","score":0.8830708861351013},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.6419072151184082},{"id":"https://openalex.org/keywords/simd","display_name":"SIMD","score":0.6409523487091064},{"id":"https://openalex.org/keywords/compiler","display_name":"Compiler","score":0.5869004726409912},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.5509190559387207},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.5119965672492981},{"id":"https://openalex.org/keywords/java","display_name":"Java","score":0.484253853559494},{"id":"https://openalex.org/keywords/just-in-time-compilation","display_name":"Just-in-time compilation","score":0.48202598094940186},{"id":"https://openalex.org/keywords/metaprogramming","display_name":"Metaprogramming","score":0.4652819037437439}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.9114830493927002},{"id":"https://openalex.org/C2908650547","wikidata":"https://www.wikidata.org/wiki/Q20999234","display_name":"Intrinsics","level":2,"score":0.8830708861351013},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.6419072151184082},{"id":"https://openalex.org/C150552126","wikidata":"https://www.wikidata.org/wiki/Q339387","display_name":"SIMD","level":2,"score":0.6409523487091064},{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.5869004726409912},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.5509190559387207},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.5119965672492981},{"id":"https://openalex.org/C548217200","wikidata":"https://www.wikidata.org/wiki/Q251","display_name":"Java","level":2,"score":0.484253853559494},{"id":"https://openalex.org/C76782552","wikidata":"https://www.wikidata.org/wiki/Q110546","display_name":"Just-in-time compilation","level":3,"score":0.48202598094940186},{"id":"https://openalex.org/C35390924","wikidata":"https://www.wikidata.org/wiki/Q661075","display_name":"Metaprogramming","level":2,"score":0.4652819037437439}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3168810","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3168810","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2018 International Symposium on Code Generation and Optimization","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":24,"referenced_works":["https://openalex.org/W1498436455","https://openalex.org/W1567406606","https://openalex.org/W1986364436","https://openalex.org/W1988425770","https://openalex.org/W1991233955","https://openalex.org/W1999819296","https://openalex.org/W2003172590","https://openalex.org/W2004851214","https://openalex.org/W2021246880","https://openalex.org/W2059720667","https://openalex.org/W2071630526","https://openalex.org/W2085123413","https://openalex.org/W2094269821","https://openalex.org/W2099059741","https://openalex.org/W2111394443","https://openalex.org/W2119871735","https://openalex.org/W2143932292","https://openalex.org/W2147578933","https://openalex.org/W2154697693","https://openalex.org/W2233116163","https://openalex.org/W2533740594","https://openalex.org/W2647836899","https://openalex.org/W2741269719","https://openalex.org/W3028642772"],"related_works":["https://openalex.org/W4289638474","https://openalex.org/W2069504277","https://openalex.org/W2111180768","https://openalex.org/W4401454459","https://openalex.org/W2293666837","https://openalex.org/W2067411013","https://openalex.org/W2162270818","https://openalex.org/W4390503633","https://openalex.org/W2791759077","https://openalex.org/W4239295257"],"abstract_inverted_index":{"Managed":[0],"language":[1,127],"runtimes":[2],"such":[3],"as":[4,128],"the":[5,21,28,43,73,93,97,124,163,200,215],"Java":[6],"Virtual":[7],"Machine":[8],"(JVM)":[9],"provide":[10,155],"adequate":[11],"performance":[12],"for":[13,68,86],"a":[14,76,104,129,150],"wide":[15],"range":[16],"of":[17,27,49,75,82,131,159,183],"applications,":[18],"but":[19],"at":[20,116],"same":[22],"time,":[23],"they":[24],"lack":[25],"much":[26],"low-level":[29],"control":[30],"that":[31,46,107,166,180,198],"performance-minded":[32],"programmers":[33,109,121],"appreciate":[34],"in":[35,72,162],"languages":[36],"like":[37],"<pre>C/C++</pre>.":[38],"One":[39],"important":[40],"example":[41,145],"is":[42],"intrinsics":[44,71,94,172],"interface":[45],"exposes":[47],"instructions":[48],"SIMD":[50,171,184],"(Single":[51],"Instruction":[52],"Multiple":[53],"Data)":[54],"vector":[55,88,138],"ISAs":[56],"(Instruction":[57],"Set":[58],"Architectures).":[59],"In":[60,118],"this":[61,119,181],"paper":[62],"we":[63,90,102,148],"present":[64],"an":[65,144,156,195],"automatic":[66],"approach":[67,106,161],"including":[69],"native":[70,114,212],"runtime":[74],"managed":[77,216],"language.":[78],"Our":[79,177],"implementation":[80,158],"consists":[81],"two":[83],"parts.":[84],"First,":[85],"each":[87],"ISA,":[89],"automatically":[91],"generate":[92,111],"API":[95],"from":[96,173],"vendor-provided":[98],"XML":[99],"specification.":[100],"Second,":[101],"employ":[103],"metaprogramming":[105,186],"enables":[108,187],"to":[110,134,175,189],"and":[112,185,206,214],"load":[113],"code":[115,193,213],"runtime.":[117],"setting,":[120],"can":[122],"use":[123,146],"entire":[125],"high-level":[126,137],"kind":[130],"macro":[132],"system":[133],"define":[135],"new":[136],"APIs":[139],"with":[140],"zero":[141],"overhead.":[142],"As":[143],"case":[147],"show":[149],"variable":[151],"precision":[152],"API.":[153],"We":[154],"end-to-end":[157],"our":[160],"HotSpot":[164,202],"VM":[165],"supports":[167],"all":[168],"5912":[169],"Intel":[170],"<pre>MMX</pre>":[174],"<pre>AVX-512</pre>.":[176],"benchmarks":[178],"demonstrate":[179],"combination":[182],"developers":[188],"write":[190],"high-performance,":[191],"vectorized":[192,211],"on":[194],"unmodified":[196],"JVM":[197,217],"outperforms":[199],"auto-vectorizing":[201],"just-in-time":[203],"(JIT)":[204],"compiler":[205],"provides":[207],"tight":[208],"integration":[209],"between":[210],"ecosystem.":[218]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":4},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
