{"id":"https://openalex.org/W2579915854","doi":"https://doi.org/10.1145/3018743.3018744","title":"Simple, Accurate, Analytical Time Modeling and Optimal Tile Size Selection for GPGPU Stencils","display_name":"Simple, Accurate, Analytical Time Modeling and Optimal Tile Size Selection for GPGPU Stencils","publication_year":2017,"publication_date":"2017-01-26","ids":{"openalex":"https://openalex.org/W2579915854","doi":"https://doi.org/10.1145/3018743.3018744","mag":"2579915854"},"language":"en","primary_location":{"id":"doi:10.1145/3018743.3018744","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3018743.3018744","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 22nd ACM SIGPLAN Symposium on Principles and Practice of Parallel Programming","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5043311555","display_name":"Nirmal Prajapati","orcid":"https://orcid.org/0000-0002-7558-0340"},"institutions":[{"id":"https://openalex.org/I92446798","display_name":"Colorado State University","ror":"https://ror.org/03k1gpj17","country_code":"US","type":"education","lineage":["https://openalex.org/I92446798"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Nirmal Prajapati","raw_affiliation_strings":["Colorado State University, Fort Collins, CO, USA"],"affiliations":[{"raw_affiliation_string":"Colorado State University, Fort Collins, CO, USA","institution_ids":["https://openalex.org/I92446798"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026733593","display_name":"Waruna Ranasinghe","orcid":null},"institutions":[{"id":"https://openalex.org/I92446798","display_name":"Colorado State University","ror":"https://ror.org/03k1gpj17","country_code":"US","type":"education","lineage":["https://openalex.org/I92446798"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Waruna Ranasinghe","raw_affiliation_strings":["Colorado State University, Fort Collins, CO, USA"],"affiliations":[{"raw_affiliation_string":"Colorado State University, Fort Collins, CO, USA","institution_ids":["https://openalex.org/I92446798"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047953886","display_name":"Sanjay Rajopadhye","orcid":"https://orcid.org/0000-0002-4246-6066"},"institutions":[{"id":"https://openalex.org/I92446798","display_name":"Colorado State University","ror":"https://ror.org/03k1gpj17","country_code":"US","type":"education","lineage":["https://openalex.org/I92446798"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sanjay Rajopadhye","raw_affiliation_strings":["Colorado State University, Fort Collins, CO, USA"],"affiliations":[{"raw_affiliation_string":"Colorado State University, Fort Collins, CO, USA","institution_ids":["https://openalex.org/I92446798"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040381671","display_name":"Rumen Andonov","orcid":"https://orcid.org/0000-0003-4842-7102"},"institutions":[{"id":"https://openalex.org/I2802519937","display_name":"Institut de Recherche en Informatique et Syst\u00e8mes Al\u00e9atoires","ror":"https://ror.org/00myn0z94","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I1326498283","https://openalex.org/I205703379","https://openalex.org/I2802204017","https://openalex.org/I2802519937","https://openalex.org/I28221208","https://openalex.org/I4210127572","https://openalex.org/I4210159245","https://openalex.org/I56067802"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Rumen Andonov","raw_affiliation_strings":["IRISA, Rennes, France"],"affiliations":[{"raw_affiliation_string":"IRISA, Rennes, France","institution_ids":["https://openalex.org/I2802519937"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057625550","display_name":"Hristo Djidjev","orcid":"https://orcid.org/0000-0001-9286-8824"},"institutions":[{"id":"https://openalex.org/I4210131040","display_name":"Los Alamos National Security (United States)","ror":"https://ror.org/037ddaj94","country_code":"US","type":"company","lineage":["https://openalex.org/I4210131040"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Hristo Djidjev","raw_affiliation_strings":["LANL, Los Alamos, USA"],"affiliations":[{"raw_affiliation_string":"LANL, Los Alamos, USA","institution_ids":["https://openalex.org/I4210131040"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5055618037","display_name":"Tobias Grosser","orcid":"https://orcid.org/0000-0003-3874-6003"},"institutions":[{"id":"https://openalex.org/I35440088","display_name":"ETH Zurich","ror":"https://ror.org/05a28rw58","country_code":"CH","type":"education","lineage":["https://openalex.org/I2799323385","https://openalex.org/I35440088"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Tobias Grosser","raw_affiliation_strings":["ETH, Zurich, Switzerland"],"affiliations":[{"raw_affiliation_string":"ETH, Zurich, Switzerland","institution_ids":["https://openalex.org/I35440088"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5043311555"],"corresponding_institution_ids":["https://openalex.org/I92446798"],"apc_list":null,"apc_paid":null,"fwci":3.1544,"has_fulltext":false,"cited_by_count":17,"citation_normalized_percentile":{"value":0.93106322,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"163","last_page":"177"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12162","display_name":"Cellular Automata and Applications","score":0.9868000149726868,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/stencil","display_name":"Stencil","score":0.9249327778816223},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8398033976554871},{"id":"https://openalex.org/keywords/compiler","display_name":"Compiler","score":0.712218701839447},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.6684674024581909},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.6312747001647949},{"id":"https://openalex.org/keywords/general-purpose-computing-on-graphics-processing-units","display_name":"General-purpose computing on graphics processing units","score":0.6173601150512695},{"id":"https://openalex.org/keywords/tile","display_name":"Tile","score":0.6070135831832886},{"id":"https://openalex.org/keywords/simple","display_name":"Simple (philosophy)","score":0.57950359582901},{"id":"https://openalex.org/keywords/cuda","display_name":"CUDA","score":0.5390922427177429},{"id":"https://openalex.org/keywords/vendor","display_name":"Vendor","score":0.5346246361732483},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.514130175113678},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.4991309642791748},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.48380178213119507},{"id":"https://openalex.org/keywords/computational-science","display_name":"Computational science","score":0.3510188162326813},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.26126211881637573},{"id":"https://openalex.org/keywords/computer-graphics","display_name":"Computer graphics (images)","score":0.2420649528503418},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.16769477725028992},{"id":"https://openalex.org/keywords/graphics","display_name":"Graphics","score":0.13801616430282593}],"concepts":[{"id":"https://openalex.org/C76752949","wikidata":"https://www.wikidata.org/wiki/Q7607499","display_name":"Stencil","level":2,"score":0.9249327778816223},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8398033976554871},{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.712218701839447},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6684674024581909},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.6312747001647949},{"id":"https://openalex.org/C50630238","wikidata":"https://www.wikidata.org/wiki/Q971505","display_name":"General-purpose computing on graphics processing units","level":3,"score":0.6173601150512695},{"id":"https://openalex.org/C2780728851","wikidata":"https://www.wikidata.org/wiki/Q468402","display_name":"Tile","level":2,"score":0.6070135831832886},{"id":"https://openalex.org/C2780586882","wikidata":"https://www.wikidata.org/wiki/Q7520643","display_name":"Simple (philosophy)","level":2,"score":0.57950359582901},{"id":"https://openalex.org/C2778119891","wikidata":"https://www.wikidata.org/wiki/Q477690","display_name":"CUDA","level":2,"score":0.5390922427177429},{"id":"https://openalex.org/C2777338717","wikidata":"https://www.wikidata.org/wiki/Q1762621","display_name":"Vendor","level":2,"score":0.5346246361732483},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.514130175113678},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.4991309642791748},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.48380178213119507},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.3510188162326813},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.26126211881637573},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.2420649528503418},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.16769477725028992},{"id":"https://openalex.org/C21442007","wikidata":"https://www.wikidata.org/wiki/Q1027879","display_name":"Graphics","level":2,"score":0.13801616430282593},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0},{"id":"https://openalex.org/C162853370","wikidata":"https://www.wikidata.org/wiki/Q39809","display_name":"Marketing","level":1,"score":0.0},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.0},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C153349607","wikidata":"https://www.wikidata.org/wiki/Q36649","display_name":"Visual arts","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3018743.3018744","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3018743.3018744","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 22nd ACM SIGPLAN Symposium on Principles and Practice of Parallel Programming","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.46000000834465027,"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":66,"referenced_works":["https://openalex.org/W38784877","https://openalex.org/W76123042","https://openalex.org/W1503700136","https://openalex.org/W1504320321","https://openalex.org/W1513554765","https://openalex.org/W1514857085","https://openalex.org/W1561247983","https://openalex.org/W1567510187","https://openalex.org/W1571438983","https://openalex.org/W1825294837","https://openalex.org/W1963695588","https://openalex.org/W1964031104","https://openalex.org/W1964166152","https://openalex.org/W1967264375","https://openalex.org/W1968013322","https://openalex.org/W1970141743","https://openalex.org/W1973271197","https://openalex.org/W1973532523","https://openalex.org/W1979457157","https://openalex.org/W1987588924","https://openalex.org/W1993879355","https://openalex.org/W2003798513","https://openalex.org/W2028067303","https://openalex.org/W2032391783","https://openalex.org/W2034761517","https://openalex.org/W2039378765","https://openalex.org/W2050297469","https://openalex.org/W2055253125","https://openalex.org/W2055312318","https://openalex.org/W2070961300","https://openalex.org/W2077143534","https://openalex.org/W2084917734","https://openalex.org/W2085376012","https://openalex.org/W2095875205","https://openalex.org/W2097757554","https://openalex.org/W2097892124","https://openalex.org/W2100580246","https://openalex.org/W2104512032","https://openalex.org/W2107725926","https://openalex.org/W2111245822","https://openalex.org/W2113190809","https://openalex.org/W2119609467","https://openalex.org/W2120833345","https://openalex.org/W2121082877","https://openalex.org/W2124931755","https://openalex.org/W2129471558","https://openalex.org/W2129829929","https://openalex.org/W2135682468","https://openalex.org/W2144031643","https://openalex.org/W2146742876","https://openalex.org/W2149801340","https://openalex.org/W2151764765","https://openalex.org/W2153637321","https://openalex.org/W2154078685","https://openalex.org/W2154786353","https://openalex.org/W2167334577","https://openalex.org/W2171665936","https://openalex.org/W2212640437","https://openalex.org/W2983923412","https://openalex.org/W3196504174","https://openalex.org/W4213172915","https://openalex.org/W4245206864","https://openalex.org/W4255560897","https://openalex.org/W6630903078","https://openalex.org/W6633989748","https://openalex.org/W6643480586"],"related_works":["https://openalex.org/W1963859303","https://openalex.org/W2028798345","https://openalex.org/W2364044215","https://openalex.org/W2389600408","https://openalex.org/W240129890","https://openalex.org/W3048701459","https://openalex.org/W2149078538","https://openalex.org/W2080146221","https://openalex.org/W2370314112","https://openalex.org/W1912958759"],"abstract_inverted_index":{"Stencil":[0],"computations":[1],"are":[2,51],"an":[3],"important":[4],"class":[5],"of":[6,21,44],"compute":[7],"and":[8,17,27,31],"data":[9],"intensive":[10],"programs":[11],"that":[12,34,50],"occur":[13],"widely":[14],"in":[15],"scientific":[16],"engineeringapplications.":[18],"A":[19],"number":[20,43],"tools":[22],"use":[23],"sophisticated":[24],"tiling,":[25],"parallelization,":[26],"memory":[28],"mapping":[29],"strategies,":[30],"generate":[32],"code":[33,40],"relies":[35],"on":[36],"vendor-supplied":[37],"compilers.":[38],"This":[39],"has":[41],"a":[42],"parameters,":[45],"such":[46],"as":[47],"tile":[48],"sizes,":[49],"then":[52],"tuned":[53],"via":[54],"empirical":[55],"exploration.":[56]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":4},{"year":2018,"cited_by_count":7}],"updated_date":"2025-11-25T21:42:39.735039","created_date":"2025-10-10T00:00:00"}
