{"id":"https://openalex.org/W1971367716","doi":"https://doi.org/10.1109/ipdps.2014.59","title":"Nitro: A Framework for Adaptive Code Variant Tuning","display_name":"Nitro: A Framework for Adaptive Code Variant Tuning","publication_year":2014,"publication_date":"2014-05-01","ids":{"openalex":"https://openalex.org/W1971367716","doi":"https://doi.org/10.1109/ipdps.2014.59","mag":"1971367716"},"language":"en","primary_location":{"id":"doi:10.1109/ipdps.2014.59","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ipdps.2014.59","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2014 IEEE 28th International Parallel and Distributed Processing Symposium","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5033185286","display_name":"Saurav Muralidharan","orcid":"https://orcid.org/0000-0003-4024-3958"},"institutions":[{"id":"https://openalex.org/I223532165","display_name":"University of Utah","ror":"https://ror.org/03r0ha626","country_code":"US","type":"education","lineage":["https://openalex.org/I223532165"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Saurav Muralidharan","raw_affiliation_strings":["University of Utah, Salt Lake City, UT","University of Utah, Salt Lake City, UT, USA#TAB#"],"affiliations":[{"raw_affiliation_string":"University of Utah, Salt Lake City, UT","institution_ids":["https://openalex.org/I223532165"]},{"raw_affiliation_string":"University of Utah, Salt Lake City, UT, USA#TAB#","institution_ids":["https://openalex.org/I223532165"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057428462","display_name":"Manu Shantharam","orcid":null},"institutions":[{"id":"https://openalex.org/I223532165","display_name":"University of Utah","ror":"https://ror.org/03r0ha626","country_code":"US","type":"education","lineage":["https://openalex.org/I223532165"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Manu Shantharam","raw_affiliation_strings":["University of Utah, Salt Lake City, UT","University of Utah, Salt Lake City, UT, USA#TAB#"],"affiliations":[{"raw_affiliation_string":"University of Utah, Salt Lake City, UT","institution_ids":["https://openalex.org/I223532165"]},{"raw_affiliation_string":"University of Utah, Salt Lake City, UT, USA#TAB#","institution_ids":["https://openalex.org/I223532165"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030152493","display_name":"Mary Hall","orcid":"https://orcid.org/0000-0002-3058-7573"},"institutions":[{"id":"https://openalex.org/I223532165","display_name":"University of Utah","ror":"https://ror.org/03r0ha626","country_code":"US","type":"education","lineage":["https://openalex.org/I223532165"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mary Hall","raw_affiliation_strings":["University of Utah, Salt Lake City, UT","University of Utah, Salt Lake City, UT, USA#TAB#"],"affiliations":[{"raw_affiliation_string":"University of Utah, Salt Lake City, UT","institution_ids":["https://openalex.org/I223532165"]},{"raw_affiliation_string":"University of Utah, Salt Lake City, UT, USA#TAB#","institution_ids":["https://openalex.org/I223532165"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024606205","display_name":"Michael Garland","orcid":"https://orcid.org/0000-0001-6093-7602"},"institutions":[{"id":"https://openalex.org/I4210127875","display_name":"Nvidia (United States)","ror":"https://ror.org/03jdj4y14","country_code":"US","type":"company","lineage":["https://openalex.org/I4210127875"]},{"id":"https://openalex.org/I1304085615","display_name":"Nvidia (United Kingdom)","ror":"https://ror.org/02kr42612","country_code":"GB","type":"company","lineage":["https://openalex.org/I1304085615","https://openalex.org/I4210127875"]}],"countries":["GB","US"],"is_corresponding":false,"raw_author_name":"Michael Garland","raw_affiliation_strings":["NVIDIA Corporation, Santa Clara, CA","[Nvidia Corporation, Santa Clara, CA, USA]"],"affiliations":[{"raw_affiliation_string":"NVIDIA Corporation, Santa Clara, CA","institution_ids":["https://openalex.org/I4210127875"]},{"raw_affiliation_string":"[Nvidia Corporation, Santa Clara, CA, USA]","institution_ids":["https://openalex.org/I1304085615"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5066242985","display_name":"Bryan Catanzaro","orcid":"https://orcid.org/0000-0003-0034-7728"},"institutions":[{"id":"https://openalex.org/I4210127875","display_name":"Nvidia (United States)","ror":"https://ror.org/03jdj4y14","country_code":"US","type":"company","lineage":["https://openalex.org/I4210127875"]},{"id":"https://openalex.org/I1304085615","display_name":"Nvidia (United Kingdom)","ror":"https://ror.org/02kr42612","country_code":"GB","type":"company","lineage":["https://openalex.org/I1304085615","https://openalex.org/I4210127875"]}],"countries":["GB","US"],"is_corresponding":false,"raw_author_name":"Bryan Catanzaro","raw_affiliation_strings":["NVIDIA Corporation, Santa Clara, CA","[Nvidia Corporation, Santa Clara, CA, USA]"],"affiliations":[{"raw_affiliation_string":"NVIDIA Corporation, Santa Clara, CA","institution_ids":["https://openalex.org/I4210127875"]},{"raw_affiliation_string":"[Nvidia Corporation, Santa Clara, CA, USA]","institution_ids":["https://openalex.org/I1304085615"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5033185286"],"corresponding_institution_ids":["https://openalex.org/I223532165"],"apc_list":null,"apc_paid":null,"fwci":9.1363,"has_fulltext":false,"cited_by_count":65,"citation_normalized_percentile":{"value":0.98167249,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":100},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9940999746322632,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9911999702453613,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8297315835952759},{"id":"https://openalex.org/keywords/heuristics","display_name":"Heuristics","score":0.6978476643562317},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.5832499265670776},{"id":"https://openalex.org/keywords/implementation","display_name":"Implementation","score":0.5648730993270874},{"id":"https://openalex.org/keywords/programmer","display_name":"Programmer","score":0.5578521490097046},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5366816520690918},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5204475522041321},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.5061916708946228},{"id":"https://openalex.org/keywords/performance-tuning","display_name":"Performance tuning","score":0.4781016707420349},{"id":"https://openalex.org/keywords/source-code","display_name":"Source code","score":0.429871529340744},{"id":"https://openalex.org/keywords/sorting","display_name":"Sorting","score":0.4214444160461426},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.38894888758659363},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.38821548223495483},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.33481478691101074},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.11703011393547058}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8297315835952759},{"id":"https://openalex.org/C127705205","wikidata":"https://www.wikidata.org/wiki/Q5748245","display_name":"Heuristics","level":2,"score":0.6978476643562317},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.5832499265670776},{"id":"https://openalex.org/C26713055","wikidata":"https://www.wikidata.org/wiki/Q245962","display_name":"Implementation","level":2,"score":0.5648730993270874},{"id":"https://openalex.org/C2778514511","wikidata":"https://www.wikidata.org/wiki/Q1374194","display_name":"Programmer","level":2,"score":0.5578521490097046},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5366816520690918},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5204475522041321},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.5061916708946228},{"id":"https://openalex.org/C2777138346","wikidata":"https://www.wikidata.org/wiki/Q1714153","display_name":"Performance tuning","level":2,"score":0.4781016707420349},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.429871529340744},{"id":"https://openalex.org/C111696304","wikidata":"https://www.wikidata.org/wiki/Q2303697","display_name":"Sorting","level":2,"score":0.4214444160461426},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.38894888758659363},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.38821548223495483},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.33481478691101074},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.11703011393547058}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/ipdps.2014.59","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ipdps.2014.59","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2014 IEEE 28th International Parallel and Distributed Processing Symposium","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.671.5259","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.671.5259","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.cs.utah.edu/%7Esauravm/docs/nitro_ipdps2014.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320309480","display_name":"Nvidia","ror":"https://ror.org/03jdj4y14"},{"id":"https://openalex.org/F4320332180","display_name":"Defense Advanced Research Projects Agency","ror":"https://ror.org/02caytj08"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":59,"referenced_works":["https://openalex.org/W57989469","https://openalex.org/W113569212","https://openalex.org/W147926632","https://openalex.org/W1483287332","https://openalex.org/W1492936035","https://openalex.org/W1495775210","https://openalex.org/W1536852470","https://openalex.org/W1556531089","https://openalex.org/W1569090332","https://openalex.org/W1570754865","https://openalex.org/W1631114303","https://openalex.org/W1714472976","https://openalex.org/W1851570257","https://openalex.org/W1884140786","https://openalex.org/W1972209410","https://openalex.org/W1980714869","https://openalex.org/W1985291160","https://openalex.org/W1991591392","https://openalex.org/W2000873501","https://openalex.org/W2014244478","https://openalex.org/W2035080386","https://openalex.org/W2062060002","https://openalex.org/W2072707864","https://openalex.org/W2085118703","https://openalex.org/W2099625934","https://openalex.org/W2104512032","https://openalex.org/W2106057110","https://openalex.org/W2107699930","https://openalex.org/W2112502633","https://openalex.org/W2121546953","https://openalex.org/W2124244761","https://openalex.org/W2126793563","https://openalex.org/W2128853364","https://openalex.org/W2130289795","https://openalex.org/W2135682468","https://openalex.org/W2136628731","https://openalex.org/W2136952590","https://openalex.org/W2148603752","https://openalex.org/W2153635508","https://openalex.org/W2154786353","https://openalex.org/W2158626113","https://openalex.org/W2161938901","https://openalex.org/W2314944927","https://openalex.org/W2903158431","https://openalex.org/W3003751469","https://openalex.org/W3145506805","https://openalex.org/W3152199537","https://openalex.org/W4243796884","https://openalex.org/W4247050054","https://openalex.org/W4251512373","https://openalex.org/W6604649183","https://openalex.org/W6629097924","https://openalex.org/W6629236817","https://openalex.org/W6637469547","https://openalex.org/W6639344521","https://openalex.org/W6678476493","https://openalex.org/W6679013332","https://openalex.org/W6682805176","https://openalex.org/W6764477354"],"related_works":["https://openalex.org/W2379153735","https://openalex.org/W2046172023","https://openalex.org/W2170146914","https://openalex.org/W2972896947","https://openalex.org/W2083974823","https://openalex.org/W2355105570","https://openalex.org/W2072751097","https://openalex.org/W4237177615","https://openalex.org/W2289257917","https://openalex.org/W3007026952"],"abstract_inverted_index":{"Autotuning":[0],"systems":[1],"intelligently":[2],"navigate":[3],"a":[4,11,20,30,50,83,93],"search":[5],"space":[6],"of":[7,10,38,44,72,129,132],"possible":[8],"implementations":[9,43],"computation":[12],"to":[13,56,81,103],"find":[14],"the":[15,45,65,70,101,105,130],"implementation(s)":[16],"that":[17,35,53,63,91,146],"best":[18],"meets":[19],"specific":[21],"optimization":[22],"criteria,":[23],"usually":[24],"performance.":[25],"This":[26],"paper":[27],"describes":[28],"Nitro,":[29],"programmer-directed":[31],"auto":[32],"tuning":[33,37],"framework":[34],"facilitates":[36],"code":[39,58],"variants,":[40],"or":[41],"alternative":[42],"same":[46],"computation.":[47],"Nitro":[48,98,145],"provides":[49],"library":[51],"interface":[52],"permits":[54],"programmers":[55],"express":[57],"variants":[59,73,125,133],"along":[60],"with":[61,110],"meta-information":[62],"aids":[64],"system":[66],"in":[67,144],"selecting":[68],"among":[69],"set":[71],"at":[74],"run":[75],"time.":[76],"Machine":[77],"learning":[78],"is":[79,96],"employed":[80],"build":[82],"model":[84,102],"through":[85,135],"training":[86,149],"on":[87],"this":[88],"meta-information,":[89],"so":[90],"when":[92],"new":[94],"input":[95],"presented,":[97],"can":[99],"consult":[100],"select":[104],"appropriate":[106],"variant.":[107],"In":[108],"experiments":[109],"five":[111],"real-world":[112],"irregular":[113],"GPU":[114],"benchmarks":[115],"from":[116],"sparse":[117],"numerical":[118],"methods,":[119],"graph":[120],"computations":[121],"and":[122,142,151],"sorting,":[123],"Nitro-tuned":[124],"achieve":[126],"over":[127],"93%":[128],"performance":[131],"selected":[134],"exhaustive":[136],"search.":[137],"Further,":[138],"we":[139],"describe":[140],"optimizations":[141],"heuristics":[143],"substantially":[147],"reduce":[148],"time":[150],"other":[152],"overheads.":[153]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":3},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":5},{"year":2020,"cited_by_count":10},{"year":2019,"cited_by_count":5},{"year":2018,"cited_by_count":10},{"year":2017,"cited_by_count":10},{"year":2016,"cited_by_count":14},{"year":2015,"cited_by_count":5}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
