{"id":"https://openalex.org/W2001784723","doi":"https://doi.org/10.1145/2254064.2254067","title":"Adaptive input-aware compilation for graphics engines","display_name":"Adaptive input-aware compilation for graphics engines","publication_year":2012,"publication_date":"2012-06-11","ids":{"openalex":"https://openalex.org/W2001784723","doi":"https://doi.org/10.1145/2254064.2254067","mag":"2001784723"},"language":"en","primary_location":{"id":"doi:10.1145/2254064.2254067","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2254064.2254067","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 33rd ACM SIGPLAN Conference on Programming Language Design and Implementation","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5058642630","display_name":"Mehrzad Samadi","orcid":"https://orcid.org/0000-0002-3581-1255"},"institutions":[{"id":"https://openalex.org/I27837315","display_name":"University of Michigan\u2013Ann Arbor","ror":"https://ror.org/00jmfr291","country_code":"US","type":"education","lineage":["https://openalex.org/I27837315"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Mehrzad Samadi","raw_affiliation_strings":["University of Michigan, Ann Arbor, MI, USA"],"affiliations":[{"raw_affiliation_string":"University of Michigan, Ann Arbor, MI, USA","institution_ids":["https://openalex.org/I27837315"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071212745","display_name":"Amir Hormati","orcid":"https://orcid.org/0009-0002-5786-3301"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Amir Hormati","raw_affiliation_strings":["Microsoft Research, Redmond, WA, USA"],"affiliations":[{"raw_affiliation_string":"Microsoft Research, Redmond, WA, USA","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014835828","display_name":"Mojtaba Mehrara","orcid":null},"institutions":[{"id":"https://openalex.org/I4210127875","display_name":"Nvidia (United States)","ror":"https://ror.org/03jdj4y14","country_code":"US","type":"company","lineage":["https://openalex.org/I4210127875"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mojtaba Mehrara","raw_affiliation_strings":["NVIDIA Research, Santa Clara, CA, USA",", NVIDIA Research, Santa Clara, CA, USA"],"affiliations":[{"raw_affiliation_string":"NVIDIA Research, Santa Clara, CA, USA","institution_ids":["https://openalex.org/I4210127875"]},{"raw_affiliation_string":", NVIDIA Research, Santa Clara, CA, USA","institution_ids":["https://openalex.org/I4210127875"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065946847","display_name":"Janghaeng Lee","orcid":"https://orcid.org/0009-0005-1915-6077"},"institutions":[{"id":"https://openalex.org/I27837315","display_name":"University of Michigan\u2013Ann Arbor","ror":"https://ror.org/00jmfr291","country_code":"US","type":"education","lineage":["https://openalex.org/I27837315"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Janghaeng Lee","raw_affiliation_strings":["University of Michigan, Ann Arbor, MI, USA"],"affiliations":[{"raw_affiliation_string":"University of Michigan, Ann Arbor, MI, USA","institution_ids":["https://openalex.org/I27837315"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5002075773","display_name":"Scott Mahlke","orcid":"https://orcid.org/0000-0002-0438-0616"},"institutions":[{"id":"https://openalex.org/I27837315","display_name":"University of Michigan\u2013Ann Arbor","ror":"https://ror.org/00jmfr291","country_code":"US","type":"education","lineage":["https://openalex.org/I27837315"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Scott Mahlke","raw_affiliation_strings":["University of Michigan, Ann Arbor, MI, USA"],"affiliations":[{"raw_affiliation_string":"University of Michigan, Ann Arbor, MI, USA","institution_ids":["https://openalex.org/I27837315"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5058642630"],"corresponding_institution_ids":["https://openalex.org/I27837315"],"apc_list":null,"apc_paid":null,"fwci":7.2514,"has_fulltext":false,"cited_by_count":34,"citation_normalized_percentile":{"value":0.97414278,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"13","last_page":"22"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9926000237464905,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10904","display_name":"Embedded Systems Design Techniques","score":0.9916999936103821,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.9132993817329407},{"id":"https://openalex.org/keywords/software-portability","display_name":"Software portability","score":0.8149563074111938},{"id":"https://openalex.org/keywords/cuda","display_name":"CUDA","score":0.5625870227813721},{"id":"https://openalex.org/keywords/graphics","display_name":"Graphics","score":0.5193315744400024},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.49969959259033203},{"id":"https://openalex.org/keywords/memory-hierarchy","display_name":"Memory hierarchy","score":0.46326568722724915},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4183875322341919},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.36595600843429565},{"id":"https://openalex.org/keywords/cache","display_name":"Cache","score":0.2601924538612366},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.2504439949989319},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.17003238201141357}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.9132993817329407},{"id":"https://openalex.org/C63000827","wikidata":"https://www.wikidata.org/wiki/Q3080428","display_name":"Software portability","level":2,"score":0.8149563074111938},{"id":"https://openalex.org/C2778119891","wikidata":"https://www.wikidata.org/wiki/Q477690","display_name":"CUDA","level":2,"score":0.5625870227813721},{"id":"https://openalex.org/C21442007","wikidata":"https://www.wikidata.org/wiki/Q1027879","display_name":"Graphics","level":2,"score":0.5193315744400024},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.49969959259033203},{"id":"https://openalex.org/C2778100165","wikidata":"https://www.wikidata.org/wiki/Q1589327","display_name":"Memory hierarchy","level":3,"score":0.46326568722724915},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4183875322341919},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.36595600843429565},{"id":"https://openalex.org/C115537543","wikidata":"https://www.wikidata.org/wiki/Q165596","display_name":"Cache","level":2,"score":0.2601924538612366},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.2504439949989319},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.17003238201141357}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/2254064.2254067","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2254064.2254067","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 33rd ACM SIGPLAN Conference on Programming Language Design and Implementation","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.4399999976158142,"display_name":"Responsible consumption and production","id":"https://metadata.un.org/sdg/12"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":35,"referenced_works":["https://openalex.org/W1537323515","https://openalex.org/W1568192366","https://openalex.org/W1599739018","https://openalex.org/W1604019176","https://openalex.org/W1782174992","https://openalex.org/W1976458646","https://openalex.org/W1980225486","https://openalex.org/W1987588924","https://openalex.org/W1991591392","https://openalex.org/W1992851788","https://openalex.org/W2016888570","https://openalex.org/W2032309817","https://openalex.org/W2065392434","https://openalex.org/W2098426571","https://openalex.org/W2111354435","https://openalex.org/W2122080725","https://openalex.org/W2129232868","https://openalex.org/W2130285523","https://openalex.org/W2134431066","https://openalex.org/W2134616937","https://openalex.org/W2138163628","https://openalex.org/W2138659362","https://openalex.org/W2140375692","https://openalex.org/W2157729530","https://openalex.org/W2159350554","https://openalex.org/W2159456929","https://openalex.org/W2159481344","https://openalex.org/W2160786443","https://openalex.org/W2163229756","https://openalex.org/W2165100134","https://openalex.org/W2167334577","https://openalex.org/W2170058712","https://openalex.org/W2170634604","https://openalex.org/W4231589243","https://openalex.org/W4255468259"],"related_works":["https://openalex.org/W3020739840","https://openalex.org/W2913998709","https://openalex.org/W3177128669","https://openalex.org/W4386875822","https://openalex.org/W4385574943","https://openalex.org/W2769189194","https://openalex.org/W1537323515","https://openalex.org/W2353852602","https://openalex.org/W2120249721","https://openalex.org/W4293390906"],"abstract_inverted_index":{"While":[0],"graphics":[1],"processing":[2],"units":[3],"(GPUs)":[4],"provide":[5],"low-cost":[6],"and":[7,45,113,124,140,170,197,228,232],"efficient":[8,134],"platforms":[9],"for":[10,61],"accelerating":[11],"high":[12],"performance":[13,19],"computations,":[14],"the":[15,36,117,137,151,157,167,201,206],"tedious":[16],"process":[17],"of":[18,31,76,120,136,150,181,205],"tuning":[20],"required":[21],"to":[22,28,35,92,132,226],"optimize":[23,229],"applications":[24,107,230],"is":[25,53,153,179],"an":[26,73,87],"obstacle":[27],"wider":[29],"adoption":[30],"GPUs.":[32,58],"In":[33,81],"addition":[34],"programmability":[37],"challenges":[38],"posed":[39],"by":[40],"GPU's":[41],"complex":[42],"memory":[43,138],"hierarchy":[44,139],"parallelism":[46],"model,":[47],"a":[48,62,67,77,109,146,163],"well-known":[49],"application":[50,152],"design":[51],"problem":[52],"target":[54],"portability":[55,99],"across":[56,219],"different":[57,220],"However,":[59],"even":[60],"single":[63],"GPU":[64,221],"target,":[65],"changing":[66],"program's":[68],"input":[69,98,121,195,202],"characteristics":[70],"can":[71,185],"make":[72,133],"already-optimized":[74],"implementation":[75],"program":[78,159],"perform":[79,162,186],"poorly.":[80],"this":[82,94,102],"work,":[83],"we":[84,212],"propose":[85],"Adaptic,":[86],"adaptive":[88],"input-aware":[89,128,215],"compilation":[90],"system":[91],"tackle":[93],"important,":[95],"yet":[96],"overlooked,":[97],"problem.":[100],"Using":[101],"system,":[103],"programmers":[104],"develop":[105],"their":[106,190],"in":[108],"high-level":[110],"streaming":[111],"language":[112],"let":[114],"Adaptic":[115,168,178],"undertake":[116],"difficult":[118],"task":[119],"portable":[122],"optimizations":[123,129],"code":[125],"generation.":[126],"Several":[127],"are":[130,217],"introduced":[131],"use":[135],"customize":[141],"thread":[142],"composition.":[143],"At":[144],"runtime,":[145],"properly":[147],"optimized":[148],"version":[149],"executed":[154],"based":[155],"on":[156,187],"actual":[158],"input.":[160],"We":[161],"head-to-head":[164],"comparison":[165],"between":[166],"generated":[169],"hand-optimized":[171,191,207],"CUDA":[172],"programs.":[173],"The":[174],"results":[175,216],"show":[176,213],"that":[177,184,214],"capable":[180],"generating":[182],"codes":[183],"par":[188],"with":[189],"counterparts":[192],"over":[193],"certain":[194],"ranges":[196],"outperform":[198],"them":[199,234],"when":[200],"falls":[203],"out":[204],"programs'":[208],"\"comfort":[209],"zone\".":[210],"Furthermore,":[211],"sustainable":[218],"targets":[222],"making":[223],"it":[224],"possible":[225],"write":[227],"once":[231],"run":[233],"anywhere.":[235]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":1},{"year":2017,"cited_by_count":2},{"year":2016,"cited_by_count":4},{"year":2015,"cited_by_count":7},{"year":2014,"cited_by_count":11},{"year":2013,"cited_by_count":6},{"year":2012,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
