{"id":"https://openalex.org/W2566629575","doi":"https://doi.org/10.1145/3009837.3009846","title":"Rigorous floating-point mixed-precision tuning","display_name":"Rigorous floating-point mixed-precision tuning","publication_year":2016,"publication_date":"2016-12-22","ids":{"openalex":"https://openalex.org/W2566629575","doi":"https://doi.org/10.1145/3009837.3009846","mag":"2566629575"},"language":"en","primary_location":{"id":"doi:10.1145/3009837.3009846","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3009837.3009846","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 44th ACM SIGPLAN Symposium on Principles of Programming Languages","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5055448005","display_name":"Wei\u2010Fan Chiang","orcid":"https://orcid.org/0000-0002-9240-1404"},"institutions":[{"id":"https://openalex.org/I223532165","display_name":"University of Utah","ror":"https://ror.org/03r0ha626","country_code":"US","type":"education","lineage":["https://openalex.org/I223532165"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Wei-Fan Chiang","raw_affiliation_strings":["University of Utah, USA"],"affiliations":[{"raw_affiliation_string":"University of Utah, USA","institution_ids":["https://openalex.org/I223532165"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014970220","display_name":"Mark Baranowski","orcid":null},"institutions":[{"id":"https://openalex.org/I223532165","display_name":"University of Utah","ror":"https://ror.org/03r0ha626","country_code":"US","type":"education","lineage":["https://openalex.org/I223532165"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mark Baranowski","raw_affiliation_strings":["University of Utah, USA"],"affiliations":[{"raw_affiliation_string":"University of Utah, USA","institution_ids":["https://openalex.org/I223532165"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011013917","display_name":"Ian Briggs","orcid":"https://orcid.org/0000-0003-2454-2317"},"institutions":[{"id":"https://openalex.org/I223532165","display_name":"University of Utah","ror":"https://ror.org/03r0ha626","country_code":"US","type":"education","lineage":["https://openalex.org/I223532165"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ian Briggs","raw_affiliation_strings":["University of Utah, USA"],"affiliations":[{"raw_affiliation_string":"University of Utah, USA","institution_ids":["https://openalex.org/I223532165"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049517241","display_name":"Alexey Solovyev","orcid":"https://orcid.org/0000-0001-8058-5317"},"institutions":[{"id":"https://openalex.org/I223532165","display_name":"University of Utah","ror":"https://ror.org/03r0ha626","country_code":"US","type":"education","lineage":["https://openalex.org/I223532165"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Alexey Solovyev","raw_affiliation_strings":["University of Utah, USA"],"affiliations":[{"raw_affiliation_string":"University of Utah, USA","institution_ids":["https://openalex.org/I223532165"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069846379","display_name":"Ganesh Gopalakrishnan","orcid":"https://orcid.org/0000-0002-3705-0031"},"institutions":[{"id":"https://openalex.org/I223532165","display_name":"University of Utah","ror":"https://ror.org/03r0ha626","country_code":"US","type":"education","lineage":["https://openalex.org/I223532165"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ganesh Gopalakrishnan","raw_affiliation_strings":["University of Utah, USA"],"affiliations":[{"raw_affiliation_string":"University of Utah, USA","institution_ids":["https://openalex.org/I223532165"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5021217615","display_name":"Zvonimir Rakamari\u0107","orcid":"https://orcid.org/0000-0001-7946-0162"},"institutions":[{"id":"https://openalex.org/I223532165","display_name":"University of Utah","ror":"https://ror.org/03r0ha626","country_code":"US","type":"education","lineage":["https://openalex.org/I223532165"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zvonimir Rakamari\u0107","raw_affiliation_strings":["University of Utah, USA"],"affiliations":[{"raw_affiliation_string":"University of Utah, USA","institution_ids":["https://openalex.org/I223532165"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5055448005"],"corresponding_institution_ids":["https://openalex.org/I223532165"],"apc_list":null,"apc_paid":null,"fwci":15.1996,"has_fulltext":false,"cited_by_count":115,"citation_normalized_percentile":{"value":0.9908189,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"300","last_page":"315"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11697","display_name":"Numerical Methods and Algorithms","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11697","display_name":"Numerical Methods and Algorithms","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10363","display_name":"Low-power high-performance VLSI design","score":0.9926000237464905,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8086858987808228},{"id":"https://openalex.org/keywords/compiler","display_name":"Compiler","score":0.6701749563217163},{"id":"https://openalex.org/keywords/double-precision-floating-point-format","display_name":"Double-precision floating-point format","score":0.5699763298034668},{"id":"https://openalex.org/keywords/floating-point","display_name":"Floating point","score":0.5514605045318604},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.49513354897499084},{"id":"https://openalex.org/keywords/single-precision-floating-point-format","display_name":"Single-precision floating-point format","score":0.4658755958080292},{"id":"https://openalex.org/keywords/quadratic-programming","display_name":"Quadratic programming","score":0.45813727378845215},{"id":"https://openalex.org/keywords/reduction","display_name":"Reduction (mathematics)","score":0.4536047875881195},{"id":"https://openalex.org/keywords/quadratic-equation","display_name":"Quadratic equation","score":0.44949695467948914},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.44907739758491516},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.44308406114578247},{"id":"https://openalex.org/keywords/accuracy-and-precision","display_name":"Accuracy and precision","score":0.4371755123138428},{"id":"https://openalex.org/keywords/vectorization","display_name":"Vectorization (mathematics)","score":0.43449318408966064},{"id":"https://openalex.org/keywords/quadratic-growth","display_name":"Quadratic growth","score":0.42367714643478394},{"id":"https://openalex.org/keywords/computer-engineering","display_name":"Computer engineering","score":0.3837924003601074},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.29450637102127075},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.27952319383621216}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8086858987808228},{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.6701749563217163},{"id":"https://openalex.org/C35912277","wikidata":"https://www.wikidata.org/wiki/Q1243369","display_name":"Double-precision floating-point format","level":3,"score":0.5699763298034668},{"id":"https://openalex.org/C84211073","wikidata":"https://www.wikidata.org/wiki/Q117879","display_name":"Floating point","level":2,"score":0.5514605045318604},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.49513354897499084},{"id":"https://openalex.org/C133095886","wikidata":"https://www.wikidata.org/wiki/Q1307173","display_name":"Single-precision floating-point format","level":3,"score":0.4658755958080292},{"id":"https://openalex.org/C81845259","wikidata":"https://www.wikidata.org/wiki/Q290117","display_name":"Quadratic programming","level":2,"score":0.45813727378845215},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.4536047875881195},{"id":"https://openalex.org/C129844170","wikidata":"https://www.wikidata.org/wiki/Q41299","display_name":"Quadratic equation","level":2,"score":0.44949695467948914},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.44907739758491516},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.44308406114578247},{"id":"https://openalex.org/C202799725","wikidata":"https://www.wikidata.org/wiki/Q272035","display_name":"Accuracy and precision","level":2,"score":0.4371755123138428},{"id":"https://openalex.org/C41681595","wikidata":"https://www.wikidata.org/wiki/Q7917855","display_name":"Vectorization (mathematics)","level":2,"score":0.43449318408966064},{"id":"https://openalex.org/C195956108","wikidata":"https://www.wikidata.org/wiki/Q7268362","display_name":"Quadratic growth","level":2,"score":0.42367714643478394},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.3837924003601074},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.29450637102127075},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.27952319383621216},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3009837.3009846","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3009837.3009846","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 44th ACM SIGPLAN Symposium on Principles of Programming Languages","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Affordable and clean energy","score":0.9100000262260437,"id":"https://metadata.un.org/sdg/7"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":49,"referenced_works":["https://openalex.org/W245868749","https://openalex.org/W1492936035","https://openalex.org/W1521746323","https://openalex.org/W1534398032","https://openalex.org/W1938260438","https://openalex.org/W1971367716","https://openalex.org/W1986944060","https://openalex.org/W1988579293","https://openalex.org/W1995574761","https://openalex.org/W2013585593","https://openalex.org/W2014244478","https://openalex.org/W2038705805","https://openalex.org/W2046104010","https://openalex.org/W2054870455","https://openalex.org/W2061091230","https://openalex.org/W2081368694","https://openalex.org/W2096654515","https://openalex.org/W2098156778","https://openalex.org/W2103953062","https://openalex.org/W2109955300","https://openalex.org/W2111593426","https://openalex.org/W2119352997","https://openalex.org/W2121050107","https://openalex.org/W2121344286","https://openalex.org/W2122738744","https://openalex.org/W2127145687","https://openalex.org/W2135120170","https://openalex.org/W2136504964","https://openalex.org/W2146782276","https://openalex.org/W2156828397","https://openalex.org/W2166280160","https://openalex.org/W2169004268","https://openalex.org/W2207050309","https://openalex.org/W2227234579","https://openalex.org/W2251636819","https://openalex.org/W2295915207","https://openalex.org/W2299696796","https://openalex.org/W2365032803","https://openalex.org/W2399231647","https://openalex.org/W2402469106","https://openalex.org/W2410059737","https://openalex.org/W2560674852","https://openalex.org/W2610467942","https://openalex.org/W2721065144","https://openalex.org/W2889447872","https://openalex.org/W2905880463","https://openalex.org/W2952432998","https://openalex.org/W6697772251","https://openalex.org/W6754531929"],"related_works":["https://openalex.org/W1564887326","https://openalex.org/W2239119680","https://openalex.org/W3150959508","https://openalex.org/W2116803521","https://openalex.org/W2773283032","https://openalex.org/W1571090276","https://openalex.org/W3215589575","https://openalex.org/W1973800584","https://openalex.org/W2185760795","https://openalex.org/W2336476964"],"abstract_inverted_index":{"Virtually":[0],"all":[1,61,121],"real-valued":[2],"computations":[3],"are":[4,45],"carried":[5],"out":[6],"using":[7,139],"floating-point":[8],"data":[9,17],"types":[10,18],"and":[11,53,83,102,126,169],"operations.":[12,129],"The":[13],"precision":[14,73,124,137,147,158,175],"of":[15,25,114,145,173],"these":[16],"must":[19],"be":[20],"set":[21],"with":[22],"the":[23,27,115,122,143,156,171,181,187],"goals":[24],"reducing":[26],"overall":[28],"round-off":[29],"error,":[30],"but":[31,213],"also":[32,131,185,214],"emphasizing":[33],"performance":[34],"improvements.":[35],"Often,":[36],"a":[37,56,69,104,111,199],"mixed-precision":[38,195,211],"allocation":[39,74,138],"achieves":[40],"this":[41,65],"optimum;":[42],"unfortunately,":[43],"there":[44],"no":[46],"techniques":[47],"available":[48],"to":[49,72,109,134,141,154,159,210],"compute":[50],"such":[51],"allocations":[52],"conservatively":[54],"meet":[55],"given":[57,116],"error":[58,84,182],"target":[59],"across":[60],"program":[62,108],"inputs.":[63],"In":[64],"work,":[66],"we":[67,179],"present":[68],"rigorous":[70],"approach":[71,91],"based":[75,86],"on":[76,87,198],"formal":[77],"analysis":[78,85],"via":[79],"Symbolic":[80],"Taylor":[81],"Expansions,":[82],"interval":[88],"functions.":[89],"This":[90],"is":[92],"implemented":[93],"in":[94,189,208],"an":[95],"automated":[96],"tool":[97],"called":[98],"FPTuner":[99,118,164],"that":[100],"generates":[101],"solves":[103],"quadratically":[105],"constrained":[106],"quadratic":[107],"obtain":[110],"precision-annotated":[112],"version":[113],"expression.":[117],"automatically":[119],"introduces":[120],"requisite":[123],"up":[125],"down":[127],"casting":[128],"It":[130],"allows":[132],"users":[133],"flexibly":[135],"control":[136],"constraints":[140],"cap":[142],"number":[144],"high":[146],"operators":[148,153,176],"as":[149,151,178],"well":[150],"group":[152],"allocate":[155],"same":[157],"facilitate":[160],"vectorization.":[161],"We":[162,184,203],"evaluate":[163],"by":[165],"tuning":[166],"several":[167],"benchmarks":[168],"measuring":[170],"proportion":[172],"lower":[174],"allocated":[177],"increase":[180],"threshold.":[183],"measure":[186],"reduction":[188],"energy":[190,206],"consumption":[191],"resulting":[192],"from":[193],"executing":[194],"tuned":[196],"code":[197],"real":[200],"hardware":[201],"platform.":[202],"observe":[204,215],"significant":[205],"savings":[207],"response":[209],"tuning,":[212],"situations":[216],"where":[217],"unexpected":[218],"compiler":[219],"behaviors":[220],"thwart":[221],"intended":[222],"optimizations.":[223]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":11},{"year":2024,"cited_by_count":9},{"year":2023,"cited_by_count":4},{"year":2022,"cited_by_count":15},{"year":2021,"cited_by_count":15},{"year":2020,"cited_by_count":17},{"year":2019,"cited_by_count":19},{"year":2018,"cited_by_count":14},{"year":2017,"cited_by_count":9}],"updated_date":"2026-03-28T08:17:26.163206","created_date":"2025-10-10T00:00:00"}
