{"id":"https://openalex.org/W3091355678","doi":"https://doi.org/10.1145/3412375","title":"SHASTA","display_name":"SHASTA","publication_year":2020,"publication_date":"2020-09-30","ids":{"openalex":"https://openalex.org/W3091355678","doi":"https://doi.org/10.1145/3412375","mag":"3091355678"},"language":"en","primary_location":{"id":"doi:10.1145/3412375","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3412375","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3412375","source":{"id":"https://openalex.org/S26056741","display_name":"ACM Transactions on Architecture and Code Optimization","issn_l":"1544-3566","issn":["1544-3566","1544-3973"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Architecture and Code Optimization","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3412375","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5003288035","display_name":"Gokul Subramanian Ravi","orcid":"https://orcid.org/0000-0002-2334-2682"},"institutions":[{"id":"https://openalex.org/I135310074","display_name":"University of Wisconsin\u2013Madison","ror":"https://ror.org/01y2jtd41","country_code":"US","type":"education","lineage":["https://openalex.org/I135310074"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Gokul Subramanian Ravi","raw_affiliation_strings":["University of Wisconsin Madison, Electrical and Computer Engineering, Madison, WI"],"affiliations":[{"raw_affiliation_string":"University of Wisconsin Madison, Electrical and Computer Engineering, Madison, WI","institution_ids":["https://openalex.org/I135310074"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034301665","display_name":"Joshua San Miguel","orcid":"https://orcid.org/0000-0002-6886-7183"},"institutions":[{"id":"https://openalex.org/I135310074","display_name":"University of Wisconsin\u2013Madison","ror":"https://ror.org/01y2jtd41","country_code":"US","type":"education","lineage":["https://openalex.org/I135310074"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Joshua San Miguel","raw_affiliation_strings":["University of Wisconsin Madison, Electrical and Computer Engineering, Madison, WI"],"affiliations":[{"raw_affiliation_string":"University of Wisconsin Madison, Electrical and Computer Engineering, Madison, WI","institution_ids":["https://openalex.org/I135310074"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5052869119","display_name":"Mikko H. Lipasti","orcid":"https://orcid.org/0000-0002-8535-9244"},"institutions":[{"id":"https://openalex.org/I135310074","display_name":"University of Wisconsin\u2013Madison","ror":"https://ror.org/01y2jtd41","country_code":"US","type":"education","lineage":["https://openalex.org/I135310074"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mikko Lipasti","raw_affiliation_strings":["University of Wisconsin Madison, Electrical and Computer Engineering, Madison, WI"],"affiliations":[{"raw_affiliation_string":"University of Wisconsin Madison, Electrical and Computer Engineering, Madison, WI","institution_ids":["https://openalex.org/I135310074"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5003288035"],"corresponding_institution_ids":["https://openalex.org/I135310074"],"apc_list":null,"apc_paid":null,"fwci":0.2319,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.48890915,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":93},"biblio":{"volume":"17","issue":"4","first_page":"1","last_page":"26"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12808","display_name":"Ferroelectric and Negative Capacitance Devices","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/approximation-algorithm","display_name":"Approximation algorithm","score":0.7553418874740601},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.722929835319519},{"id":"https://openalex.org/keywords/approximation-error","display_name":"Approximation error","score":0.7118749022483826},{"id":"https://openalex.org/keywords/approximation-theory","display_name":"Approximation theory","score":0.5436091423034668},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.5167016983032227},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.48240387439727783},{"id":"https://openalex.org/keywords/function-approximation","display_name":"Function approximation","score":0.443036288022995},{"id":"https://openalex.org/keywords/gradient-descent","display_name":"Gradient descent","score":0.42943498492240906},{"id":"https://openalex.org/keywords/cache","display_name":"Cache","score":0.42473259568214417},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.4220598042011261},{"id":"https://openalex.org/keywords/stochastic-approximation","display_name":"Stochastic approximation","score":0.410214900970459},{"id":"https://openalex.org/keywords/computer-engineering","display_name":"Computer engineering","score":0.36102986335754395},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.358474999666214},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.3460637331008911},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.29622921347618103},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.22282728552818298},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.1797126829624176},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.13798591494560242}],"concepts":[{"id":"https://openalex.org/C148764684","wikidata":"https://www.wikidata.org/wiki/Q621751","display_name":"Approximation algorithm","level":2,"score":0.7553418874740601},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.722929835319519},{"id":"https://openalex.org/C122383733","wikidata":"https://www.wikidata.org/wiki/Q865920","display_name":"Approximation error","level":2,"score":0.7118749022483826},{"id":"https://openalex.org/C145242015","wikidata":"https://www.wikidata.org/wiki/Q774123","display_name":"Approximation theory","level":2,"score":0.5436091423034668},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.5167016983032227},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.48240387439727783},{"id":"https://openalex.org/C91873725","wikidata":"https://www.wikidata.org/wiki/Q3445816","display_name":"Function approximation","level":3,"score":0.443036288022995},{"id":"https://openalex.org/C153258448","wikidata":"https://www.wikidata.org/wiki/Q1199743","display_name":"Gradient descent","level":3,"score":0.42943498492240906},{"id":"https://openalex.org/C115537543","wikidata":"https://www.wikidata.org/wiki/Q165596","display_name":"Cache","level":2,"score":0.42473259568214417},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.4220598042011261},{"id":"https://openalex.org/C55479107","wikidata":"https://www.wikidata.org/wiki/Q97663916","display_name":"Stochastic approximation","level":3,"score":0.410214900970459},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.36102986335754395},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.358474999666214},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.3460637331008911},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.29622921347618103},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.22282728552818298},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.1797126829624176},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.13798591494560242},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3412375","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3412375","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3412375","source":{"id":"https://openalex.org/S26056741","display_name":"ACM Transactions on Architecture and Code Optimization","issn_l":"1544-3566","issn":["1544-3566","1544-3973"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Architecture and Code Optimization","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1145/3412375","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3412375","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3412375","source":{"id":"https://openalex.org/S26056741","display_name":"ACM Transactions on Architecture and Code Optimization","issn_l":"1544-3566","issn":["1544-3566","1544-3973"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Architecture and Code Optimization","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/7","score":0.8799999952316284,"display_name":"Affordable and clean energy"}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3091355678.pdf","grobid_xml":"https://content.openalex.org/works/W3091355678.grobid-xml"},"referenced_works_count":31,"referenced_works":["https://openalex.org/W1937235839","https://openalex.org/W2020517863","https://openalex.org/W2049451779","https://openalex.org/W2057434193","https://openalex.org/W2080663940","https://openalex.org/W2111444234","https://openalex.org/W2119299853","https://openalex.org/W2135746559","https://openalex.org/W2147657366","https://openalex.org/W2165448367","https://openalex.org/W2169875292","https://openalex.org/W2170881177","https://openalex.org/W2187230075","https://openalex.org/W2319130110","https://openalex.org/W2518628311","https://openalex.org/W2535919346","https://openalex.org/W2554131156","https://openalex.org/W2580755288","https://openalex.org/W2625264446","https://openalex.org/W2896315621","https://openalex.org/W2900227741","https://openalex.org/W2906592685","https://openalex.org/W2913332302","https://openalex.org/W2916991310","https://openalex.org/W2947721658","https://openalex.org/W3098543951","https://openalex.org/W4240067093","https://openalex.org/W4240237526","https://openalex.org/W4250646739","https://openalex.org/W4255681033","https://openalex.org/W4376272906"],"related_works":["https://openalex.org/W1859974437","https://openalex.org/W2171221472","https://openalex.org/W3119645134","https://openalex.org/W189995875","https://openalex.org/W2108297731","https://openalex.org/W2737349826","https://openalex.org/W3177870706","https://openalex.org/W2087686193","https://openalex.org/W3091355678","https://openalex.org/W1997991996"],"abstract_inverted_index":{"A":[0],"key":[1],"requirement":[2],"for":[3,67,85,240,248],"efficient":[4,75],"general":[5,76,216,254],"purpose":[6,77,217,255],"approximate":[7,132],"computing":[8],"is":[9,176,188,200,221,270],"an":[10,74,159,226],"amalgamation":[11],"of":[12,27,96,108,119,225,234,280],"flexible":[13],"hardware":[14,139],"design":[15],"and":[16,33,102,123,229,266,269,282],"intelligent":[17],"application":[18,65],"tuning,":[19],"which":[20,114,206],"together":[21],"can":[22,259],"leverage":[23],"the":[24,30,35,116,164,169,185,191],"appropriate":[25],"amount":[26],"approximation":[28,55,78,110,121,161,187,218],"that":[29],"applications":[31,249],"engender":[32],"reap":[34],"best":[36],"efficiency":[37,167,196],"gains":[38],"from":[39],"them.":[40],"To":[41],"achieve":[42,89,144,163,274],"this,":[43],"we":[44],"have":[45],"identified":[46],"three":[47],"important":[48],"features":[49],"to":[50,88,131,135,143,157,162,262,273,285],"build":[51,73],"better":[52],"general-purpose":[53],"cross-layer":[54],"systems:":[56],"\u2460":[57],"individual":[58],"per-operation":[59],"(\u201cspatio-temporally":[60],"fine-grained\u201d)":[61],"approximation,":[62,68],"\u2461":[63],"hardware-cognizant":[64],"tuning":[66,174],"\u2462":[69],"systemwide":[70],"approximation-synergy.":[71],"We":[72],"system":[79],"called":[80,111],"SHASTA:":[81],"Synergic":[82,208],"HW-SW":[83],"Architecture":[84],"Spatio-Temporal":[86],"Approximation,":[87,113],"these":[90],"goals.":[91],"1":[92],"First,":[93],"in":[94,278],"terms":[95,279],"hardware,":[97],"SHASTA":[98,150,199,220,258],"approximates":[99],"both":[100],"compute":[101],"memory\u2014SHASTA":[103],"proposes":[104,151],"(a)":[105],"a":[106,125,152,179,203,214,237,252],"form":[107],"timing":[109,118],"Slack-control":[112],"controls":[115],"computation":[117],"each":[120],"operation":[122],"(b)":[124],"Dynamic":[126],"Pre-L1":[127],"Load":[128],"Approximation":[129,154],"mechanism":[130,156,175],"loads":[133],"prior":[134,286],"cache":[136],"access.":[137],"These":[138],"mechanisms":[140],"are":[141,246],"designed":[142,201],"fine-grained":[145],"spatio-temporally":[146],"diverse":[147],"approximation.":[148],"Next,":[149],"Hardware-cognizant":[153],"Tuning":[155],"tune":[158],"application\u2019s":[160,186],"optimum":[165],"execution":[166,195,267],"under":[168],"prescribed":[170],"error":[171,193],"tolerance.":[172],"The":[173],"implemented":[177,222],"atop":[178],"gradient":[180],"descent":[181],"algorithm":[182],"and,":[183],"thus,":[184],"tuned":[189,261],"along":[190],"steepest":[192],"vs.":[194],"gradient.":[197],"Finally,":[198],"with":[202],"full-system":[204],"perspective,":[205],"achieves":[207,230],"benefits":[209,245],"across":[210],"its":[211],"optimizations,":[212],"building":[213],"closer-to-ideal":[215],"system.":[219,257],"on":[223,251],"top":[224],"OOO":[227],"core":[228],"mean":[231],"speedups/energy":[232],"savings":[233],"20%\u201340%":[235],"over":[236],"non-approximate":[238],"baseline":[239],"greater":[241],"than":[242],"90%":[243],"accuracy\u2014these":[244],"substantial":[247],"executing":[250],"traditional":[253],"processing":[256],"be":[260],"specific":[263],"accuracy":[264],"constraints":[265],"metrics":[268],"quantitatively":[271],"shown":[272],"2\u201315\u00d7":[275],"higher":[276],"benefits,":[277],"performance":[281],"energy,":[283],"compared":[284],"work.":[287]},"counts_by_year":[{"year":2021,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2020-10-08T00:00:00"}
