{"id":"https://openalex.org/W2110345435","doi":"https://doi.org/10.1145/1646461.1646463","title":"An integrated reduction technique for a double precision accumulator","display_name":"An integrated reduction technique for a double precision accumulator","publication_year":2009,"publication_date":"2009-11-15","ids":{"openalex":"https://openalex.org/W2110345435","doi":"https://doi.org/10.1145/1646461.1646463","mag":"2110345435"},"language":"en","primary_location":{"id":"doi:10.1145/1646461.1646463","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1646461.1646463","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Third International Workshop on High-Performance Reconfigurable Computing Technology and Applications","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5081169433","display_name":"Krishna K. Nagar","orcid":"https://orcid.org/0009-0000-1114-2432"},"institutions":[{"id":"https://openalex.org/I155781252","display_name":"University of South Carolina","ror":"https://ror.org/02b6qw903","country_code":"US","type":"education","lineage":["https://openalex.org/I155781252"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Krishna K. Nagar","raw_affiliation_strings":["University of South Carolina, Columbia, SC","University of South Carolina; Columbia; SC"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of South Carolina, Columbia, SC","institution_ids":["https://openalex.org/I155781252"]},{"raw_affiliation_string":"University of South Carolina; Columbia; SC","institution_ids":["https://openalex.org/I155781252"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068236583","display_name":"Yan Zhang","orcid":"https://orcid.org/0000-0002-2155-9888"},"institutions":[{"id":"https://openalex.org/I155781252","display_name":"University of South Carolina","ror":"https://ror.org/02b6qw903","country_code":"US","type":"education","lineage":["https://openalex.org/I155781252"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yan Zhang","raw_affiliation_strings":["University of South Carolina, Columbia, SC","University of South Carolina; Columbia; SC"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of South Carolina, Columbia, SC","institution_ids":["https://openalex.org/I155781252"]},{"raw_affiliation_string":"University of South Carolina; Columbia; SC","institution_ids":["https://openalex.org/I155781252"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5001266986","display_name":"Jason D. Bakos","orcid":"https://orcid.org/0000-0002-0821-6258"},"institutions":[{"id":"https://openalex.org/I155781252","display_name":"University of South Carolina","ror":"https://ror.org/02b6qw903","country_code":"US","type":"education","lineage":["https://openalex.org/I155781252"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jason D. Bakos","raw_affiliation_strings":["University of South Carolina, Columbia, SC","University of South Carolina; Columbia; SC"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of South Carolina, Columbia, SC","institution_ids":["https://openalex.org/I155781252"]},{"raw_affiliation_string":"University of South Carolina; Columbia; SC","institution_ids":["https://openalex.org/I155781252"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.0636,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.7832431,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"11","last_page":"18"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11697","display_name":"Numerical Methods and Algorithms","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11697","display_name":"Numerical Methods and Algorithms","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11034","display_name":"Digital Filter Design and Implementation","score":0.9761000275611877,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9740999937057495,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/accumulator","display_name":"Accumulator (cryptography)","score":0.8466224670410156},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7729960680007935},{"id":"https://openalex.org/keywords/hydraulic-accumulator","display_name":"Hydraulic accumulator","score":0.7633904218673706},{"id":"https://openalex.org/keywords/adder","display_name":"Adder","score":0.7507230639457703},{"id":"https://openalex.org/keywords/double-precision-floating-point-format","display_name":"Double-precision floating-point format","score":0.7267670035362244},{"id":"https://openalex.org/keywords/ieee-floating-point","display_name":"IEEE floating point","score":0.578911304473877},{"id":"https://openalex.org/keywords/flops","display_name":"FLOPS","score":0.521054208278656},{"id":"https://openalex.org/keywords/floating-point","display_name":"Floating point","score":0.5188904404640198},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.4794963002204895},{"id":"https://openalex.org/keywords/field-programmable-gate-array","display_name":"Field-programmable gate array","score":0.43222954869270325},{"id":"https://openalex.org/keywords/digital-signal-processing","display_name":"Digital signal processing","score":0.4273957908153534},{"id":"https://openalex.org/keywords/reduction","display_name":"Reduction (mathematics)","score":0.41341632604599},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.38727161288261414},{"id":"https://openalex.org/keywords/latency","display_name":"Latency (audio)","score":0.3449457883834839},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.33192139863967896},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.32069021463394165},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.11021977663040161},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.09420862793922424}],"concepts":[{"id":"https://openalex.org/C2078106","wikidata":"https://www.wikidata.org/wiki/Q14906620","display_name":"Accumulator (cryptography)","level":2,"score":0.8466224670410156},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7729960680007935},{"id":"https://openalex.org/C19221803","wikidata":"https://www.wikidata.org/wiki/Q4668679","display_name":"Hydraulic accumulator","level":2,"score":0.7633904218673706},{"id":"https://openalex.org/C164620267","wikidata":"https://www.wikidata.org/wiki/Q376953","display_name":"Adder","level":3,"score":0.7507230639457703},{"id":"https://openalex.org/C35912277","wikidata":"https://www.wikidata.org/wiki/Q1243369","display_name":"Double-precision floating-point format","level":3,"score":0.7267670035362244},{"id":"https://openalex.org/C137231763","wikidata":"https://www.wikidata.org/wiki/Q828287","display_name":"IEEE floating point","level":3,"score":0.578911304473877},{"id":"https://openalex.org/C3826847","wikidata":"https://www.wikidata.org/wiki/Q188768","display_name":"FLOPS","level":2,"score":0.521054208278656},{"id":"https://openalex.org/C84211073","wikidata":"https://www.wikidata.org/wiki/Q117879","display_name":"Floating point","level":2,"score":0.5188904404640198},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.4794963002204895},{"id":"https://openalex.org/C42935608","wikidata":"https://www.wikidata.org/wiki/Q190411","display_name":"Field-programmable gate array","level":2,"score":0.43222954869270325},{"id":"https://openalex.org/C84462506","wikidata":"https://www.wikidata.org/wiki/Q173142","display_name":"Digital signal processing","level":2,"score":0.4273957908153534},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.41341632604599},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.38727161288261414},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.3449457883834839},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.33192139863967896},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.32069021463394165},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.11021977663040161},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.09420862793922424},{"id":"https://openalex.org/C78519656","wikidata":"https://www.wikidata.org/wiki/Q101333","display_name":"Mechanical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/1646461.1646463","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1646461.1646463","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Third International Workshop on High-Performance Reconfigurable Computing Technology and Applications","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.183.760","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.183.760","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.cse.sc.edu/%7Ejbakos/papers/hprcta09_paper.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4749820143","display_name":null,"funder_award_id":"CCF-0844951CCF-0915608","funder_id":"https://openalex.org/F4320337387","funder_display_name":"Division of Computing and Communication Foundations"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320337387","display_name":"Division of Computing and Communication Foundations","ror":"https://ror.org/01mng8331"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":9,"referenced_works":["https://openalex.org/W1981252059","https://openalex.org/W2016512848","https://openalex.org/W2098158887","https://openalex.org/W2122485368","https://openalex.org/W2124408528","https://openalex.org/W2146369740","https://openalex.org/W2152567198","https://openalex.org/W2155385791","https://openalex.org/W4285719527"],"related_works":["https://openalex.org/W4385326254","https://openalex.org/W2359966250","https://openalex.org/W2360903023","https://openalex.org/W2382515793","https://openalex.org/W2016198829","https://openalex.org/W1954749231","https://openalex.org/W2331088322","https://openalex.org/W2348821681","https://openalex.org/W2110345435","https://openalex.org/W1861262881"],"abstract_inverted_index":{"The":[0],"accumulation":[1],"operation,":[2],"An+1":[3,56],"=":[4],"An":[5,58],"+":[6],"X,":[7],"is":[8,38],"perhaps":[9],"one":[10],"of":[11,34,64,74,133,156],"the":[12,50,68,72,75,116,130],"most":[13],"fundamental":[14],"and":[15,21,42,57],"widely-used":[16],"operations":[17],"in":[18,146],"numerical":[19],"mathematics":[20],"digital":[22],"signal":[23],"processing.":[24],"However,":[25],"designing":[26],"double-precision":[27,36],"floating-point":[28,136],"accumulators":[29],"presents":[30],"a":[31,102,105,125,134,147,154],"unique":[32],"set":[33],"challenges:":[35],"addition":[37],"usually":[39],"deeply":[40],"pipelined":[41],"without":[43],"special":[44],"micro-architectural":[45],"or":[46],"data":[47,51],"scheduling":[48],"techniques,":[49],"hazard":[52],"that":[53,60,109],"exists":[54],"between":[55],"requires":[59,110],"each":[61,88],"new":[62],"value":[63],"X":[65],"delivered":[66],"to":[67,115,158],"accumulator":[69,108,141],"wait":[70],"for":[71,83,104],"latency":[73],"adder.":[76,137],"There":[77],"have":[78],"been":[79],"several":[80],"techniques":[81],"proposed":[82],"alleviating":[84],"this":[85,98,122],"problem,":[86],"but":[87],"carries":[89],"significant":[90],"overheads":[91],"and/or":[92],"restrictions":[93],"on":[94],"input":[95],"characteristics.":[96],"In":[97],"paper":[99],"we":[100,143],"present":[101],"design":[103,132],"double":[106],"precision":[107],"no":[111],"timing":[112],"overhead":[113],"relative":[114],"underlying":[117],"add":[118],"operation.":[119],"We":[120],"achieve":[121],"by":[123],"integrating":[124],"coalescing":[126],"reduction":[127],"circuit":[128],"within":[129],"low-level":[131],"base-converting":[135],"To":[138],"demonstrate":[139],"our":[140],"design,":[142],"use":[144],"it":[145],"sparse":[148],"matrix":[149],"vector":[150],"multiplication":[151],"architecture,":[152],"achieving":[153],"throughput":[155],"up":[157],"3.7":[159],"GFLOPS.":[160]},"counts_by_year":[{"year":2014,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
