{"id":"https://openalex.org/W2159844683","doi":"https://doi.org/10.1145/2133352.2133358","title":"Portable and scalable FPGA-based acceleration of a direct linear system solver","display_name":"Portable and scalable FPGA-based acceleration of a direct linear system solver","publication_year":2012,"publication_date":"2012-03-01","ids":{"openalex":"https://openalex.org/W2159844683","doi":"https://doi.org/10.1145/2133352.2133358","mag":"2159844683"},"language":"en","primary_location":{"id":"doi:10.1145/2133352.2133358","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2133352.2133358","pdf_url":null,"source":{"id":"https://openalex.org/S112809824","display_name":"ACM Transactions on Reconfigurable Technology and Systems","issn_l":"1936-7406","issn":["1936-7406","1936-7414"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Reconfigurable Technology and Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5118983736","display_name":"Wei Zhang","orcid":"https://orcid.org/0009-0007-9625-1697"},"institutions":[{"id":"https://openalex.org/I185261750","display_name":"University of Toronto","ror":"https://ror.org/03dbr7087","country_code":"CA","type":"education","lineage":["https://openalex.org/I185261750"]}],"countries":["CA"],"is_corresponding":true,"raw_author_name":"Wei Zhang","raw_affiliation_strings":["University of Toronto, ON, Canada"],"affiliations":[{"raw_affiliation_string":"University of Toronto, ON, Canada","institution_ids":["https://openalex.org/I185261750"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030184404","display_name":"Vaughn Betz","orcid":"https://orcid.org/0000-0003-0528-6493"},"institutions":[{"id":"https://openalex.org/I185261750","display_name":"University of Toronto","ror":"https://ror.org/03dbr7087","country_code":"CA","type":"education","lineage":["https://openalex.org/I185261750"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Vaughn Betz","raw_affiliation_strings":["University of Toronto, ON, Canada"],"affiliations":[{"raw_affiliation_string":"University of Toronto, ON, Canada","institution_ids":["https://openalex.org/I185261750"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5090184149","display_name":"Jonathan Rose","orcid":"https://orcid.org/0000-0002-3551-2175"},"institutions":[{"id":"https://openalex.org/I185261750","display_name":"University of Toronto","ror":"https://ror.org/03dbr7087","country_code":"CA","type":"education","lineage":["https://openalex.org/I185261750"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Jonathan Rose","raw_affiliation_strings":["University of Toronto, ON, Canada"],"affiliations":[{"raw_affiliation_string":"University of Toronto, ON, Canada","institution_ids":["https://openalex.org/I185261750"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5118983736"],"corresponding_institution_ids":["https://openalex.org/I185261750"],"apc_list":null,"apc_paid":null,"fwci":6.6713,"has_fulltext":false,"cited_by_count":42,"citation_normalized_percentile":{"value":0.97292486,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":"5","issue":"1","first_page":"1","last_page":"26"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10904","display_name":"Embedded Systems Design Techniques","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11697","display_name":"Numerical Methods and Algorithms","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8640561103820801},{"id":"https://openalex.org/keywords/stratix","display_name":"Stratix","score":0.823951244354248},{"id":"https://openalex.org/keywords/field-programmable-gate-array","display_name":"Field-programmable gate array","score":0.8025988936424255},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6079403162002563},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.5784258246421814},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.5425750017166138},{"id":"https://openalex.org/keywords/fpga-prototype","display_name":"FPGA prototype","score":0.4629645347595215},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.36750656366348267},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.3654361367225647},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.2043907344341278}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8640561103820801},{"id":"https://openalex.org/C2776277307","wikidata":"https://www.wikidata.org/wiki/Q22074755","display_name":"Stratix","level":3,"score":0.823951244354248},{"id":"https://openalex.org/C42935608","wikidata":"https://www.wikidata.org/wiki/Q190411","display_name":"Field-programmable gate array","level":2,"score":0.8025988936424255},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6079403162002563},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.5784258246421814},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.5425750017166138},{"id":"https://openalex.org/C203864433","wikidata":"https://www.wikidata.org/wiki/Q5426992","display_name":"FPGA prototype","level":3,"score":0.4629645347595215},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.36750656366348267},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.3654361367225647},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.2043907344341278}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/2133352.2133358","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2133352.2133358","pdf_url":null,"source":{"id":"https://openalex.org/S112809824","display_name":"ACM Transactions on Reconfigurable Technology and Systems","issn_l":"1936-7406","issn":["1936-7406","1936-7414"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Reconfigurable Technology and Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Affordable and clean energy","score":0.6399999856948853,"id":"https://metadata.un.org/sdg/7"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":20,"referenced_works":["https://openalex.org/W31398948","https://openalex.org/W1552224009","https://openalex.org/W1553214226","https://openalex.org/W1596300602","https://openalex.org/W1820726733","https://openalex.org/W1977221636","https://openalex.org/W1981252059","https://openalex.org/W1991973578","https://openalex.org/W2014066893","https://openalex.org/W2063186542","https://openalex.org/W2094056072","https://openalex.org/W2107971623","https://openalex.org/W2132367502","https://openalex.org/W2136897996","https://openalex.org/W2137994790","https://openalex.org/W2143386935","https://openalex.org/W2149381887","https://openalex.org/W2152567198","https://openalex.org/W4238913942","https://openalex.org/W4248073216"],"related_works":["https://openalex.org/W1509155667","https://openalex.org/W2518118925","https://openalex.org/W2998132311","https://openalex.org/W3208151864","https://openalex.org/W2207067480","https://openalex.org/W4383823603","https://openalex.org/W1692883217","https://openalex.org/W2406926880","https://openalex.org/W2332075903","https://openalex.org/W1579891439"],"abstract_inverted_index":{"FPGAs":[0],"have":[1,28,77],"the":[2,17,33,67,70,84,101,119,130,138,152,161,168,173,190,202,210,217,225,242],"potential":[3],"to":[4,58,115,183],"serve":[5],"as":[6],"a":[7,97,124,133,184,196,233],"platform":[8],"for":[9,25,88,99],"accelerating":[10],"many":[11,41],"computations":[12],"including":[13],"scientific":[14,34,38],"applications.":[15],"However,":[16],"large":[18],"development":[19],"cost":[20],"and":[21,40,105,137,155,224,249],"short":[22],"life":[23],"span":[24],"FPGA":[26,153,170,218,243],"designs":[27],"limited":[29],"their":[30],"adoption":[31],"by":[32],"computing":[35,39,45],"community.":[36],"FPGA-based":[37,60],"kinds":[42],"of":[43,69,91,132,163,175,212,235],"embedded":[44],"could":[46],"become":[47],"more":[48,252],"practical":[49],"if":[50,111],"there":[51],"were":[52,56],"hardware":[53,143],"libraries":[54,113],"that":[55,64,107,127,150],"portable":[57,104],"any":[59],"system":[61],"with":[62,66],"performance":[63,162],"scaled":[65],"size":[68],"FPGA.":[71],"To":[72],"illustrate":[73],"this":[74,176],"idea":[75],"we":[76],"implemented":[78],"one":[79],"common":[80],"super-computing":[81],"library":[82],"function:":[83],"LU":[85],"factorization":[86],"method":[87,98],"solving":[89],"systems":[90],"linear":[92],"equations.":[93],"This":[94],"paper":[95],"describes":[96],"making":[100],"design":[102,122],"both":[103,129],"scalable":[106],"should":[108],"be":[109,116],"illustrative":[110],"such":[112],"are":[114],"built":[117],"in":[118,141,189],"future.":[120],"The":[121,146],"is":[123,220,232,245],"software-based":[125],"generator":[126,147],"leverages":[128],"flexibility":[131],"software":[134,199],"programming":[135],"language":[136],"parameters":[139,149],"inherent":[140],"an":[142],"description":[144],"language.":[145],"accepts":[148],"describe":[151],"capacity":[154],"external":[156],"memory":[157],"capabilities.":[158],"We":[159],"compare":[160],"our":[164],"engine":[165],"executing":[166],"on":[167,209],"largest":[169],"available":[171],"at":[172],"time":[174],"work":[177],"(an":[178],"Altera":[179],"Stratix":[180],"III":[181],"3S340)":[182],"single":[185,206],"processor":[186,203],"core":[187],"fabricated":[188],"same":[191],"65nm":[192],"IC":[193],"process":[194],"running":[195],"highly":[197],"optimized":[198],"implementation":[200,219,244],"from":[201],"vendor.":[204],"For":[205,239],"precision":[207],"matrices":[208],"order":[211],"10,000":[213,215],"\u00d7":[214],"elements,":[216],"2.2":[221],"times":[222,237,247,251],"faster":[223,248],"energy":[226,253],"dissipated":[227],"per":[228],"useful":[229],"GFLOP":[230],"operation":[231],"factor":[234],"5":[236],"less.":[238],"double":[240],"precision,":[241],"1.7":[246],"3.5":[250],"efficient.":[254]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":1},{"year":2019,"cited_by_count":2},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":2},{"year":2016,"cited_by_count":6},{"year":2015,"cited_by_count":10},{"year":2014,"cited_by_count":7},{"year":2013,"cited_by_count":4},{"year":2012,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
