{"id":"https://openalex.org/W3172632304","doi":"https://doi.org/10.1109/ieeeconf51394.2020.9443541","title":"Towards the Basic Linear Algebra Unit : Replicating multi-dimensional FPUs to accelerate linear algebra applications","display_name":"Towards the Basic Linear Algebra Unit : Replicating multi-dimensional FPUs to accelerate linear algebra applications","publication_year":2020,"publication_date":"2020-11-01","ids":{"openalex":"https://openalex.org/W3172632304","doi":"https://doi.org/10.1109/ieeeconf51394.2020.9443541","mag":"3172632304"},"language":"en","primary_location":{"id":"doi:10.1109/ieeeconf51394.2020.9443541","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ieeeconf51394.2020.9443541","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 54th Asilomar Conference on Signals, Systems, and Computers","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5039376838","display_name":"Nicolas Brunie","orcid":"https://orcid.org/0000-0003-2314-443X"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Nicolas Brunie","raw_affiliation_strings":["Kalray, Montbonnot-Saint-Martin, France"],"affiliations":[{"raw_affiliation_string":"Kalray, Montbonnot-Saint-Martin, France","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5039376838"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.4621,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.63937282,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"1283","last_page":"1290"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10829","display_name":"Interconnection Networks and Systems","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10904","display_name":"Embedded Systems Design Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6780744791030884},{"id":"https://openalex.org/keywords/linear-algebra","display_name":"Linear algebra","score":0.6533016562461853},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.5752652883529663},{"id":"https://openalex.org/keywords/arithmetic","display_name":"Arithmetic","score":0.5623750686645508},{"id":"https://openalex.org/keywords/floating-point-unit","display_name":"Floating-point unit","score":0.5490310192108154},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.48670366406440735},{"id":"https://openalex.org/keywords/arithmetic-logic-unit","display_name":"Arithmetic logic unit","score":0.4770369231700897},{"id":"https://openalex.org/keywords/chip","display_name":"Chip","score":0.42177531123161316},{"id":"https://openalex.org/keywords/arbitrary-precision-arithmetic","display_name":"Arbitrary-precision arithmetic","score":0.4214499890804291},{"id":"https://openalex.org/keywords/elementary-algebra","display_name":"Elementary algebra","score":0.4149687886238098},{"id":"https://openalex.org/keywords/floating-point","display_name":"Floating point","score":0.3061869740486145},{"id":"https://openalex.org/keywords/algebra-over-a-field","display_name":"Algebra over a field","score":0.29285869002342224},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.21267834305763245},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.14223790168762207}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6780744791030884},{"id":"https://openalex.org/C139352143","wikidata":"https://www.wikidata.org/wiki/Q82571","display_name":"Linear algebra","level":2,"score":0.6533016562461853},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.5752652883529663},{"id":"https://openalex.org/C94375191","wikidata":"https://www.wikidata.org/wiki/Q11205","display_name":"Arithmetic","level":1,"score":0.5623750686645508},{"id":"https://openalex.org/C110305270","wikidata":"https://www.wikidata.org/wiki/Q733507","display_name":"Floating-point unit","level":3,"score":0.5490310192108154},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.48670366406440735},{"id":"https://openalex.org/C100276221","wikidata":"https://www.wikidata.org/wiki/Q192903","display_name":"Arithmetic logic unit","level":2,"score":0.4770369231700897},{"id":"https://openalex.org/C165005293","wikidata":"https://www.wikidata.org/wiki/Q1074500","display_name":"Chip","level":2,"score":0.42177531123161316},{"id":"https://openalex.org/C83581934","wikidata":"https://www.wikidata.org/wiki/Q527381","display_name":"Arbitrary-precision arithmetic","level":2,"score":0.4214499890804291},{"id":"https://openalex.org/C92087941","wikidata":"https://www.wikidata.org/wiki/Q211294","display_name":"Elementary algebra","level":3,"score":0.4149687886238098},{"id":"https://openalex.org/C84211073","wikidata":"https://www.wikidata.org/wiki/Q117879","display_name":"Floating point","level":2,"score":0.3061869740486145},{"id":"https://openalex.org/C136119220","wikidata":"https://www.wikidata.org/wiki/Q1000660","display_name":"Algebra over a field","level":2,"score":0.29285869002342224},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.21267834305763245},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.14223790168762207},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ieeeconf51394.2020.9443541","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ieeeconf51394.2020.9443541","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 54th Asilomar Conference on Signals, Systems, and Computers","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Affordable and clean energy","id":"https://metadata.un.org/sdg/7","score":0.4000000059604645}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":9,"referenced_works":["https://openalex.org/W1506162491","https://openalex.org/W2018758602","https://openalex.org/W2113893001","https://openalex.org/W2122696945","https://openalex.org/W2252007067","https://openalex.org/W2545221752","https://openalex.org/W2606722458","https://openalex.org/W2751699127","https://openalex.org/W3152567310"],"related_works":["https://openalex.org/W2797902698","https://openalex.org/W2116803521","https://openalex.org/W2363539709","https://openalex.org/W4383333895","https://openalex.org/W3215589575","https://openalex.org/W1996200942","https://openalex.org/W1482601373","https://openalex.org/W2551094850","https://openalex.org/W2553713956","https://openalex.org/W4243574357"],"abstract_inverted_index":{"The":[0],"ever":[1],"improving":[2],"silicon":[3],"process":[4],"nodes":[5],"have":[6],"provided":[7],"chip":[8],"manufacturer":[9],"with":[10,84,152,194],"a":[11,22,101],"large":[12],"available":[13],"area.":[14,49],"Once":[15],"very":[16],"expensive,":[17],"floating-point":[18],"units":[19,169],"now":[20],"constitute":[21],"small":[23],"portion":[24],"of":[25,29,61,63,73,91,104,139,149,167],"the":[26,38,71,89,109,140,147,183,199],"overall":[27],"area":[28],"modern":[30],"general":[31,128],"purpose":[32,129],"processors.":[33],"In":[34],"arithmetic":[35,69,122,143,161,175,185],"heavy":[36],"workloads,":[37],"processor":[39,141,184],"peak":[40,59],"performance":[41,60,79],"is":[42],"still":[43],"directly":[44],"proportional":[45],"to":[46,57,197],"this":[47],"effective":[48],"Chip":[50],"manufacturers":[51],"are":[52],"always":[53],"looking":[54],"at":[55],"ways":[56],"improve":[58],"each":[62],"their":[64],"compute":[65],"core.":[66],"For":[67],"regular":[68],"application,":[70],"introduction":[72],"vector":[74,92,130,158],"extensions":[75,106,193],"in":[76,127,170],"ISA":[77],"brought":[78],"increases":[80],"which":[81],"linearly":[82],"scale":[83],"core's":[85],"memory":[86,202],"bandwidth.":[87],"Though,":[88],"size":[90],"has":[93],"reached":[94],"technical":[95],"and":[96,115,132,160],"usability":[97],"limits.":[98],"We":[99,145,163,177],"suggest":[100],"new":[102,121],"type":[103],"architectural":[105],"for":[107,173,180],"CPU:":[108],"Basic":[110],"Linear":[111],"Algebra":[112],"Unit":[113],"instructions":[114],"associated":[116],"execution":[117],"unit":[118],"(BLAU).":[119],"This":[120],"architecture":[123],"considers":[124],"packing":[125],"matrices":[126,150],"registers":[131,159],"implementing":[133],"elementary":[134],"matrix":[135],"operations":[136],"as":[137],"part":[138],"standard":[142],"pipeline.":[144,162],"study":[146],"dimensions":[148],"compatible":[151],"integration":[153],"into":[154],"General":[155],"Purpose":[156],"Processor":[157],"introduce":[164],"feasible":[165],"implementations":[166],"such":[168,192],"current":[171],"technologies":[172],"various":[174],"formats.":[176],"show":[178],"that,":[179],"specific":[181],"applications,":[182],"efficiency":[186],"can":[187],"be":[188],"greatly":[189],"increased":[190],"by":[191],"algorithmic":[195],"technics":[196],"limit":[198],"impact":[200],"on":[201],"bandwidth":[203],"usage.":[204]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
