{"id":"https://openalex.org/W2164864640","doi":"https://doi.org/10.1177/1094342013492178","title":"A case study in mechanically deriving dense linear algebra code","display_name":"A case study in mechanically deriving dense linear algebra code","publication_year":2013,"publication_date":"2013-06-19","ids":{"openalex":"https://openalex.org/W2164864640","doi":"https://doi.org/10.1177/1094342013492178","mag":"2164864640"},"language":"en","primary_location":{"id":"doi:10.1177/1094342013492178","is_oa":false,"landing_page_url":"https://doi.org/10.1177/1094342013492178","pdf_url":null,"source":{"id":"https://openalex.org/S60606485","display_name":"The International Journal of High Performance Computing Applications","issn_l":"1094-3420","issn":["1094-3420","1741-2846"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320017","host_organization_name":"SAGE Publishing","host_organization_lineage":["https://openalex.org/P4310320017"],"host_organization_lineage_names":["SAGE Publishing"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The International Journal of High Performance Computing Applications","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5112034603","display_name":"Bryan Marker","orcid":null},"institutions":[{"id":"https://openalex.org/I86519309","display_name":"The University of Texas at Austin","ror":"https://ror.org/00hj54h04","country_code":"US","type":"education","lineage":["https://openalex.org/I86519309"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Bryan Marker","raw_affiliation_strings":["Department of Computer Science, The University of Texas at Austin, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, The University of Texas at Austin, USA","institution_ids":["https://openalex.org/I86519309"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033605569","display_name":"Don Batory","orcid":"https://orcid.org/0000-0002-8739-3841"},"institutions":[{"id":"https://openalex.org/I86519309","display_name":"The University of Texas at Austin","ror":"https://ror.org/00hj54h04","country_code":"US","type":"education","lineage":["https://openalex.org/I86519309"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Don Batory","raw_affiliation_strings":["Department of Computer Science, The University of Texas at Austin, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, The University of Texas at Austin, USA","institution_ids":["https://openalex.org/I86519309"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5061722569","display_name":"Robert A. Geijn","orcid":"https://orcid.org/0009-0004-6434-8492"},"institutions":[{"id":"https://openalex.org/I86519309","display_name":"The University of Texas at Austin","ror":"https://ror.org/00hj54h04","country_code":"US","type":"education","lineage":["https://openalex.org/I86519309"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Robert van de Geijn","raw_affiliation_strings":["Department of Computer Science, The University of Texas at Austin, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, The University of Texas at Austin, USA","institution_ids":["https://openalex.org/I86519309"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5112034603"],"corresponding_institution_ids":["https://openalex.org/I86519309"],"apc_list":null,"apc_paid":null,"fwci":2.2065,"has_fulltext":false,"cited_by_count":9,"citation_normalized_percentile":{"value":0.88563521,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":"27","issue":"4","first_page":"440","last_page":"453"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10904","display_name":"Embedded Systems Design Techniques","score":0.9911999702453613,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12326","display_name":"Network Packet Processing and Optimization","score":0.9878000020980835,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/implementation","display_name":"Implementation","score":0.6713611483573914},{"id":"https://openalex.org/keywords/linear-algebra","display_name":"Linear algebra","score":0.6496589183807373},{"id":"https://openalex.org/keywords/transformation","display_name":"Transformation (genetics)","score":0.6447235345840454},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.6445889472961426},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5869196653366089},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5778133869171143},{"id":"https://openalex.org/keywords/linear-map","display_name":"Linear map","score":0.5135055184364319},{"id":"https://openalex.org/keywords/base","display_name":"Base (topology)","score":0.4873843789100647},{"id":"https://openalex.org/keywords/matrix","display_name":"Matrix (chemical analysis)","score":0.4814243018627167},{"id":"https://openalex.org/keywords/algebra-over-a-field","display_name":"Algebra over a field","score":0.4707774817943573},{"id":"https://openalex.org/keywords/space","display_name":"Space (punctuation)","score":0.4226161241531372},{"id":"https://openalex.org/keywords/architecture","display_name":"Architecture","score":0.41810864210128784},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.398882657289505},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.39523404836654663},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.30218976736068726},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.2132246494293213},{"id":"https://openalex.org/keywords/pure-mathematics","display_name":"Pure mathematics","score":0.15238678455352783},{"id":"https://openalex.org/keywords/geometry","display_name":"Geometry","score":0.07395029067993164}],"concepts":[{"id":"https://openalex.org/C26713055","wikidata":"https://www.wikidata.org/wiki/Q245962","display_name":"Implementation","level":2,"score":0.6713611483573914},{"id":"https://openalex.org/C139352143","wikidata":"https://www.wikidata.org/wiki/Q82571","display_name":"Linear algebra","level":2,"score":0.6496589183807373},{"id":"https://openalex.org/C204241405","wikidata":"https://www.wikidata.org/wiki/Q461499","display_name":"Transformation (genetics)","level":3,"score":0.6447235345840454},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.6445889472961426},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5869196653366089},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5778133869171143},{"id":"https://openalex.org/C49766605","wikidata":"https://www.wikidata.org/wiki/Q207643","display_name":"Linear map","level":2,"score":0.5135055184364319},{"id":"https://openalex.org/C42058472","wikidata":"https://www.wikidata.org/wiki/Q810214","display_name":"Base (topology)","level":2,"score":0.4873843789100647},{"id":"https://openalex.org/C106487976","wikidata":"https://www.wikidata.org/wiki/Q685816","display_name":"Matrix (chemical analysis)","level":2,"score":0.4814243018627167},{"id":"https://openalex.org/C136119220","wikidata":"https://www.wikidata.org/wiki/Q1000660","display_name":"Algebra over a field","level":2,"score":0.4707774817943573},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.4226161241531372},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.41810864210128784},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.398882657289505},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.39523404836654663},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.30218976736068726},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.2132246494293213},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.15238678455352783},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.07395029067993164},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C159985019","wikidata":"https://www.wikidata.org/wiki/Q181790","display_name":"Composite material","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C153349607","wikidata":"https://www.wikidata.org/wiki/Q36649","display_name":"Visual arts","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1177/1094342013492178","is_oa":false,"landing_page_url":"https://doi.org/10.1177/1094342013492178","pdf_url":null,"source":{"id":"https://openalex.org/S60606485","display_name":"The International Journal of High Performance Computing Applications","issn_l":"1094-3420","issn":["1094-3420","1741-2846"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320017","host_organization_name":"SAGE Publishing","host_organization_lineage":["https://openalex.org/P4310320017"],"host_organization_lineage_names":["SAGE Publishing"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The International Journal of High Performance Computing Applications","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320306084","display_name":"U.S. Department of Energy","ror":"https://ror.org/01bj3aw27"},{"id":"https://openalex.org/F4320338284","display_name":"Argonne National Laboratory","ror":"https://ror.org/05gvnxz63"},{"id":"https://openalex.org/F4320338291","display_name":"Sandia National Laboratories","ror":"https://ror.org/01apwpt12"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":25,"referenced_works":["https://openalex.org/W60615445","https://openalex.org/W1480928214","https://openalex.org/W1541425587","https://openalex.org/W1589918049","https://openalex.org/W1923905519","https://openalex.org/W1947869163","https://openalex.org/W1988425770","https://openalex.org/W2002257715","https://openalex.org/W2038469228","https://openalex.org/W2052934867","https://openalex.org/W2054658678","https://openalex.org/W2077115703","https://openalex.org/W2077318760","https://openalex.org/W2093529653","https://openalex.org/W2109098465","https://openalex.org/W2135653967","https://openalex.org/W2136952590","https://openalex.org/W2148553714","https://openalex.org/W2162318968","https://openalex.org/W2169336925","https://openalex.org/W2187980931","https://openalex.org/W2914819579","https://openalex.org/W3106021326","https://openalex.org/W3136479147","https://openalex.org/W4205585823"],"related_works":["https://openalex.org/W2311164424","https://openalex.org/W4240580698","https://openalex.org/W2736536199","https://openalex.org/W1854939505","https://openalex.org/W4249933974","https://openalex.org/W2142325947","https://openalex.org/W4382178632","https://openalex.org/W2072901631","https://openalex.org/W1966987437","https://openalex.org/W2025912094"],"abstract_inverted_index":{"Design":[0],"by":[1],"Transformation":[2],"(DxT)":[3],"is":[4],"a":[5,25,35,44,55,108],"top-down":[6],"approach":[7],"to":[8,20,58,85],"mechanically":[9,101],"derive":[10,21],"high-performance":[11],"algorithms":[12],"for":[13,43,99],"dense":[14],"linear":[15],"algebra.":[16],"We":[17,32],"use":[18],"DxT":[19],"the":[22,49,60,69,78,90,100],"implementation":[23],"of":[24,38,47,72,89,107],"representative":[26],"matrix":[27],"operation,":[28],"two-":[29,63],"sided":[30,64],"Trmm.":[31,65],"start":[33],"with":[34],"knowledge":[36],"base":[37],"transformations":[39,57],"that":[40,93],"were":[41],"encoded":[42],"simpler":[45],"set":[46],"operations,":[48],"level-3":[50],"BLAS,":[51],"and":[52],"add":[53],"only":[54],"few":[56],"accommodate":[59],"more":[61],"complex":[62],"These":[66],"additions":[67],"explode":[68],"search":[70,91],"space":[71,92],"our":[73],"prototype":[74],"system,":[75],"DxTer,":[76],"requiring":[77],"novel":[79],"techniques":[80],"defined":[81],"in":[82],"this":[83],"paper":[84],"eliminate":[86],"large":[87],"segments":[88],"contain":[94],"suboptimal":[95],"algorithms.":[96],"Performance":[97],"results":[98],"optimized":[102],"implementations":[103],"on":[104],"8192":[105],"cores":[106],"BlueGene/P":[109],"architecture":[110],"are":[111],"given.":[112]},"counts_by_year":[{"year":2022,"cited_by_count":1},{"year":2018,"cited_by_count":1},{"year":2015,"cited_by_count":2},{"year":2014,"cited_by_count":3},{"year":2013,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
