{"id":"https://openalex.org/W2795195674","doi":"https://doi.org/10.3233/978-1-61499-843-3-329","title":"GPU-Accelerated and Storage-Efficient Implementation of the QR Decomposition","display_name":"GPU-Accelerated and Storage-Efficient Implementation of the QR Decomposition","publication_year":2018,"publication_date":"2018-01-01","ids":{"openalex":"https://openalex.org/W2795195674","doi":"https://doi.org/10.3233/978-1-61499-843-3-329","mag":"2795195674"},"language":"en","primary_location":{"id":"doi:10.3233/978-1-61499-843-3-329","is_oa":false,"landing_page_url":"https://doi.org/10.3233/978-1-61499-843-3-329","pdf_url":null,"source":{"id":"https://openalex.org/S4210175178","display_name":"Advances in parallel computing","issn_l":"0927-5452","issn":["0927-5452","1879-808X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Advances in Parallel Computing","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Benner Peter","orcid":null},"institutions":[{"id":"https://openalex.org/I149899117","display_name":"Max Planck Society","ror":"https://ror.org/01hhn8329","country_code":"DE","type":"nonprofit","lineage":["https://openalex.org/I149899117"]},{"id":"https://openalex.org/I4210127568","display_name":"Max Planck Institute for Dynamics of Complex Technical Systems","ror":"https://ror.org/030h7k016","country_code":"DE","type":"facility","lineage":["https://openalex.org/I149899117","https://openalex.org/I4210127568"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Benner Peter","raw_affiliation_strings":["Computational Methods in Systems and Control Theory, Max Planck Institute for Dynamics of Complex Technical Systems, Max Planck Society"],"affiliations":[{"raw_affiliation_string":"Computational Methods in Systems and Control Theory, Max Planck Institute for Dynamics of Complex Technical Systems, Max Planck Society","institution_ids":["https://openalex.org/I4210127568","https://openalex.org/I149899117"]}]},{"author_position":"middle","author":{"id":null,"display_name":"K&ouml;hler Martin","orcid":null},"institutions":[{"id":"https://openalex.org/I149899117","display_name":"Max Planck Society","ror":"https://ror.org/01hhn8329","country_code":"DE","type":"nonprofit","lineage":["https://openalex.org/I149899117"]},{"id":"https://openalex.org/I4210127568","display_name":"Max Planck Institute for Dynamics of Complex Technical Systems","ror":"https://ror.org/030h7k016","country_code":"DE","type":"facility","lineage":["https://openalex.org/I149899117","https://openalex.org/I4210127568"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"K&ouml;hler Martin","raw_affiliation_strings":["Computational Methods in Systems and Control Theory, Max Planck Institute for Dynamics of Complex Technical Systems, Max Planck Society"],"affiliations":[{"raw_affiliation_string":"Computational Methods in Systems and Control Theory, Max Planck Institute for Dynamics of Complex Technical Systems, Max Planck Society","institution_ids":["https://openalex.org/I4210127568","https://openalex.org/I149899117"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5055114787","display_name":"Carolin Penke","orcid":"https://orcid.org/0000-0002-4043-3885"},"institutions":[{"id":"https://openalex.org/I149899117","display_name":"Max Planck Society","ror":"https://ror.org/01hhn8329","country_code":"DE","type":"nonprofit","lineage":["https://openalex.org/I149899117"]},{"id":"https://openalex.org/I4210127568","display_name":"Max Planck Institute for Dynamics of Complex Technical Systems","ror":"https://ror.org/030h7k016","country_code":"DE","type":"facility","lineage":["https://openalex.org/I149899117","https://openalex.org/I4210127568"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Penke Carolin","raw_affiliation_strings":["Computational Methods in Systems and Control Theory, Max Planck Institute for Dynamics of Complex Technical Systems, Max Planck Society"],"affiliations":[{"raw_affiliation_string":"Computational Methods in Systems and Control Theory, Max Planck Institute for Dynamics of Complex Technical Systems, Max Planck Society","institution_ids":["https://openalex.org/I4210127568","https://openalex.org/I149899117"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I149899117","https://openalex.org/I4210127568"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.04955152,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9218000173568726,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9218000173568726,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/decomposition","display_name":"Decomposition","score":0.6922489404678345},{"id":"https://openalex.org/keywords/qr-decomposition","display_name":"QR decomposition","score":0.6302200555801392},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5894495844841003},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.44425535202026367},{"id":"https://openalex.org/keywords/computational-science","display_name":"Computational science","score":0.3514034152030945},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.19651204347610474},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.10382053256034851}],"concepts":[{"id":"https://openalex.org/C124681953","wikidata":"https://www.wikidata.org/wiki/Q339062","display_name":"Decomposition","level":2,"score":0.6922489404678345},{"id":"https://openalex.org/C188060507","wikidata":"https://www.wikidata.org/wiki/Q653242","display_name":"QR decomposition","level":3,"score":0.6302200555801392},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5894495844841003},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.44425535202026367},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.3514034152030945},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.19651204347610474},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.10382053256034851},{"id":"https://openalex.org/C158693339","wikidata":"https://www.wikidata.org/wiki/Q190524","display_name":"Eigenvalues and eigenvectors","level":2,"score":0.0},{"id":"https://openalex.org/C178790620","wikidata":"https://www.wikidata.org/wiki/Q11351","display_name":"Organic chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.3233/978-1-61499-843-3-329","is_oa":false,"landing_page_url":"https://doi.org/10.3233/978-1-61499-843-3-329","pdf_url":null,"source":{"id":"https://openalex.org/S4210175178","display_name":"Advances in parallel computing","issn_l":"0927-5452","issn":["0927-5452","1879-808X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Advances in Parallel Computing","raw_type":"book-chapter"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Affordable and clean energy","id":"https://metadata.un.org/sdg/7","score":0.6100000143051147}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W1485846902","https://openalex.org/W3037218165","https://openalex.org/W2390279801","https://openalex.org/W2982181895","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W1980464854"],"abstract_inverted_index":{"The":[0,49,70],"LAPACK":[1,108],"routines":[2],"GEQRT2":[3],"and":[4,79,122],"GEQRT3":[5],"can":[6],"be":[7],"used":[8,53],"to":[9,43,56,65,95],"compute":[10,44],"the":[11,23,27,45,60,98,103,106],"QR":[12,41],"decomposition":[13,42],"of":[14,17,26,59,68,113,126],"a":[15,37,91,101,111,119,124],"matrix":[16,47,61],"size":[18],"m&amp;times;n":[19],"as":[20,22],"well":[21],"storage-efficient":[24,50],"representation":[25,51],"orthogonal":[28],"factor.":[29],"A":[30],"GPU-accelerated":[31],"algorithm":[32,71,104],"is":[33,52,72,93],"presented":[34,73],"that":[35],"expands":[36],"blocked":[38],"CPU-GPU":[39],"hybrid":[40],"triangular":[46],"T.":[48],"in":[54,74],"particular":[55],"access":[57],"blocks":[58],"Q":[62],"without":[63],"having":[64],"generate":[66],"all":[67],"it.":[69],"two":[75,80,129],"variants":[76],"using":[77],"one":[78],"GPUs,":[81],"respectively.":[82],"To":[83],"avoid":[84],"redundant":[85],"computations":[86],"or":[87],"communication":[88],"between":[89],"devices,":[90],"scheme":[92],"developed":[94],"additionally":[96],"computeduring":[97],"iteration.":[99],"As":[100],"result":[102],"outperforms":[105],"standard":[107],"routine":[109],"by":[110,123],"factor":[112,125],"3":[114],"for":[115],"square":[116],"matrices":[117],"on":[118,128],"single":[120],"GPU":[121],"5":[127],"GPUs.":[130]},"counts_by_year":[],"updated_date":"2026-04-16T08:26:57.006410","created_date":"2018-04-06T00:00:00"}
