{"id":"https://openalex.org/W2260325244","doi":"https://doi.org/10.3233/978-1-61499-621-7-371","title":"A general tridiagonal solver for coprocessors: Adapting g-Spike for the Intel Xeon Phi","display_name":"A general tridiagonal solver for coprocessors: Adapting g-Spike for the Intel Xeon Phi","publication_year":2016,"publication_date":"2016-01-01","ids":{"openalex":"https://openalex.org/W2260325244","doi":"https://doi.org/10.3233/978-1-61499-621-7-371","mag":"2260325244"},"language":"en","primary_location":{"id":"doi:10.3233/978-1-61499-621-7-371","is_oa":false,"landing_page_url":"https://doi.org/10.3233/978-1-61499-621-7-371","pdf_url":null,"source":{"id":"https://openalex.org/S4210175178","display_name":"Advances in parallel computing","issn_l":"0927-5452","issn":["0927-5452","1879-808X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Advances in Parallel Computing","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5064764358","display_name":"Ioannis E. Venetis","orcid":"https://orcid.org/0000-0002-0022-0447"},"institutions":[{"id":"https://openalex.org/I174878644","display_name":"University of Patras","ror":"https://ror.org/017wvtq80","country_code":"GR","type":"education","lineage":["https://openalex.org/I174878644"]}],"countries":["GR"],"is_corresponding":true,"raw_author_name":"Venetis Ioannis E.","raw_affiliation_strings":["University of Patras, P\u00e1trai, Greece"],"affiliations":[{"raw_affiliation_string":"University of Patras, P\u00e1trai, Greece","institution_ids":["https://openalex.org/I174878644"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026282863","display_name":"Alexandros Sobczyk","orcid":null},"institutions":[{"id":"https://openalex.org/I174878644","display_name":"University of Patras","ror":"https://ror.org/017wvtq80","country_code":"GR","type":"education","lineage":["https://openalex.org/I174878644"]}],"countries":["GR"],"is_corresponding":false,"raw_author_name":"Sobczyk Alexandros","raw_affiliation_strings":["University of Patras, P\u00e1trai, Greece"],"affiliations":[{"raw_affiliation_string":"University of Patras, P\u00e1trai, Greece","institution_ids":["https://openalex.org/I174878644"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102929943","display_name":"Alexandros Kouris","orcid":"https://orcid.org/0000-0002-2900-430X"},"institutions":[{"id":"https://openalex.org/I174878644","display_name":"University of Patras","ror":"https://ror.org/017wvtq80","country_code":"GR","type":"education","lineage":["https://openalex.org/I174878644"]}],"countries":["GR"],"is_corresponding":false,"raw_author_name":"Kouris Alexandros","raw_affiliation_strings":["University of Patras, P\u00e1trai, Greece"],"affiliations":[{"raw_affiliation_string":"University of Patras, P\u00e1trai, Greece","institution_ids":["https://openalex.org/I174878644"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089741556","display_name":"\u0391\u03bb\u03ad\u03be\u03b1\u03bd\u03b4\u03c1\u03bf\u03c2 \u039d\u03ac\u03ba\u03bf\u03c2","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nakos Alexandros","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052892039","display_name":"Nikolaos Nikoloutsakos","orcid":null},"institutions":[{"id":"https://openalex.org/I174878644","display_name":"University of Patras","ror":"https://ror.org/017wvtq80","country_code":"GR","type":"education","lineage":["https://openalex.org/I174878644"]}],"countries":["GR"],"is_corresponding":false,"raw_author_name":"Nikoloutsakos Nikolaos","raw_affiliation_strings":["University of Patras, P\u00e1trai, Greece"],"affiliations":[{"raw_affiliation_string":"University of Patras, P\u00e1trai, Greece","institution_ids":["https://openalex.org/I174878644"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5061247746","display_name":"Efstratios Gallopoulos","orcid":"https://orcid.org/0000-0002-1506-9727"},"institutions":[{"id":"https://openalex.org/I174878644","display_name":"University of Patras","ror":"https://ror.org/017wvtq80","country_code":"GR","type":"education","lineage":["https://openalex.org/I174878644"]}],"countries":["GR"],"is_corresponding":false,"raw_author_name":"Gallopoulos Efstratios","raw_affiliation_strings":["University of Patras, P\u00e1trai, Greece"],"affiliations":[{"raw_affiliation_string":"University of Patras, P\u00e1trai, Greece","institution_ids":["https://openalex.org/I174878644"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5064764358"],"corresponding_institution_ids":["https://openalex.org/I174878644"],"apc_list":null,"apc_paid":null,"fwci":1.2646,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.75851703,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":95},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9857000112533569,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9857000112533569,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10792","display_name":"Matrix Theory and Algorithms","score":0.954200029373169,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/xeon-phi","display_name":"Xeon Phi","score":0.8757704496383667},{"id":"https://openalex.org/keywords/tridiagonal-matrix","display_name":"Tridiagonal matrix","score":0.7303034067153931},{"id":"https://openalex.org/keywords/coprocessor","display_name":"Coprocessor","score":0.7039568424224854},{"id":"https://openalex.org/keywords/solver","display_name":"Solver","score":0.6433517932891846},{"id":"https://openalex.org/keywords/spike","display_name":"Spike (software development)","score":0.5584624409675598},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.5008187294006348},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.4940202832221985},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.11282795667648315},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.10632827877998352},{"id":"https://openalex.org/keywords/software-engineering","display_name":"Software engineering","score":0.04777446389198303}],"concepts":[{"id":"https://openalex.org/C96972482","wikidata":"https://www.wikidata.org/wiki/Q1049168","display_name":"Xeon Phi","level":2,"score":0.8757704496383667},{"id":"https://openalex.org/C51647924","wikidata":"https://www.wikidata.org/wiki/Q1755277","display_name":"Tridiagonal matrix","level":3,"score":0.7303034067153931},{"id":"https://openalex.org/C86111242","wikidata":"https://www.wikidata.org/wiki/Q859595","display_name":"Coprocessor","level":2,"score":0.7039568424224854},{"id":"https://openalex.org/C2778770139","wikidata":"https://www.wikidata.org/wiki/Q1966904","display_name":"Solver","level":2,"score":0.6433517932891846},{"id":"https://openalex.org/C2781390188","wikidata":"https://www.wikidata.org/wiki/Q25203449","display_name":"Spike (software development)","level":2,"score":0.5584624409675598},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.5008187294006348},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4940202832221985},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.11282795667648315},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.10632827877998352},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.04777446389198303},{"id":"https://openalex.org/C158693339","wikidata":"https://www.wikidata.org/wiki/Q190524","display_name":"Eigenvalues and eigenvectors","level":2,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.3233/978-1-61499-621-7-371","is_oa":false,"landing_page_url":"https://doi.org/10.3233/978-1-61499-621-7-371","pdf_url":null,"source":{"id":"https://openalex.org/S4210175178","display_name":"Advances in parallel computing","issn_l":"0927-5452","issn":["0927-5452","1879-808X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Advances in Parallel Computing","raw_type":"book-chapter"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Affordable and clean energy","score":0.6299999952316284,"id":"https://metadata.un.org/sdg/7"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2213533160","https://openalex.org/W2467043670","https://openalex.org/W2051273732","https://openalex.org/W3203561460","https://openalex.org/W4252450863","https://openalex.org/W2022867993","https://openalex.org/W2051078434","https://openalex.org/W1554208380","https://openalex.org/W2682544458","https://openalex.org/W2075846137"],"abstract_inverted_index":{"Manycores":[0],"like":[1,10],"the":[2,11,60,90,97,137,151,155,160,164,168,174],"Intel":[3],"Xeon":[4,98,156],"Phi":[5,157],"and":[6,64,92,167,181],"graphics":[7],"processing":[8,182],"units":[9],"NVIDIA":[12],"Tesla":[13],"series":[14],"are":[15,67],"prime":[16],"examples":[17],"of":[18,32,47,62,89,94,159],"systems":[19,108,120],"for":[20,96,121,178],"accelerating":[21],"applications":[22],"that":[23,66],"run":[24],"on":[25,109,111,136,154],"current":[26],"CPU":[27],"multicores.":[28],"It":[29],"is":[30,46,134],"therefore":[31],"interest":[33,48],"to":[34,49,58,73,84,104],"build":[35],"fast,":[36],"reliable":[37],"linear":[38],"system":[39],"solvers":[40,128],"targeting":[41],"these":[42],"architectures.":[43],"Moreover,":[44],"it":[45,113],"conduct":[50],"cross":[51],"comparisons":[52],"between":[53],"algorithmic":[54],"implementations":[55],"in":[56,71,75,163],"order":[57,72],"organize":[59],"types":[61],"optimizations":[63],"transformations":[65],"necessary":[68,152],"when":[69],"porting":[70],"succeed":[74],"obtaining":[76],"performance":[77,116,176],"portability.":[78],"In":[79],"this":[80],"work":[81],"we":[82],"aim":[83],"present":[85],"a":[86],"detailed":[87],"study":[88],"adaptation":[91],"implementation":[93],"g-Spike":[95,100],"Phi.":[99],"was":[101],"originally":[102],"developed":[103],"solve":[105],"general":[106,125],"tridiagonal":[107,126],"GPUs,":[110],"which":[112,122],"returns":[114],"high":[115],"while":[117],"also":[118],"solving":[119],"other":[123],"state-of-the-art":[124],"GPU":[127],"do":[129],"not":[130],"succeed.":[131],"The":[132],"solver":[133],"based":[135],"Spike":[138],"framework,":[139],"using":[140],"QR":[141],"factorization":[142],"without":[143],"pivoting":[144],"implemented":[145],"via":[146],"Givens":[147],"rotations.":[148],"We":[149],"show":[150],"adaptations":[153],"because":[158],"significant":[161],"differences":[162,177],"programming":[165],"models":[166],"underlying":[169],"architectures":[170],"as":[171,173],"well":[172],"relative":[175],"data":[179],"access":[180],"operations.":[183]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":1}],"updated_date":"2025-12-28T23:10:05.387466","created_date":"2016-06-24T00:00:00"}
