{"id":"https://openalex.org/W2345127431","doi":"https://doi.org/10.1109/tpds.2016.2516988","title":"A Hybrid Parallel Solving Algorithm on GPU for Quasi-Tridiagonal System of Linear Equations","display_name":"A Hybrid Parallel Solving Algorithm on GPU for Quasi-Tridiagonal System of Linear Equations","publication_year":2016,"publication_date":"2016-01-12","ids":{"openalex":"https://openalex.org/W2345127431","doi":"https://doi.org/10.1109/tpds.2016.2516988","mag":"2345127431"},"language":"en","primary_location":{"id":"doi:10.1109/tpds.2016.2516988","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpds.2016.2516988","pdf_url":null,"source":{"id":"https://openalex.org/S97130795","display_name":"IEEE Transactions on Parallel and Distributed Systems","issn_l":"1045-9219","issn":["1045-9219","1558-2183","2161-9883"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Parallel and Distributed Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5078793726","display_name":"Kenli Li","orcid":"https://orcid.org/0000-0002-2635-7716"},"institutions":[{"id":"https://openalex.org/I16609230","display_name":"Hunan University","ror":"https://ror.org/05htk5m33","country_code":"CN","type":"education","lineage":["https://openalex.org/I16609230"]},{"id":"https://openalex.org/I157455823","display_name":"SUNY New Paltz","ror":"https://ror.org/03j3dv688","country_code":"US","type":"education","lineage":["https://openalex.org/I157455823"]}],"countries":["CN","US"],"is_corresponding":true,"raw_author_name":"Kenli Li","raw_affiliation_strings":["College of Computer Science and Electronic Engineering, Hunan University, Changsha, Hunan, China","Department of Computer Science, State University of New York, New Paltz, New York","National Supercomputing Center in Changsha, Changsha, Hunan, China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Electronic Engineering, Hunan University, Changsha, Hunan, China","institution_ids":["https://openalex.org/I16609230"]},{"raw_affiliation_string":"Department of Computer Science, State University of New York, New Paltz, New York","institution_ids":["https://openalex.org/I157455823"]},{"raw_affiliation_string":"National Supercomputing Center in Changsha, Changsha, Hunan, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016247312","display_name":"Wangdong Yang","orcid":"https://orcid.org/0000-0003-2681-7898"},"institutions":[{"id":"https://openalex.org/I16609230","display_name":"Hunan University","ror":"https://ror.org/05htk5m33","country_code":"CN","type":"education","lineage":["https://openalex.org/I16609230"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wangdong Yang","raw_affiliation_strings":["College of Computer Science and Electronic Engineering, Hunan University, Changsha, Hunan, China","National Supercomputing Center in Changsha, Changsha, Hunan, China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Electronic Engineering, Hunan University, Changsha, Hunan, China","institution_ids":["https://openalex.org/I16609230"]},{"raw_affiliation_string":"National Supercomputing Center in Changsha, Changsha, Hunan, China","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5087894632","display_name":"Keqin Li","orcid":"https://orcid.org/0000-0001-5224-4048"},"institutions":[{"id":"https://openalex.org/I157455823","display_name":"SUNY New Paltz","ror":"https://ror.org/03j3dv688","country_code":"US","type":"education","lineage":["https://openalex.org/I157455823"]},{"id":"https://openalex.org/I16609230","display_name":"Hunan University","ror":"https://ror.org/05htk5m33","country_code":"CN","type":"education","lineage":["https://openalex.org/I16609230"]}],"countries":["CN","US"],"is_corresponding":false,"raw_author_name":"Keqin Li","raw_affiliation_strings":["College of Computer Science and Electronic Engineering, Hunan University, Changsha, Hunan, China","Department of Computer Science, State University of New York, New Paltz, New York","National Supercomputing Center in Changsha, Changsha, Hunan, China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Electronic Engineering, Hunan University, Changsha, Hunan, China","institution_ids":["https://openalex.org/I16609230"]},{"raw_affiliation_string":"Department of Computer Science, State University of New York, New Paltz, New York","institution_ids":["https://openalex.org/I157455823"]},{"raw_affiliation_string":"National Supercomputing Center in Changsha, Changsha, Hunan, China","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5078793726"],"corresponding_institution_ids":["https://openalex.org/I157455823","https://openalex.org/I16609230"],"apc_list":null,"apc_paid":null,"fwci":7.1874,"has_fulltext":false,"cited_by_count":43,"citation_normalized_percentile":{"value":0.97110844,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"27","issue":"10","first_page":"2795","last_page":"2808"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10792","display_name":"Matrix Theory and Algorithms","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10792","display_name":"Matrix Theory and Algorithms","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11435","display_name":"Polynomial and algebraic computation","score":0.991599977016449,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10963","display_name":"Advanced Optimization Algorithms Research","score":0.9890000224113464,"subfield":{"id":"https://openalex.org/subfields/2612","display_name":"Numerical Analysis"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/tridiagonal-matrix","display_name":"Tridiagonal matrix","score":0.9550120830535889},{"id":"https://openalex.org/keywords/tridiagonal-matrix-algorithm","display_name":"Tridiagonal matrix algorithm","score":0.8247369527816772},{"id":"https://openalex.org/keywords/alternating-direction-implicit-method","display_name":"Alternating direction implicit method","score":0.6094324588775635},{"id":"https://openalex.org/keywords/linear-system","display_name":"Linear system","score":0.5890617966651917},{"id":"https://openalex.org/keywords/system-of-linear-equations","display_name":"System of linear equations","score":0.5890482068061829},{"id":"https://openalex.org/keywords/generalized-minimal-residual-method","display_name":"Generalized minimal residual method","score":0.5717735886573792},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5566869378089905},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.5148095488548279},{"id":"https://openalex.org/keywords/sparse-matrix","display_name":"Sparse matrix","score":0.49209731817245483},{"id":"https://openalex.org/keywords/iterative-method","display_name":"Iterative method","score":0.49091392755508423},{"id":"https://openalex.org/keywords/applied-mathematics","display_name":"Applied mathematics","score":0.46308666467666626},{"id":"https://openalex.org/keywords/biconjugate-gradient-stabilized-method","display_name":"Biconjugate gradient stabilized method","score":0.45345398783683777},{"id":"https://openalex.org/keywords/crank\u2013nicolson-method","display_name":"Crank\u2013Nicolson method","score":0.4334664046764374},{"id":"https://openalex.org/keywords/linear-equation","display_name":"Linear equation","score":0.4103235602378845},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.4042072296142578},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.38733452558517456},{"id":"https://openalex.org/keywords/numerical-analysis","display_name":"Numerical analysis","score":0.28154256939888},{"id":"https://openalex.org/keywords/finite-difference-method","display_name":"Finite difference method","score":0.15160465240478516},{"id":"https://openalex.org/keywords/mathematical-analysis","display_name":"Mathematical analysis","score":0.10277929902076721}],"concepts":[{"id":"https://openalex.org/C51647924","wikidata":"https://www.wikidata.org/wiki/Q1755277","display_name":"Tridiagonal matrix","level":3,"score":0.9550120830535889},{"id":"https://openalex.org/C176603272","wikidata":"https://www.wikidata.org/wiki/Q1819156","display_name":"Tridiagonal matrix algorithm","level":4,"score":0.8247369527816772},{"id":"https://openalex.org/C142363948","wikidata":"https://www.wikidata.org/wiki/Q4736413","display_name":"Alternating direction implicit method","level":3,"score":0.6094324588775635},{"id":"https://openalex.org/C6802819","wikidata":"https://www.wikidata.org/wiki/Q1072174","display_name":"Linear system","level":2,"score":0.5890617966651917},{"id":"https://openalex.org/C94523830","wikidata":"https://www.wikidata.org/wiki/Q11203","display_name":"System of linear equations","level":2,"score":0.5890482068061829},{"id":"https://openalex.org/C155332342","wikidata":"https://www.wikidata.org/wiki/Q1432976","display_name":"Generalized minimal residual method","level":3,"score":0.5717735886573792},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5566869378089905},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.5148095488548279},{"id":"https://openalex.org/C56372850","wikidata":"https://www.wikidata.org/wiki/Q1050404","display_name":"Sparse matrix","level":3,"score":0.49209731817245483},{"id":"https://openalex.org/C159694833","wikidata":"https://www.wikidata.org/wiki/Q2321565","display_name":"Iterative method","level":2,"score":0.49091392755508423},{"id":"https://openalex.org/C28826006","wikidata":"https://www.wikidata.org/wiki/Q33521","display_name":"Applied mathematics","level":1,"score":0.46308666467666626},{"id":"https://openalex.org/C120553275","wikidata":"https://www.wikidata.org/wiki/Q4903720","display_name":"Biconjugate gradient stabilized method","level":3,"score":0.45345398783683777},{"id":"https://openalex.org/C180931078","wikidata":"https://www.wikidata.org/wiki/Q588725","display_name":"Crank\u2013Nicolson method","level":3,"score":0.4334664046764374},{"id":"https://openalex.org/C77346573","wikidata":"https://www.wikidata.org/wiki/Q484637","display_name":"Linear equation","level":2,"score":0.4103235602378845},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.4042072296142578},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.38733452558517456},{"id":"https://openalex.org/C48753275","wikidata":"https://www.wikidata.org/wiki/Q11216","display_name":"Numerical analysis","level":2,"score":0.28154256939888},{"id":"https://openalex.org/C205951836","wikidata":"https://www.wikidata.org/wiki/Q1147751","display_name":"Finite difference method","level":2,"score":0.15160465240478516},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.10277929902076721},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C158693339","wikidata":"https://www.wikidata.org/wiki/Q190524","display_name":"Eigenvalues and eigenvectors","level":2,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tpds.2016.2516988","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpds.2016.2516988","pdf_url":null,"source":{"id":"https://openalex.org/S97130795","display_name":"IEEE Transactions on Parallel and Distributed Systems","issn_l":"1045-9219","issn":["1045-9219","1558-2183","2161-9883"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Parallel and Distributed Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2243909624","display_name":null,"funder_award_id":"61133005","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2707076737","display_name":null,"funder_award_id":"61432005","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G30034585","display_name":null,"funder_award_id":"61572175","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G662528876","display_name":null,"funder_award_id":"61472124","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6925281636","display_name":null,"funder_award_id":"61370095","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":36,"referenced_works":["https://openalex.org/W107275210","https://openalex.org/W825382763","https://openalex.org/W1506342804","https://openalex.org/W1513335789","https://openalex.org/W1526797232","https://openalex.org/W1531019619","https://openalex.org/W1968586345","https://openalex.org/W1974312429","https://openalex.org/W1990523337","https://openalex.org/W2003117296","https://openalex.org/W2006850990","https://openalex.org/W2014730252","https://openalex.org/W2017838066","https://openalex.org/W2018380021","https://openalex.org/W2025890876","https://openalex.org/W2031032655","https://openalex.org/W2034258707","https://openalex.org/W2041057519","https://openalex.org/W2043990347","https://openalex.org/W2053999255","https://openalex.org/W2068155564","https://openalex.org/W2068166782","https://openalex.org/W2070169282","https://openalex.org/W2082238959","https://openalex.org/W2090593986","https://openalex.org/W2111000503","https://openalex.org/W2112185810","https://openalex.org/W2143873431","https://openalex.org/W2160406723","https://openalex.org/W2170802276","https://openalex.org/W2183156981","https://openalex.org/W2400350896","https://openalex.org/W4245994617","https://openalex.org/W4247995867","https://openalex.org/W4285719527","https://openalex.org/W6604266063"],"related_works":["https://openalex.org/W1620763245","https://openalex.org/W2486238093","https://openalex.org/W1510662217","https://openalex.org/W2371875888","https://openalex.org/W2592349247","https://openalex.org/W2130308425","https://openalex.org/W2043555141","https://openalex.org/W1987868570","https://openalex.org/W2015301863","https://openalex.org/W1996996069"],"abstract_inverted_index":{"There":[0],"are":[1,101,145],"some":[2,13],"quasi-tridiagonal":[3,21,61,113],"system":[4,22,114],"of":[5,23,30,35,110,115,157,171,192,204,222,231,234],"linear":[6,24,116],"equations":[7,25,117,136],"arising":[8],"from":[9],"numerical":[10],"simulations,":[11],"and":[12,46,49,69,76,139,185,188,195,212,227],"solving":[14,20,41,111],"algorithms":[15],"encounter":[16],"great":[17],"challenge":[18],"on":[19,137,164],"with":[26,181],"more":[27],"than":[28,220],"millions":[29],"dimensions":[31],"as":[32,151],"the":[33,78,85,89,93,98,104,107,112,140,155,168,200,213,223],"scale":[34],"problems":[36],"increases.":[37],"We":[38],"present":[39,123],"a":[40,57,66,70,130],"method":[42,51,75,179,206,217],"which":[43],"mixes":[44],"direct":[45,86,99,228],"iterative":[47,226],"methods,":[48],"our":[50,74,162,178,205,216],"needs":[52],"less":[53,232],"storage":[54],"space":[55],"in":[56,88,143,147,236],"computing":[58,144,202],"process.":[59],"A":[60],"matrix":[62,68,72],"is":[63,173,207,218],"split":[64],"into":[65],"tridiagonal":[67,79,135],"sparse":[71],"using":[73,129,177,215],"then":[77],"equation":[80],"can":[81,118],"be":[82,119],"solved":[83],"by":[84,97,176,209],"methods":[87,100,229],"iteration":[90],"processes.":[91],"Because":[92],"approximate":[94],"solutions":[95],"obtained":[96],"closer":[102],"to":[103,133,152,161,190],"exact":[105],"solutions,":[106],"convergence":[108],"speed":[109],"improved.":[120],"Furthermore,":[121],"we":[122],"an":[124,237],"improved":[125],"cyclic":[126],"reduction":[127],"algorithm":[128],"partition":[131,210],"strategy":[132],"solve":[134],"GPU,":[138],"intermediate":[141],"data":[142],"stored":[146],"shared":[148],"memory":[149,158],"so":[150],"significantly":[153,175],"reduce":[154],"latency":[156],"access.":[159],"According":[160],"experiments":[163],"10":[165],"test":[166],"cases,":[167],"average":[169],"number":[170],"iterations":[172],"reduced":[174],"compared":[180],"Jacobi,":[182],"GS,":[183],"GMRES,":[184],"BiCG":[186],"respectively,":[187],"close":[189],"those":[191,221],"BiCGSTAB,":[193],"BiCRSTAB,":[194],"TFQMR.":[196],"For":[197],"parallel":[198,201],"mode,":[199],"efficiency":[203],"raised":[208],"strategy,":[211],"performance":[214],"better":[219],"commonly":[224],"used":[225],"because":[230],"amount":[233],"calculation":[235],"iteration.":[238]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":13},{"year":2020,"cited_by_count":6},{"year":2019,"cited_by_count":9},{"year":2018,"cited_by_count":4},{"year":2017,"cited_by_count":4},{"year":2016,"cited_by_count":3}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
