{"id":"https://openalex.org/W2575851384","doi":"https://doi.org/10.3233/978-1-61499-621-7-361","title":"High Performance Eigenvalue Solver in Exact-diagonalization Method for Hubbard Model on CUDA GPU","display_name":"High Performance Eigenvalue Solver in Exact-diagonalization Method for Hubbard Model on CUDA GPU","publication_year":2016,"publication_date":"2016-01-01","ids":{"openalex":"https://openalex.org/W2575851384","doi":"https://doi.org/10.3233/978-1-61499-621-7-361","mag":"2575851384"},"language":"en","primary_location":{"id":"doi:10.3233/978-1-61499-621-7-361","is_oa":false,"landing_page_url":"https://doi.org/10.3233/978-1-61499-621-7-361","pdf_url":null,"source":{"id":"https://openalex.org/S4210175178","display_name":"Advances in parallel computing","issn_l":"0927-5452","issn":["0927-5452","1879-808X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Advances in Parallel Computing","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5006749613","display_name":"Susumu Yamada","orcid":"https://orcid.org/0000-0003-0236-7124"},"institutions":[{"id":"https://openalex.org/I117197279","display_name":"Japan Atomic Energy Agency","ror":"https://ror.org/05nf86y53","country_code":"JP","type":"funder","lineage":["https://openalex.org/I117197279"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Yamada Susumu","raw_affiliation_strings":["Japan Atomic Energy Agency, T\u014dkai Mura, Japan"],"affiliations":[{"raw_affiliation_string":"Japan Atomic Energy Agency, T\u014dkai Mura, Japan","institution_ids":["https://openalex.org/I117197279"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086152822","display_name":"Toshiyuki Imamura","orcid":"https://orcid.org/0000-0003-1601-9710"},"institutions":[{"id":"https://openalex.org/I20529979","display_name":"University of Electro-Communications","ror":"https://ror.org/02x73b849","country_code":"JP","type":"education","lineage":["https://openalex.org/I20529979"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Imamura Toshiyuki","raw_affiliation_strings":["University of Electro-Communications, Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"University of Electro-Communications, Tokyo, Japan","institution_ids":["https://openalex.org/I20529979"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5010173270","display_name":"Masahiko Machida","orcid":null},"institutions":[{"id":"https://openalex.org/I117197279","display_name":"Japan Atomic Energy Agency","ror":"https://ror.org/05nf86y53","country_code":"JP","type":"funder","lineage":["https://openalex.org/I117197279"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Machida Masahiko","raw_affiliation_strings":["Japan Atomic Energy Agency, T\u014dkai Mura, Japan"],"affiliations":[{"raw_affiliation_string":"Japan Atomic Energy Agency, T\u014dkai Mura, Japan","institution_ids":["https://openalex.org/I117197279"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5006749613"],"corresponding_institution_ids":["https://openalex.org/I117197279"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.29612652,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"361","last_page":"369"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10792","display_name":"Matrix Theory and Algorithms","score":0.9437999725341797,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10792","display_name":"Matrix Theory and Algorithms","score":0.9437999725341797,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10037","display_name":"Physics of Superconductivity and Magnetism","score":0.9316999912261963,"subfield":{"id":"https://openalex.org/subfields/3104","display_name":"Condensed Matter Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10346","display_name":"Magnetic confinement fusion research","score":0.9124000072479248,"subfield":{"id":"https://openalex.org/subfields/3106","display_name":"Nuclear and High Energy Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cuda","display_name":"CUDA","score":0.9199264049530029},{"id":"https://openalex.org/keywords/solver","display_name":"Solver","score":0.7625097036361694},{"id":"https://openalex.org/keywords/eigenvalues-and-eigenvectors","display_name":"Eigenvalues and eigenvectors","score":0.6002581119537354},{"id":"https://openalex.org/keywords/hubbard-model","display_name":"Hubbard model","score":0.58500736951828},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.5370330810546875},{"id":"https://openalex.org/keywords/computational-science","display_name":"Computational science","score":0.48742011189460754},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.47487112879753113},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.1750825047492981},{"id":"https://openalex.org/keywords/quantum-mechanics","display_name":"Quantum mechanics","score":0.04008793830871582}],"concepts":[{"id":"https://openalex.org/C2778119891","wikidata":"https://www.wikidata.org/wiki/Q477690","display_name":"CUDA","level":2,"score":0.9199264049530029},{"id":"https://openalex.org/C2778770139","wikidata":"https://www.wikidata.org/wiki/Q1966904","display_name":"Solver","level":2,"score":0.7625097036361694},{"id":"https://openalex.org/C158693339","wikidata":"https://www.wikidata.org/wiki/Q190524","display_name":"Eigenvalues and eigenvectors","level":2,"score":0.6002581119537354},{"id":"https://openalex.org/C106074065","wikidata":"https://www.wikidata.org/wiki/Q1571298","display_name":"Hubbard model","level":3,"score":0.58500736951828},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.5370330810546875},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.48742011189460754},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.47487112879753113},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.1750825047492981},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.04008793830871582},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C54101563","wikidata":"https://www.wikidata.org/wiki/Q124131","display_name":"Superconductivity","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.3233/978-1-61499-621-7-361","is_oa":false,"landing_page_url":"https://doi.org/10.3233/978-1-61499-621-7-361","pdf_url":null,"source":{"id":"https://openalex.org/S4210175178","display_name":"Advances in parallel computing","issn_l":"0927-5452","issn":["0927-5452","1879-808X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Advances in Parallel Computing","raw_type":"book-chapter"},{"id":"mag:2575851384","is_oa":false,"landing_page_url":"https://dblp.uni-trier.de/db/conf/parco/parco2015.html#YamadaIM15","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":"Parallel Computing","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.6299999952316284,"id":"https://metadata.un.org/sdg/7","display_name":"Affordable and clean energy"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W3189307731","https://openalex.org/W1428699136","https://openalex.org/W2949962288","https://openalex.org/W2364686214","https://openalex.org/W1998560227","https://openalex.org/W1604758548","https://openalex.org/W2804126825","https://openalex.org/W1549048322","https://openalex.org/W4367553810","https://openalex.org/W2104142636"],"abstract_inverted_index":{"The":[0,103],"graphics":[1],"processing":[2],"unit":[3],"(GPU)":[4],"is":[5,31,65,72,94,111],"an":[6,69],"excellent":[7],"accelerator":[8],"and":[9,46,90],"it":[10],"can":[11],"realize":[12],"speedup":[13,135],"with":[14,116,138],"appropriate":[15],"tuning.":[16],"In":[17],"this":[18],"paper,":[19],"we":[20],"present":[21],"a":[22,35,66,91],"tuning":[23],"technique":[24],"for":[25,74,84,149],"the":[26,40,47,51,55,59,63,76,82,85,88,95,100,108,114,118,125,139,150],"exact":[27],"diagonalization":[28],"method,":[29],"which":[30,93],"widely":[32],"used":[33,73],"as":[34,136],"numerical":[36,104],"tool":[37],"to":[38],"obtain":[39],"ground":[41],"state":[42],"(the":[43],"smallest":[44],"eigenvalue":[45,77],"corresponding":[48],"eigenvector)":[49],"of":[50,87,121,145],"Hamiltonian":[52,64,89],"derived":[53],"from":[54],"Hubbard":[56],"model,":[57],"on":[58,128,142],"GPU":[60],"architecture.":[61],"Since":[62],"sparse":[67],"matrix,":[68],"iteration":[70,101],"method":[71,127],"solving":[75],"problems.":[78],"We":[79],"mainly":[80],"tune":[81],"code":[83,110,141],"multiplication":[86],"vector,":[92],"most":[96],"time-consuming":[97],"operation":[98],"in":[99],"method.":[102],"test":[105],"shows":[106],"that":[107],"tuned":[109,126],"faster":[112],"than":[113],"one":[115],"using":[117],"routine":[119],"&amp;ldquo;cusparseDcsrmm&amp;rdquo;":[120],"cuSPARSE":[122],"library.":[123],"Moreover,":[124],"NVIDIA":[129],"Tesla":[130],"M2075":[131],"achieves":[132],"about":[133],"3&amp;times;":[134],"compared":[137],"thread-parallelized":[140],"six":[143],"threads":[144],"Intel":[146],"Xeon":[147],"5650":[148],"multiplication.":[151]},"counts_by_year":[{"year":2022,"cited_by_count":1},{"year":2020,"cited_by_count":1}],"updated_date":"2025-12-28T23:10:05.387466","created_date":"2017-01-26T00:00:00"}
