{"id":"https://openalex.org/W4415014032","doi":"https://doi.org/10.1002/cpe.70328","title":"Efficient GPU Implementations of Three\u2010Center Two\u2010Electron Repulsion Integrals","display_name":"Efficient GPU Implementations of Three\u2010Center Two\u2010Electron Repulsion Integrals","publication_year":2025,"publication_date":"2025-10-09","ids":{"openalex":"https://openalex.org/W4415014032","doi":"https://doi.org/10.1002/cpe.70328"},"language":"en","primary_location":{"id":"doi:10.1002/cpe.70328","is_oa":false,"landing_page_url":"https://doi.org/10.1002/cpe.70328","pdf_url":null,"source":{"id":"https://openalex.org/S11065456","display_name":"Concurrency and Computation Practice and Experience","issn_l":"1532-0626","issn":["1532-0626","1532-0634"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320595","host_organization_name":"Wiley","host_organization_lineage":["https://openalex.org/P4310320595"],"host_organization_lineage_names":["Wiley"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Concurrency and Computation: Practice and Experience","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5111269964","display_name":"Kanta Suzuki","orcid":null},"institutions":[{"id":"https://openalex.org/I113306721","display_name":"Hiroshima University","ror":"https://ror.org/03t78wx29","country_code":"JP","type":"education","lineage":["https://openalex.org/I113306721"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Kanta Suzuki","raw_affiliation_strings":["Graduate School of Advanced Science and Engineering Hiroshima University  Higashi\u2010Hiroshima Japan"],"affiliations":[{"raw_affiliation_string":"Graduate School of Advanced Science and Engineering Hiroshima University  Higashi\u2010Hiroshima Japan","institution_ids":["https://openalex.org/I113306721"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029487622","display_name":"Yasuaki Ito","orcid":"https://orcid.org/0000-0002-9189-8463"},"institutions":[{"id":"https://openalex.org/I113306721","display_name":"Hiroshima University","ror":"https://ror.org/03t78wx29","country_code":"JP","type":"education","lineage":["https://openalex.org/I113306721"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Yasuaki Ito","raw_affiliation_strings":["Graduate School of Advanced Science and Engineering Hiroshima University  Higashi\u2010Hiroshima Japan"],"affiliations":[{"raw_affiliation_string":"Graduate School of Advanced Science and Engineering Hiroshima University  Higashi\u2010Hiroshima Japan","institution_ids":["https://openalex.org/I113306721"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111269963","display_name":"Haruto Fujii","orcid":null},"institutions":[{"id":"https://openalex.org/I2252096349","display_name":"Fujitsu (Japan)","ror":"https://ror.org/038e2g226","country_code":"JP","type":"company","lineage":["https://openalex.org/I2252096349"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Haruto Fujii","raw_affiliation_strings":["Computing Laboratory Fujitsu Limited  Kawasaki Japan"],"affiliations":[{"raw_affiliation_string":"Computing Laboratory Fujitsu Limited  Kawasaki Japan","institution_ids":["https://openalex.org/I2252096349"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108960905","display_name":"Nobuya Yokogawa","orcid":null},"institutions":[{"id":"https://openalex.org/I113306721","display_name":"Hiroshima University","ror":"https://ror.org/03t78wx29","country_code":"JP","type":"education","lineage":["https://openalex.org/I113306721"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Nobuya Yokogawa","raw_affiliation_strings":["Graduate School of Advanced Science and Engineering Hiroshima University  Higashi\u2010Hiroshima Japan"],"affiliations":[{"raw_affiliation_string":"Graduate School of Advanced Science and Engineering Hiroshima University  Higashi\u2010Hiroshima Japan","institution_ids":["https://openalex.org/I113306721"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5107945532","display_name":"Satoki Tsuji","orcid":null},"institutions":[{"id":"https://openalex.org/I2252096349","display_name":"Fujitsu (Japan)","ror":"https://ror.org/038e2g226","country_code":"JP","type":"company","lineage":["https://openalex.org/I2252096349"]},{"id":"https://openalex.org/I113306721","display_name":"Hiroshima University","ror":"https://ror.org/03t78wx29","country_code":"JP","type":"education","lineage":["https://openalex.org/I113306721"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Satoki Tsuji","raw_affiliation_strings":["Computing Laboratory Fujitsu Limited  Kawasaki Japan","Graduate School of Advanced Science and Engineering Hiroshima University  Higashi\u2010Hiroshima Japan"],"affiliations":[{"raw_affiliation_string":"Computing Laboratory Fujitsu Limited  Kawasaki Japan","institution_ids":["https://openalex.org/I2252096349"]},{"raw_affiliation_string":"Graduate School of Advanced Science and Engineering Hiroshima University  Higashi\u2010Hiroshima Japan","institution_ids":["https://openalex.org/I113306721"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086055038","display_name":"Koji Nakano","orcid":"https://orcid.org/0000-0002-2040-4032"},"institutions":[{"id":"https://openalex.org/I113306721","display_name":"Hiroshima University","ror":"https://ror.org/03t78wx29","country_code":"JP","type":"education","lineage":["https://openalex.org/I113306721"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Koji Nakano","raw_affiliation_strings":["Graduate School of Advanced Science and Engineering Hiroshima University  Higashi\u2010Hiroshima Japan"],"affiliations":[{"raw_affiliation_string":"Graduate School of Advanced Science and Engineering Hiroshima University  Higashi\u2010Hiroshima Japan","institution_ids":["https://openalex.org/I113306721"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046692303","display_name":"Victor Parque","orcid":"https://orcid.org/0000-0001-7329-1468"},"institutions":[{"id":"https://openalex.org/I113306721","display_name":"Hiroshima University","ror":"https://ror.org/03t78wx29","country_code":"JP","type":"education","lineage":["https://openalex.org/I113306721"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Victor Parque","raw_affiliation_strings":["Graduate School of Advanced Science and Engineering Hiroshima University  Higashi\u2010Hiroshima Japan"],"affiliations":[{"raw_affiliation_string":"Graduate School of Advanced Science and Engineering Hiroshima University  Higashi\u2010Hiroshima Japan","institution_ids":["https://openalex.org/I113306721"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5089627100","display_name":"Akihiko Kasagi","orcid":"https://orcid.org/0000-0002-5793-335X"},"institutions":[{"id":"https://openalex.org/I2252096349","display_name":"Fujitsu (Japan)","ror":"https://ror.org/038e2g226","country_code":"JP","type":"company","lineage":["https://openalex.org/I2252096349"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Akihiko Kasagi","raw_affiliation_strings":["Computing Laboratory Fujitsu Limited  Kawasaki Japan"],"affiliations":[{"raw_affiliation_string":"Computing Laboratory Fujitsu Limited  Kawasaki Japan","institution_ids":["https://openalex.org/I2252096349"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5029487622"],"corresponding_institution_ids":["https://openalex.org/I113306721"],"apc_list":{"value":4740,"currency":"USD","value_usd":4740},"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.27968168,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"37","issue":"25-26","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12039","display_name":"Electron and X-Ray Spectroscopy Techniques","score":0.9907000064849854,"subfield":{"id":"https://openalex.org/subfields/2508","display_name":"Surfaces, Coatings and Films"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12039","display_name":"Electron and X-Ray Spectroscopy Techniques","score":0.9907000064849854,"subfield":{"id":"https://openalex.org/subfields/2508","display_name":"Surfaces, Coatings and Films"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9702000021934509,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11809","display_name":"Advanced NMR Techniques and Applications","score":0.9495000243186951,"subfield":{"id":"https://openalex.org/subfields/1607","display_name":"Spectroscopy"},"field":{"id":"https://openalex.org/fields/16","display_name":"Chemistry"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/xeon","display_name":"Xeon","score":0.6881999969482422},{"id":"https://openalex.org/keywords/thread","display_name":"Thread (computing)","score":0.6057999730110168},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.5200999975204468},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.4977000057697296},{"id":"https://openalex.org/keywords/cuda","display_name":"CUDA","score":0.4790000021457672},{"id":"https://openalex.org/keywords/quantum","display_name":"Quantum","score":0.45179998874664307},{"id":"https://openalex.org/keywords/xeon-phi","display_name":"Xeon Phi","score":0.450300008058548},{"id":"https://openalex.org/keywords/implementation","display_name":"Implementation","score":0.41600000858306885}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8370000123977661},{"id":"https://openalex.org/C145108525","wikidata":"https://www.wikidata.org/wiki/Q656154","display_name":"Xeon","level":2,"score":0.6881999969482422},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6277999877929688},{"id":"https://openalex.org/C138101251","wikidata":"https://www.wikidata.org/wiki/Q213092","display_name":"Thread (computing)","level":2,"score":0.6057999730110168},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.5200999975204468},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.4977000057697296},{"id":"https://openalex.org/C2778119891","wikidata":"https://www.wikidata.org/wiki/Q477690","display_name":"CUDA","level":2,"score":0.4790000021457672},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.45969998836517334},{"id":"https://openalex.org/C84114770","wikidata":"https://www.wikidata.org/wiki/Q46344","display_name":"Quantum","level":2,"score":0.45179998874664307},{"id":"https://openalex.org/C96972482","wikidata":"https://www.wikidata.org/wiki/Q1049168","display_name":"Xeon Phi","level":2,"score":0.450300008058548},{"id":"https://openalex.org/C26713055","wikidata":"https://www.wikidata.org/wiki/Q245962","display_name":"Implementation","level":2,"score":0.41600000858306885},{"id":"https://openalex.org/C58053490","wikidata":"https://www.wikidata.org/wiki/Q176555","display_name":"Quantum computer","level":3,"score":0.4000999927520752},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.39239999651908875},{"id":"https://openalex.org/C2778400913","wikidata":"https://www.wikidata.org/wiki/Q1639024","display_name":"Mathematical software","level":3,"score":0.3668999969959259},{"id":"https://openalex.org/C2983609787","wikidata":"https://www.wikidata.org/wiki/Q10534782","display_name":"Software implementation","level":3,"score":0.35749998688697815},{"id":"https://openalex.org/C150552126","wikidata":"https://www.wikidata.org/wiki/Q339387","display_name":"SIMD","level":2,"score":0.3531999886035919},{"id":"https://openalex.org/C133875982","wikidata":"https://www.wikidata.org/wiki/Q764810","display_name":"Shared memory","level":2,"score":0.34709998965263367},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.30550000071525574},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.30309998989105225},{"id":"https://openalex.org/C19754495","wikidata":"https://www.wikidata.org/wiki/Q3435924","display_name":"Computational problem","level":2,"score":0.29350000619888306},{"id":"https://openalex.org/C2991951333","wikidata":"https://www.wikidata.org/wiki/Q188403","display_name":"Quantum chemical","level":3,"score":0.287200003862381},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.2856000065803528},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.27300000190734863},{"id":"https://openalex.org/C2984968299","wikidata":"https://www.wikidata.org/wiki/Q1077784","display_name":"Software tool","level":3,"score":0.2554999887943268}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1002/cpe.70328","is_oa":false,"landing_page_url":"https://doi.org/10.1002/cpe.70328","pdf_url":null,"source":{"id":"https://openalex.org/S11065456","display_name":"Concurrency and Computation Practice and Experience","issn_l":"1532-0626","issn":["1532-0626","1532-0634"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320595","host_organization_name":"Wiley","host_organization_lineage":["https://openalex.org/P4310320595"],"host_organization_lineage_names":["Wiley"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Concurrency and Computation: Practice and Experience","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":59,"referenced_works":["https://openalex.org/W1979891593","https://openalex.org/W2016293616","https://openalex.org/W2029228724","https://openalex.org/W2038305447","https://openalex.org/W2039574885","https://openalex.org/W2044424215","https://openalex.org/W2044682544","https://openalex.org/W2050036547","https://openalex.org/W2050670694","https://openalex.org/W2051469879","https://openalex.org/W2054510591","https://openalex.org/W2057061175","https://openalex.org/W2069862573","https://openalex.org/W2072099189","https://openalex.org/W2076937878","https://openalex.org/W2082691688","https://openalex.org/W2109665034","https://openalex.org/W2141191373","https://openalex.org/W2145454068","https://openalex.org/W2154558448","https://openalex.org/W2155417823","https://openalex.org/W2168299072","https://openalex.org/W2323616528","https://openalex.org/W2332752561","https://openalex.org/W2333743632","https://openalex.org/W2715494257","https://openalex.org/W2756519801","https://openalex.org/W2906538035","https://openalex.org/W2914097545","https://openalex.org/W2948577671","https://openalex.org/W2972996945","https://openalex.org/W2979795026","https://openalex.org/W3017260797","https://openalex.org/W3046033601","https://openalex.org/W3099200606","https://openalex.org/W3102453744","https://openalex.org/W3103102238","https://openalex.org/W3164526122","https://openalex.org/W3184441673","https://openalex.org/W3213110411","https://openalex.org/W4293168632","https://openalex.org/W4302761325","https://openalex.org/W4311199948","https://openalex.org/W4322724459","https://openalex.org/W4324128805","https://openalex.org/W4375856279","https://openalex.org/W4386530547","https://openalex.org/W4389671635","https://openalex.org/W4400087543","https://openalex.org/W4401766595","https://openalex.org/W4404110586","https://openalex.org/W4404501286","https://openalex.org/W4405935055","https://openalex.org/W4405935343","https://openalex.org/W4405935531","https://openalex.org/W4408034148","https://openalex.org/W4409067472","https://openalex.org/W4409804829","https://openalex.org/W4410322104"],"related_works":[],"abstract_inverted_index":{"ABSTRACT":[0],"In":[1],"computational":[2,33,102,140],"quantum":[3,182,219],"chemistry,":[4],"the":[5,23,30,35,40,52,101,113,159,162,207,212],"computation":[6],"of":[7,26,42,49,54,70,115,118,156,217],"three\u2010center":[8,14,93,174],"two\u2010electron":[9,94],"repulsion":[10],"integrals":[11,95],"(also":[12],"termed":[13],"ERIs)":[15],"is":[16,58],"essential":[17],"for":[18,92],"density":[19],"fitting.":[20],"Due":[21],"to":[22,45,60,78,169,172,180,194,200,209],"large":[24],"number":[25],"integral":[27],"elements":[28],"and":[29,68,127,133,153,188,198,215],"induced":[31],"combinatorial":[32],"complexity,":[34],"community":[36],"has":[37,206],"actively":[38],"pursued":[39],"acceleration/speedup":[41],"ERI":[43],"calculations":[44],"achieve":[46],"pragmatic":[47],"levels":[48],"efficiency.":[50],"From":[51],"perspective":[53],"GPU":[55,75],"acceleration,":[56],"atomicAdd":[57,122],"known":[59],"incur":[61],"significant":[62],"memory":[63,76],"overhead:":[64],"The":[65],"frequent":[66],"collisions":[67],"retrials":[69],"value":[71,106],"aggregation":[72],"in":[73],"global":[74],"lead":[77],"substantial":[79],"performance":[80],"degradation.":[81],"To":[82],"tackle":[83],"this":[84],"issue,":[85],"we":[86],"propose":[87],"new":[88],"thread":[89,164],"mapping":[90,165],"strategies":[91],"on":[96,112],"GPUs,":[97],"aiming":[98],"at":[99],"reducing":[100],"cost":[103],"associated":[104],"with":[105,124],"aggregation.":[107],"Our":[108,204],"methods":[109],"are":[110],"based":[111],"idea":[114],"suitable":[116],"substitutions":[117],"device\u2010level":[119],"reduction":[120],"(":[121],")":[123],"efficient":[125],"warp\u2010":[126],"thread\u2010level":[128],"reduction,":[129],"such":[130,185],"as":[131,186],"warp\u2010shuffle":[132],"register":[134],"accumulation.":[135],"As":[136],"a":[137],"result,":[138],"our":[139,190],"experiments":[141],"using":[142],"an":[143,149],"Intel":[144],"Xeon":[145],"Gold":[146],"6338":[147],"CPU,":[148],"NVIDIA":[150],"A100":[151],"GPU,":[152],"relevant":[154],"molecules":[155],"interest":[157],"show":[158],"superiority":[160],"against":[161],"conventional":[163],"scheme,":[166],"achieving":[167],"up":[168,193,199],"2.76":[170],"speedups":[171,195,201],"compute":[173],"ERIs":[175],"more":[176],"efficiently.":[177],"Moreover,":[178],"compared":[179],"well\u2010known":[181],"chemistry":[183],"software":[184],"PySCF":[187,197],"GPU4PySCF,":[189],"method":[191,205],"achieved":[192],"over":[196,202],"GPU4PySCF.":[203],"potential":[208],"further":[210],"enhance":[211],"performance,":[213],"extensibility,":[214],"versatility":[216],"GPU\u2010accelerated":[218],"chemical":[220],"computations.":[221]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-10T00:00:00"}
