{"id":"https://openalex.org/W2005641483","doi":"https://doi.org/10.1145/1926367.1926378","title":"An efficient CELL library for lattice quantum chromodynamics","display_name":"An efficient CELL library for lattice quantum chromodynamics","publication_year":2010,"publication_date":"2010-09-14","ids":{"openalex":"https://openalex.org/W2005641483","doi":"https://doi.org/10.1145/1926367.1926378","mag":"2005641483"},"language":"en","primary_location":{"id":"doi:10.1145/1926367.1926378","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1926367.1926378","pdf_url":null,"source":{"id":"https://openalex.org/S4210193905","display_name":"ACM SIGARCH Computer Architecture News","issn_l":"0163-5964","issn":["0163-5964","1943-5851"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320740","host_organization_name":"ACM SIGARCH","host_organization_lineage":["https://openalex.org/P4310320740"],"host_organization_lineage_names":["ACM SIGARCH"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM SIGARCH Computer Architecture News","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5057912061","display_name":"Claude Tadonki","orcid":"https://orcid.org/0000-0003-1194-6400"},"institutions":[{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"funder","lineage":["https://openalex.org/I1294671590"]},{"id":"https://openalex.org/I4210133362","display_name":"Institut National de Physique Nucl\u00e9aire et de Physique des Particules","ror":"https://ror.org/03fd77x13","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I4210133362"]}],"countries":["FR"],"is_corresponding":true,"raw_author_name":"Claude Tadonki","raw_affiliation_strings":["Linear Accelerator Laboratory/CNRS/IN2P3, University of Orsay, Faculty of Sciences, Orsay Cedex, France"],"affiliations":[{"raw_affiliation_string":"Linear Accelerator Laboratory/CNRS/IN2P3, University of Orsay, Faculty of Sciences, Orsay Cedex, France","institution_ids":["https://openalex.org/I4210133362","https://openalex.org/I1294671590"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091229430","display_name":"Gilbert Grodidier","orcid":null},"institutions":[{"id":"https://openalex.org/I4210133362","display_name":"Institut National de Physique Nucl\u00e9aire et de Physique des Particules","ror":"https://ror.org/03fd77x13","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I4210133362"]},{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"funder","lineage":["https://openalex.org/I1294671590"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Gilbert Grodidier","raw_affiliation_strings":["Linear Accelerator Laboratory/CNRS/IN2P3, University of Orsay, Faculty of Sciences, Orsay Cedex, France"],"affiliations":[{"raw_affiliation_string":"Linear Accelerator Laboratory/CNRS/IN2P3, University of Orsay, Faculty of Sciences, Orsay Cedex, France","institution_ids":["https://openalex.org/I4210133362","https://openalex.org/I1294671590"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5033790979","display_name":"O. P\u00e8ne","orcid":null},"institutions":[{"id":"https://openalex.org/I4210133362","display_name":"Institut National de Physique Nucl\u00e9aire et de Physique des Particules","ror":"https://ror.org/03fd77x13","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I4210133362"]},{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"funder","lineage":["https://openalex.org/I1294671590"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Olivier Pene","raw_affiliation_strings":["Linear Accelerator Laboratory/CNRS/IN2P3, University of Orsay, Faculty of Sciences, Orsay Cedex, France"],"affiliations":[{"raw_affiliation_string":"Linear Accelerator Laboratory/CNRS/IN2P3, University of Orsay, Faculty of Sciences, Orsay Cedex, France","institution_ids":["https://openalex.org/I4210133362","https://openalex.org/I1294671590"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5057912061"],"corresponding_institution_ids":["https://openalex.org/I1294671590","https://openalex.org/I4210133362"],"apc_list":null,"apc_paid":null,"fwci":1.0478,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.87626977,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":95},"biblio":{"volume":"38","issue":"4","first_page":"60","last_page":"65"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10048","display_name":"Particle physics theoretical and experimental studies","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/3106","display_name":"Nuclear and High Energy Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10048","display_name":"Particle physics theoretical and experimental studies","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/3106","display_name":"Nuclear and High Energy Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10224","display_name":"Quantum Chromodynamics and Particle Interactions","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/3106","display_name":"Nuclear and High Energy Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.995199978351593,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.7113704085350037},{"id":"https://openalex.org/keywords/quantum-chromodynamics","display_name":"Quantum chromodynamics","score":0.6818385124206543},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6515138149261475},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.528901994228363},{"id":"https://openalex.org/keywords/quantum","display_name":"Quantum","score":0.5066126585006714},{"id":"https://openalex.org/keywords/lattice-qcd","display_name":"Lattice QCD","score":0.45716702938079834},{"id":"https://openalex.org/keywords/quantum-computer","display_name":"Quantum computer","score":0.4353444278240204},{"id":"https://openalex.org/keywords/computational-science","display_name":"Computational science","score":0.4225788712501526},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.3937608301639557},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.3693752884864807},{"id":"https://openalex.org/keywords/statistical-physics","display_name":"Statistical physics","score":0.34654414653778076},{"id":"https://openalex.org/keywords/particle-physics","display_name":"Particle physics","score":0.33977457880973816},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.1955024003982544},{"id":"https://openalex.org/keywords/quantum-mechanics","display_name":"Quantum mechanics","score":0.17873826622962952}],"concepts":[{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.7113704085350037},{"id":"https://openalex.org/C117137515","wikidata":"https://www.wikidata.org/wiki/Q238170","display_name":"Quantum chromodynamics","level":2,"score":0.6818385124206543},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6515138149261475},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.528901994228363},{"id":"https://openalex.org/C84114770","wikidata":"https://www.wikidata.org/wiki/Q46344","display_name":"Quantum","level":2,"score":0.5066126585006714},{"id":"https://openalex.org/C3909970","wikidata":"https://www.wikidata.org/wiki/Q6166044","display_name":"Lattice QCD","level":3,"score":0.45716702938079834},{"id":"https://openalex.org/C58053490","wikidata":"https://www.wikidata.org/wiki/Q176555","display_name":"Quantum computer","level":3,"score":0.4353444278240204},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.4225788712501526},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.3937608301639557},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.3693752884864807},{"id":"https://openalex.org/C121864883","wikidata":"https://www.wikidata.org/wiki/Q677916","display_name":"Statistical physics","level":1,"score":0.34654414653778076},{"id":"https://openalex.org/C109214941","wikidata":"https://www.wikidata.org/wiki/Q18334","display_name":"Particle physics","level":1,"score":0.33977457880973816},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.1955024003982544},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.17873826622962952}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/1926367.1926378","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1926367.1926378","pdf_url":null,"source":{"id":"https://openalex.org/S4210193905","display_name":"ACM SIGARCH Computer Architecture News","issn_l":"0163-5964","issn":["0163-5964","1943-5851"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320740","host_organization_name":"ACM SIGARCH","host_organization_lineage":["https://openalex.org/P4310320740"],"host_organization_lineage_names":["ACM SIGARCH"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM SIGARCH Computer Architecture News","raw_type":"journal-article"},{"id":"pmh:oai:HAL:in2p3-00564860v1","is_oa":false,"landing_page_url":"https://in2p3.hal.science/in2p3-00564860","pdf_url":null,"source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"International Workshop on Highly-efficient accelerators and reconfigurable Technologies (HEART2010) and 24th International Conference on Supercomputing (ICS'10), Jun 2010, Tsukuba, Japan. pp.60-65, &#x27E8;10.1145/1926367.1926378&#x27E9;","raw_type":"Conference papers"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/17","score":0.5400000214576721,"display_name":"Partnerships for the goals"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":13,"referenced_works":["https://openalex.org/W584037522","https://openalex.org/W1506708129","https://openalex.org/W1975715716","https://openalex.org/W1991372770","https://openalex.org/W2002999444","https://openalex.org/W2014116693","https://openalex.org/W2124661136","https://openalex.org/W2153092996","https://openalex.org/W2155967869","https://openalex.org/W2286689978","https://openalex.org/W2507158857","https://openalex.org/W3100964872","https://openalex.org/W6725191152"],"related_works":["https://openalex.org/W2058965144","https://openalex.org/W2164382479","https://openalex.org/W2146343568","https://openalex.org/W1617702743","https://openalex.org/W2014749024","https://openalex.org/W2953067234","https://openalex.org/W2153122142","https://openalex.org/W1541032752","https://openalex.org/W3212303847","https://openalex.org/W4302617997"],"abstract_inverted_index":{"Quantum":[0,37],"chromodynamics":[1],"(QCD)":[2],"is":[3,17,73,80,89,114,196,227],"the":[4,12,20,52,92,108,121,124,139,225],"theory":[5],"of":[6,22,45,55,64,105,162,213],"subnuclear":[7],"physics,":[8],"aiming":[9],"at":[10],"modeling":[11],"strong":[13],"nuclear":[14,23],"force,":[15],"which":[16],"responsible":[18],"for":[19,67,83,190,232],"interactions":[21],"particles.":[24],"Numerical":[25],"QCD":[26],"studies":[27],"are":[28],"performed":[29],"through":[30],"a":[31,62,76,127,159,174,185,204,210,228],"discrete":[32],"formalism":[33],"called":[34],"LQCD":[35,69,165,234],"(Lattice":[36],"Chromodynamics).":[38],"Typical":[39],"simulations":[40],"involve":[41],"very":[42,229],"large":[43],"volume":[44],"data":[46,131],"and":[47,79,94,120,133,142],"numerically":[48],"sensitive":[49],"entities,":[50],"thus":[51],"crucial":[53],"need":[54],"high":[56],"performance":[57],"computing":[58],"systems.":[59],"We":[60,150],"propose":[61],"set":[63],"CELL-accelerated":[65],"routines":[66,172],"basic":[68],"calculations.":[70],"Our":[71,111,220],"framework":[72],"provided":[74],"as":[75,217],"unified":[77],"library":[78,153],"particularly":[81],"optimized":[82],"an":[84,163],"iterative":[85],"use.":[86],"Each":[87],"routine":[88],"parallelized":[90],"among":[91],"SPUs,":[93],"each":[95],"SPU":[96,112,140],"achieves":[97],"it":[98,156],"task":[99],"by":[100,154],"looping":[101],"on":[102,170],"small":[103],"chunk":[104],"arrays":[106],"from":[107],"main":[109],"memory.":[110],"implementation":[113],"vectorized":[115],"with":[116,123],"double":[117],"precision":[118],"data,":[119],"cooperation":[122],"PPU":[125],"shows":[126],"good":[128],"overlap":[129],"between":[130,147],"transfers":[132],"computations.":[134],"Moreover,":[135],"we":[136],"permanently":[137],"keep":[138],"context":[141,207],"use":[143],"mailboxes":[144],"to":[145,157,178],"synchronize":[146],"consecutive":[148],"calls.":[149],"validate":[151],"our":[152],"using":[155],"derive":[158],"CELL":[160,226],"version":[161],"existing":[164],"package":[166],"(tmLQCD).":[167],"Experimental":[168],"results":[169,221],"individual":[171],"show":[173],"significant":[175],"speedup":[176],"compare":[177],"standard":[179],"processor,":[180],"11":[181],"times":[182],"better":[183],"than":[184],"2.83":[186],"GHz":[187],"INTEL":[188],"processor":[189],"instance":[191],"(without":[192],"SSE).":[193],"This":[194],"ratio":[195],"around":[197],"9":[198],"(with":[199],"QS22":[200],"blade)":[201],"when":[202],"consider":[203],"more":[205],"cooperative":[206],"like":[208],"solving":[209],"linear":[211],"system":[212],"equations":[214],"(usually":[215],"referred":[216],"Wislon-Dirac":[218],"inversion).":[219],"clearly":[222],"demonstrate":[223],"that":[224],"promising":[230],"way":[231],"high-scale":[233],"simulations.":[235]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2020,"cited_by_count":1},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":1},{"year":2012,"cited_by_count":1}],"updated_date":"2026-03-10T16:38:18.471706","created_date":"2025-10-10T00:00:00"}
