{"id":"https://openalex.org/W7129521724","doi":"https://doi.org/10.48550/arxiv.2602.14450","title":"Mixed precision solvers with half-precision floating point numbers for Lattice QCD on A64FX processor","display_name":"Mixed precision solvers with half-precision floating point numbers for Lattice QCD on A64FX processor","publication_year":2026,"publication_date":"2026-02-16","ids":{"openalex":"https://openalex.org/W7129521724","doi":"https://doi.org/10.48550/arxiv.2602.14450"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2602.14450","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.14450","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2602.14450","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5126257370","display_name":"Issaku Kanamori","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kanamori, Issaku","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Matsufuru, Hideo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Matsufuru, Hideo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126257923","display_name":"Tatsumi Aoyama","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Aoyama, Tatsumi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126254988","display_name":"Kazuyuki Kanaya","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kanaya, Kazuyuki","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032016726","display_name":"Yusuke Namekawa","orcid":"https://orcid.org/0000-0002-3578-5085"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Namekawa, Yusuke","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004154860","display_name":"Hidekatsu Nemura","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nemura, Hidekatsu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5022962037","display_name":"Keigo Nitadori","orcid":"https://orcid.org/0000-0001-7374-4236"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nitadori, Keigo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10792","display_name":"Matrix Theory and Algorithms","score":0.1200999990105629,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10792","display_name":"Matrix Theory and Algorithms","score":0.1200999990105629,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10048","display_name":"Particle physics theoretical and experimental studies","score":0.10949999839067459,"subfield":{"id":"https://openalex.org/subfields/3106","display_name":"Nuclear and High Energy Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10224","display_name":"Quantum Chromodynamics and Particle Interactions","score":0.10589999705553055,"subfield":{"id":"https://openalex.org/subfields/3106","display_name":"Nuclear and High Energy Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/biconjugate-gradient-stabilized-method","display_name":"Biconjugate gradient stabilized method","score":0.8787999749183655},{"id":"https://openalex.org/keywords/solver","display_name":"Solver","score":0.7749000191688538},{"id":"https://openalex.org/keywords/double-precision-floating-point-format","display_name":"Double-precision floating-point format","score":0.5637999773025513},{"id":"https://openalex.org/keywords/floating-point","display_name":"Floating point","score":0.5526999831199646},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.46160000562667847},{"id":"https://openalex.org/keywords/simple","display_name":"Simple (philosophy)","score":0.44679999351501465},{"id":"https://openalex.org/keywords/lattice","display_name":"Lattice (music)","score":0.43059998750686646},{"id":"https://openalex.org/keywords/iterative-method","display_name":"Iterative method","score":0.4296000003814697},{"id":"https://openalex.org/keywords/single-precision-floating-point-format","display_name":"Single-precision floating-point format","score":0.41130000352859497}],"concepts":[{"id":"https://openalex.org/C120553275","wikidata":"https://www.wikidata.org/wiki/Q4903720","display_name":"Biconjugate gradient stabilized method","level":3,"score":0.8787999749183655},{"id":"https://openalex.org/C2778770139","wikidata":"https://www.wikidata.org/wiki/Q1966904","display_name":"Solver","level":2,"score":0.7749000191688538},{"id":"https://openalex.org/C35912277","wikidata":"https://www.wikidata.org/wiki/Q1243369","display_name":"Double-precision floating-point format","level":3,"score":0.5637999773025513},{"id":"https://openalex.org/C84211073","wikidata":"https://www.wikidata.org/wiki/Q117879","display_name":"Floating point","level":2,"score":0.5526999831199646},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5224999785423279},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.47350001335144043},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.46160000562667847},{"id":"https://openalex.org/C2780586882","wikidata":"https://www.wikidata.org/wiki/Q7520643","display_name":"Simple (philosophy)","level":2,"score":0.44679999351501465},{"id":"https://openalex.org/C2781204021","wikidata":"https://www.wikidata.org/wiki/Q6497091","display_name":"Lattice (music)","level":2,"score":0.43059998750686646},{"id":"https://openalex.org/C159694833","wikidata":"https://www.wikidata.org/wiki/Q2321565","display_name":"Iterative method","level":2,"score":0.4296000003814697},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.4251999855041504},{"id":"https://openalex.org/C133095886","wikidata":"https://www.wikidata.org/wiki/Q1307173","display_name":"Single-precision floating-point format","level":3,"score":0.41130000352859497},{"id":"https://openalex.org/C28826006","wikidata":"https://www.wikidata.org/wiki/Q33521","display_name":"Applied mathematics","level":1,"score":0.4041999876499176},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.3937000036239624},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.38679999113082886},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.351500004529953},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.34769999980926514},{"id":"https://openalex.org/C2779982483","wikidata":"https://www.wikidata.org/wiki/Q6094420","display_name":"Iterative refinement","level":2,"score":0.3456999957561493},{"id":"https://openalex.org/C203739276","wikidata":"https://www.wikidata.org/wiki/Q1780355","display_name":"Machine epsilon","level":2,"score":0.3244999945163727},{"id":"https://openalex.org/C6802819","wikidata":"https://www.wikidata.org/wiki/Q1072174","display_name":"Linear system","level":2,"score":0.30570000410079956},{"id":"https://openalex.org/C2989134064","wikidata":"https://www.wikidata.org/wiki/Q288510","display_name":"Execution time","level":2,"score":0.3025999963283539},{"id":"https://openalex.org/C83581934","wikidata":"https://www.wikidata.org/wiki/Q527381","display_name":"Arbitrary-precision arithmetic","level":2,"score":0.29760000109672546},{"id":"https://openalex.org/C3909970","wikidata":"https://www.wikidata.org/wiki/Q6166044","display_name":"Lattice QCD","level":3,"score":0.2971999943256378},{"id":"https://openalex.org/C157449380","wikidata":"https://www.wikidata.org/wiki/Q1030759","display_name":"Fixed-point iteration","level":3,"score":0.2847999930381775},{"id":"https://openalex.org/C89408827","wikidata":"https://www.wikidata.org/wiki/Q855169","display_name":"Biconjugate gradient method","level":5,"score":0.2648000121116638},{"id":"https://openalex.org/C44274781","wikidata":"https://www.wikidata.org/wiki/Q6497132","display_name":"Lattice reduction","level":4,"score":0.25859999656677246},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.25589999556541443},{"id":"https://openalex.org/C48753275","wikidata":"https://www.wikidata.org/wiki/Q11216","display_name":"Numerical analysis","level":2,"score":0.2540999948978424}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2602.14450","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.14450","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2602.14450","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.14450","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"We":[0,115],"investigate":[1],"the":[2,18,52,66,72,88,94,100,108,118],"use":[3],"of":[4,20,54],"half-precision":[5],"floating-point":[6],"numbers":[7],"(FP16)":[8],"in":[9,38,64,129],"mixed-precision":[10,24],"linear":[11],"solvers":[12],"for":[13,22,113],"lattice":[14],"QCD":[15],"simulations.":[16],"Since":[17],"emergence":[19],"GPUs":[21],"general-purpose,":[23],"algorithms":[25],"that":[26,107,117],"combine":[27],"single-precision":[28],"(FP32)":[29],"with":[30,83],"double-precision":[31],"(FP64)":[32],"arithmetics":[33],"have":[34],"become":[35],"widely":[36],"used":[37],"this":[39,58],"field":[40],"and":[41,71,93],"others.":[42],"While":[43],"FP32-based":[44],"methods":[45,121],"are":[46],"now":[47],"well":[48],"established,":[49],"we":[50,60],"examine":[51],"practicality":[53],"using":[55],"FP16.":[56],"In":[57,80],"work,":[59],"introduce":[61],"rescaling":[62,120],"steps":[63],"both":[65],"outer":[67],"iterative":[68],"refinement":[69],"step":[70],"inner":[73],"BiCGStab":[74],"solver":[75,89],"to":[76,99],"avoid":[77],"numerical":[78],"instability.":[79],"our":[81],"experiments":[82],"a":[84],"simple":[85],"Wilson":[86],"kernel,":[87],"shows":[90],"improved":[91],"stability,":[92],"additional":[95],"iteration":[96],"count":[97],"compared":[98],"FP64":[101],"version":[102,110],"remains":[103],"within":[104],"20\\%,":[105],"indicating":[106],"FP16":[109],"is":[111],"practical":[112],"use.":[114],"believe":[116],"proposed":[119],"can":[122],"also":[123],"benefit":[124],"other":[125],"mixed":[126],"precision":[127],"preconditioners":[128],"avoiding":[130],"underflows.":[131]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-02-18T00:00:00"}
