{"id":"https://openalex.org/W2947212999","doi":"https://doi.org/10.14529/jsfi190106","title":"Performance Evaluation of Different Implementation Schemes of an Iterative Flow Solver on Modern Vector Machines","display_name":"Performance Evaluation of Different Implementation Schemes of an Iterative Flow Solver on Modern Vector Machines","publication_year":2019,"publication_date":"2019-03-01","ids":{"openalex":"https://openalex.org/W2947212999","doi":"https://doi.org/10.14529/jsfi190106","mag":"2947212999"},"language":"en","primary_location":{"id":"doi:10.14529/jsfi190106","is_oa":true,"landing_page_url":"https://doi.org/10.14529/jsfi190106","pdf_url":null,"source":{"id":"https://openalex.org/S4210177204","display_name":"Supercomputing Frontiers and Innovations","issn_l":"2313-8734","issn":["2313-8734","2409-6008"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310312680","host_organization_name":"Publishing center of the South Ural State University","host_organization_lineage":["https://openalex.org/P4310312680"],"host_organization_lineage_names":["Publishing center of the South Ural State University"],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Supercomputing Frontiers and Innovations","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://doi.org/10.14529/jsfi190106","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5113218531","display_name":"Kenta Yamaguchi","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Kenta Yamaguchi","raw_affiliation_strings":["NEC Solution Innovators"],"affiliations":[{"raw_affiliation_string":"NEC Solution Innovators","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101062490","display_name":"Takashi Soga","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Takashi Soga","raw_affiliation_strings":["NEC Solution Innovators"],"affiliations":[{"raw_affiliation_string":"NEC Solution Innovators","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017079169","display_name":"Yoichi Shimomura","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yoichi Shimomura","raw_affiliation_strings":["NEC Solution Innovators"],"affiliations":[{"raw_affiliation_string":"NEC Solution Innovators","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018940170","display_name":"Thorsten Reimann","orcid":null},"institutions":[{"id":"https://openalex.org/I31512782","display_name":"Technical University of Darmstadt","ror":"https://ror.org/05n911h24","country_code":"DE","type":"education","lineage":["https://openalex.org/I31512782"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Thorsten Reimann","raw_affiliation_strings":["Technische Universit\u00e4t Darmstadt"],"affiliations":[{"raw_affiliation_string":"Technische Universit\u00e4t Darmstadt","institution_ids":["https://openalex.org/I31512782"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051997684","display_name":"Kazuhiko Komatsu","orcid":"https://orcid.org/0000-0003-4463-8359"},"institutions":[{"id":"https://openalex.org/I201537933","display_name":"Tohoku University","ror":"https://ror.org/01dq60k83","country_code":"JP","type":"education","lineage":["https://openalex.org/I201537933"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Kazuhiko Komatsu","raw_affiliation_strings":["Tohoku University"],"affiliations":[{"raw_affiliation_string":"Tohoku University","institution_ids":["https://openalex.org/I201537933"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033954091","display_name":"Ryusuke Egawa","orcid":"https://orcid.org/0000-0001-8966-867X"},"institutions":[{"id":"https://openalex.org/I201537933","display_name":"Tohoku University","ror":"https://ror.org/01dq60k83","country_code":"JP","type":"education","lineage":["https://openalex.org/I201537933"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Ryusuke Egawa","raw_affiliation_strings":["Tohoku University"],"affiliations":[{"raw_affiliation_string":"Tohoku University","institution_ids":["https://openalex.org/I201537933"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032678092","display_name":"Akihiro Musa","orcid":"https://orcid.org/0000-0002-2161-658X"},"institutions":[{"id":"https://openalex.org/I201537933","display_name":"Tohoku University","ror":"https://ror.org/01dq60k83","country_code":"JP","type":"education","lineage":["https://openalex.org/I201537933"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Akihiro Musa","raw_affiliation_strings":["Tohoku University"],"affiliations":[{"raw_affiliation_string":"Tohoku University","institution_ids":["https://openalex.org/I201537933"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011172934","display_name":"Hiroyuki Takizawa","orcid":"https://orcid.org/0000-0003-2858-3140"},"institutions":[{"id":"https://openalex.org/I201537933","display_name":"Tohoku University","ror":"https://ror.org/01dq60k83","country_code":"JP","type":"education","lineage":["https://openalex.org/I201537933"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Hiroyuki Takizawa","raw_affiliation_strings":["Tohoku University"],"affiliations":[{"raw_affiliation_string":"Tohoku University","institution_ids":["https://openalex.org/I201537933"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5007893254","display_name":"Hiroaki Kobayashi","orcid":"https://orcid.org/0000-0002-3350-1413"},"institutions":[{"id":"https://openalex.org/I201537933","display_name":"Tohoku University","ror":"https://ror.org/01dq60k83","country_code":"JP","type":"education","lineage":["https://openalex.org/I201537933"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Hiroaki Kobayashi","raw_affiliation_strings":["Tohoku University"],"affiliations":[{"raw_affiliation_string":"Tohoku University","institution_ids":["https://openalex.org/I201537933"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5113218531"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.7074,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.72643417,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":"6","issue":"1","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9861999750137329,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9861999750137329,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.978600025177002,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11751","display_name":"Lattice Boltzmann Simulation Studies","score":0.972000002861023,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/xeon-phi","display_name":"Xeon Phi","score":0.9286651611328125},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8198236227035522},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.8185229301452637},{"id":"https://openalex.org/keywords/vectorization","display_name":"Vectorization (mathematics)","score":0.7918248176574707},{"id":"https://openalex.org/keywords/simd","display_name":"SIMD","score":0.7895832657814026},{"id":"https://openalex.org/keywords/solver","display_name":"Solver","score":0.7543905973434448},{"id":"https://openalex.org/keywords/supercomputer","display_name":"Supercomputer","score":0.6324160695075989},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5694140195846558},{"id":"https://openalex.org/keywords/xeon","display_name":"Xeon","score":0.5631070137023926},{"id":"https://openalex.org/keywords/vector-processor","display_name":"Vector processor","score":0.48993533849716187},{"id":"https://openalex.org/keywords/stencil","display_name":"Stencil","score":0.4596869647502899},{"id":"https://openalex.org/keywords/computational-science","display_name":"Computational science","score":0.3838474154472351},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.1435854732990265}],"concepts":[{"id":"https://openalex.org/C96972482","wikidata":"https://www.wikidata.org/wiki/Q1049168","display_name":"Xeon Phi","level":2,"score":0.9286651611328125},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8198236227035522},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.8185229301452637},{"id":"https://openalex.org/C41681595","wikidata":"https://www.wikidata.org/wiki/Q7917855","display_name":"Vectorization (mathematics)","level":2,"score":0.7918248176574707},{"id":"https://openalex.org/C150552126","wikidata":"https://www.wikidata.org/wiki/Q339387","display_name":"SIMD","level":2,"score":0.7895832657814026},{"id":"https://openalex.org/C2778770139","wikidata":"https://www.wikidata.org/wiki/Q1966904","display_name":"Solver","level":2,"score":0.7543905973434448},{"id":"https://openalex.org/C83283714","wikidata":"https://www.wikidata.org/wiki/Q121117","display_name":"Supercomputer","level":2,"score":0.6324160695075989},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5694140195846558},{"id":"https://openalex.org/C145108525","wikidata":"https://www.wikidata.org/wiki/Q656154","display_name":"Xeon","level":2,"score":0.5631070137023926},{"id":"https://openalex.org/C161824985","wikidata":"https://www.wikidata.org/wiki/Q919509","display_name":"Vector processor","level":2,"score":0.48993533849716187},{"id":"https://openalex.org/C76752949","wikidata":"https://www.wikidata.org/wiki/Q7607499","display_name":"Stencil","level":2,"score":0.4596869647502899},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.3838474154472351},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.1435854732990265},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.14529/jsfi190106","is_oa":true,"landing_page_url":"https://doi.org/10.14529/jsfi190106","pdf_url":null,"source":{"id":"https://openalex.org/S4210177204","display_name":"Supercomputing Frontiers and Innovations","issn_l":"2313-8734","issn":["2313-8734","2409-6008"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310312680","host_organization_name":"Publishing center of the South Ural State University","host_organization_lineage":["https://openalex.org/P4310312680"],"host_organization_lineage_names":["Publishing center of the South Ural State University"],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Supercomputing Frontiers and Innovations","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.14529/jsfi190106","is_oa":true,"landing_page_url":"https://doi.org/10.14529/jsfi190106","pdf_url":null,"source":{"id":"https://openalex.org/S4210177204","display_name":"Supercomputing Frontiers and Innovations","issn_l":"2313-8734","issn":["2313-8734","2409-6008"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310312680","host_organization_name":"Publishing center of the South Ural State University","host_organization_lineage":["https://openalex.org/P4310312680"],"host_organization_lineage_names":["Publishing center of the South Ural State University"],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Supercomputing Frontiers and Innovations","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":7,"referenced_works":["https://openalex.org/W1487200290","https://openalex.org/W1557212109","https://openalex.org/W2045244586","https://openalex.org/W2079810565","https://openalex.org/W2124192278","https://openalex.org/W2294681552","https://openalex.org/W2592594796"],"related_works":["https://openalex.org/W1908180445","https://openalex.org/W3092174096","https://openalex.org/W3205799311","https://openalex.org/W2739740241","https://openalex.org/W2035419609","https://openalex.org/W2269110805","https://openalex.org/W2912502764","https://openalex.org/W1766386015","https://openalex.org/W2895895456","https://openalex.org/W2612377115"],"abstract_inverted_index":{"Modern":[0],"supercomputers":[1,81,106,212],"consist":[2],"of":[3,53,95,216],"multi-core":[4],"processors,":[5],"and":[6,59,126,130,171,190,193,201],"these":[7,34],"processors":[8],"have":[9,42],"recently":[10],"employed":[11],"vector":[12,68],"instructions,":[13,17],"or":[14],"so-called":[15],"SIMD":[16],"to":[18,24,29,73,84,109,117,154,231],"improve":[19],"performances.":[20],"Numerical":[21],"simulations":[22],"need":[23],"be":[25],"vectorized":[26,61,128],"in":[27,82,107],"order":[28,83,108],"achieve":[30,85,232],"higher":[31,86,207],"performance":[32,162,208,234],"on":[33,104,163,188,198,209,235],"processors.":[35],"Various":[36],"legacy":[37,97],"numerical":[38],"simulation":[39,100],"codes":[40,116],"that":[41,63,177,223],"been":[43],"utilized":[44],"for":[45,66,79,113,138],"a":[46,56,60,96,111,123,127,206],"long":[47],"time":[48],"often":[49],"contain":[50],"two":[51],"versions":[52],"source":[54],"codes:":[55],"non-vectorized":[57,196],"version":[58,62,76,125,197],"is":[64,71,77,151,228],"optimized":[65],"old":[67],"supercomputers.":[69,119,237],"It":[70],"important":[72],"clarify":[74],"which":[75,150],"better":[78],"modern":[80,105,118,211,236],"performance.":[87],"In":[88],"this":[89],"paper,":[90],"we":[91,143,159],"evaluate":[92],"the":[93,131,134,141,146,156,161,178,184,195,224],"performances":[94],"fluid":[98],"dynamics":[99],"code":[101,218],"called":[102],"FASTEST":[103],"provide":[110],"guidepost":[112],"migrating":[114],"such":[115],"The":[120,174],"solver":[121],"has":[122],"nonvectorized":[124],"version,":[129],"latter":[132],"uses":[133],"hyperplane":[135],"ordering":[136,148,186,226],"method":[137,187,227],"vectorization.":[139],"For":[140],"evaluation,":[142],"also":[144,221],"implement":[145],"red-black":[147,185,225],"method,":[149],"another":[152],"way":[153],"vectorize":[155],"solver.":[157],"Then,":[158],"examine":[160],"NEC":[164],"SX-ACE,":[165],"SXAurora":[166],"TSUBASA,":[167,192],"Intel":[168],"Xeon":[169,172,199,202],"Gold,":[170],"Phi.":[173,203],"results":[175],"show":[176,222],"shortest":[179],"execution":[180],"times":[181],"are":[182],"with":[183,194],"SX-ACE":[189],"SX-Aurora":[191],"Gold":[200],"Therefore,":[204],"achieving":[205],"multiple":[210,217],"potentially":[213],"requires":[214],"maintenance":[215],"versions.":[219],"We":[220],"more":[229],"promising":[230],"high":[233]},"counts_by_year":[{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2019,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2019-06-07T00:00:00"}
