{"id":"https://openalex.org/W2033096236","doi":"https://doi.org/10.1137/s1064827502410530","title":"Code Optimizations for Complex Microprocessors Applied to CFD Software","display_name":"Code Optimizations for Complex Microprocessors Applied to CFD Software","publication_year":2004,"publication_date":"2004-01-01","ids":{"openalex":"https://openalex.org/W2033096236","doi":"https://doi.org/10.1137/s1064827502410530","mag":"2033096236"},"language":"en","primary_location":{"id":"doi:10.1137/s1064827502410530","is_oa":false,"landing_page_url":"https://doi.org/10.1137/s1064827502410530","pdf_url":null,"source":{"id":"https://openalex.org/S165512578","display_name":"SIAM Journal on Scientific Computing","issn_l":"1064-8275","issn":["1064-8275","1095-7197"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320508","host_organization_name":"Society for Industrial and Applied Mathematics","host_organization_lineage":["https://openalex.org/P4310320508"],"host_organization_lineage_names":["Society for Industrial and Applied Mathematics"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"SIAM Journal on Scientific Computing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5045530644","display_name":"Thomas H\u00e4user","orcid":"https://orcid.org/0000-0003-1170-6749"},"institutions":[{"id":"https://openalex.org/I121980950","display_name":"Utah State University","ror":"https://ror.org/00h6set76","country_code":"US","type":"education","lineage":["https://openalex.org/I121980950"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Th. Hauser","raw_affiliation_strings":["Utah State University"],"affiliations":[{"raw_affiliation_string":"Utah State University","institution_ids":["https://openalex.org/I121980950"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013020019","display_name":"Timothy I. Mattox","orcid":"https://orcid.org/0000-0001-5265-4848"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"T. I. Mattox","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053913983","display_name":"Raymond LeBeau","orcid":null},"institutions":[{"id":"https://openalex.org/I121980950","display_name":"Utah State University","ror":"https://ror.org/00h6set76","country_code":"US","type":"education","lineage":["https://openalex.org/I121980950"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"R. P. LeBeau","raw_affiliation_strings":["Utah State University"],"affiliations":[{"raw_affiliation_string":"Utah State University","institution_ids":["https://openalex.org/I121980950"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109219565","display_name":"H. G. Dietz","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"H. G. Dietz","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5033413049","display_name":"Po-Yu Huang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"P. G. Huang","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5045530644"],"corresponding_institution_ids":["https://openalex.org/I121980950"],"apc_list":null,"apc_paid":null,"fwci":2.6283,"has_fulltext":false,"cited_by_count":9,"citation_normalized_percentile":{"value":0.88313942,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":"25","issue":"4","first_page":"1461","last_page":"1477"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10173","display_name":"Computational Fluid Dynamics and Aerodynamics","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10173","display_name":"Computational Fluid Dynamics and Aerodynamics","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9878000020980835,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11751","display_name":"Lattice Boltzmann Simulation Studies","score":0.982699990272522,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8034632802009583},{"id":"https://openalex.org/keywords/computational-fluid-dynamics","display_name":"Computational fluid dynamics","score":0.762473464012146},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.6789623498916626},{"id":"https://openalex.org/keywords/simd","display_name":"SIMD","score":0.6059787273406982},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.5132274627685547},{"id":"https://openalex.org/keywords/computational-science","display_name":"Computational science","score":0.5014810562133789},{"id":"https://openalex.org/keywords/subroutine","display_name":"Subroutine","score":0.4790705144405365},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.4652377665042877},{"id":"https://openalex.org/keywords/cache","display_name":"Cache","score":0.4579957127571106},{"id":"https://openalex.org/keywords/profiling","display_name":"Profiling (computer programming)","score":0.4265119433403015},{"id":"https://openalex.org/keywords/node","display_name":"Node (physics)","score":0.42495396733283997},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.16159215569496155},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.1326216757297516},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.08024165034294128},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.07802385091781616}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8034632802009583},{"id":"https://openalex.org/C1633027","wikidata":"https://www.wikidata.org/wiki/Q815820","display_name":"Computational fluid dynamics","level":2,"score":0.762473464012146},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6789623498916626},{"id":"https://openalex.org/C150552126","wikidata":"https://www.wikidata.org/wiki/Q339387","display_name":"SIMD","level":2,"score":0.6059787273406982},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.5132274627685547},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.5014810562133789},{"id":"https://openalex.org/C96147967","wikidata":"https://www.wikidata.org/wiki/Q190686","display_name":"Subroutine","level":2,"score":0.4790705144405365},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.4652377665042877},{"id":"https://openalex.org/C115537543","wikidata":"https://www.wikidata.org/wiki/Q165596","display_name":"Cache","level":2,"score":0.4579957127571106},{"id":"https://openalex.org/C187191949","wikidata":"https://www.wikidata.org/wiki/Q1138496","display_name":"Profiling (computer programming)","level":2,"score":0.4265119433403015},{"id":"https://openalex.org/C62611344","wikidata":"https://www.wikidata.org/wiki/Q1062658","display_name":"Node (physics)","level":2,"score":0.42495396733283997},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.16159215569496155},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.1326216757297516},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.08024165034294128},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.07802385091781616},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0},{"id":"https://openalex.org/C66938386","wikidata":"https://www.wikidata.org/wiki/Q633538","display_name":"Structural engineering","level":1,"score":0.0},{"id":"https://openalex.org/C146978453","wikidata":"https://www.wikidata.org/wiki/Q3798668","display_name":"Aerospace engineering","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1137/s1064827502410530","is_oa":false,"landing_page_url":"https://doi.org/10.1137/s1064827502410530","pdf_url":null,"source":{"id":"https://openalex.org/S165512578","display_name":"SIAM Journal on Scientific Computing","issn_l":"1064-8275","issn":["1064-8275","1095-7197"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320508","host_organization_name":"Society for Industrial and Applied Mathematics","host_organization_lineage":["https://openalex.org/P4310320508"],"host_organization_lineage_names":["Society for Industrial and Applied Mathematics"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"SIAM Journal on Scientific Computing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/9","score":0.5099999904632568,"display_name":"Industry, innovation and infrastructure"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":13,"referenced_works":["https://openalex.org/W80878036","https://openalex.org/W1465881795","https://openalex.org/W1488775318","https://openalex.org/W1547830536","https://openalex.org/W1555915743","https://openalex.org/W2015861747","https://openalex.org/W2064370164","https://openalex.org/W2113197229","https://openalex.org/W2115215129","https://openalex.org/W2135653967","https://openalex.org/W2144433126","https://openalex.org/W2731838813","https://openalex.org/W3010292040"],"related_works":["https://openalex.org/W2391861012","https://openalex.org/W2488336788","https://openalex.org/W4285469493","https://openalex.org/W1593224248","https://openalex.org/W2080384954","https://openalex.org/W2375766869","https://openalex.org/W4382519933","https://openalex.org/W3151465598","https://openalex.org/W2368144149","https://openalex.org/W316204541"],"abstract_inverted_index":{"Improving":[0],"large":[1],"scale,":[2],"time-dependent":[3],"numerical":[4],"simulation":[5],"of":[6,15,54,61,98,127,129,150,170],"the":[7,13,34,52,103,111,124,130,133,156,168,171],"Navier--Stokes":[8,92],"equations":[9],"is":[10,49,117,153],"critical":[11],"for":[12,135],"future":[14],"computational":[16,125,157],"fluid":[17],"dynamics":[18],"(CFD)":[19],"in":[20,37,51,164],"engineering":[21],"applications.":[22],"Unfortunately,":[23],"these":[24,151],"computations":[25,48],"require":[26,66],"massive,":[27],"and":[28,82,88,139],"generally":[29],"expensive,":[30],"computing":[31],"resources.":[32],"With":[33],"continuing":[35],"advances":[36],"commodity":[38],"computer":[39],"hardware,":[40],"an":[41],"alternative":[42],"approach":[43],"to":[44,58,90,119,154],"computationally":[45],"expensive":[46],"CFD":[47,64,105],"emerging":[50],"form":[53],"PC":[55,100,175],"clusters.":[56],"However,":[57],"take":[59],"advantage":[60],"clusters":[62],"most":[63],"programs":[65],"extensive":[67],"modifications":[68],"so":[69],"that":[70,84],"they":[71],"run":[72],"efficiently":[73],"on":[74,94,159,173],"cache-based":[75,136],"microprocessor":[76],"systems.":[77],"This":[78],"paper":[79,112],"presents":[80],"techniques":[81],"tools":[83],"we":[85],"have":[86],"developed":[87],"used":[89],"optimize":[91],"solvers":[93],"a":[95,99,144,160,174],"single":[96,161],"node":[97],"cluster":[101],"through":[102,122],"example":[104],"code":[106,116,134,172],"DNSTool.":[107],"After":[108],"describing":[109],"DNSTool,":[110],"demonstrates":[113],"how":[114],"this":[115],"tuned":[118],"improve":[120],"performance":[121,169],"profiling":[123],"cost":[126,158],"each":[128],"subroutines,":[131],"adapting":[132],"memory":[137],"systems,":[138],"including":[140],"SWAR":[141],"(SIMD":[142],"within":[143],"register)":[145],"based":[146],"routines.":[147],"The":[148],"effect":[149],"improvements":[152],"halve":[155],"node,":[162],"which":[163],"turn":[165],"significantly":[166],"increases":[167],"cluster.":[176]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2013,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
