{"id":"https://openalex.org/W2963721753","doi":"https://doi.org/10.1145/3291523","title":"New High Performance GPGPU Code Transformation Framework Applied to Large Production Weather Prediction Code","display_name":"New High Performance GPGPU Code Transformation Framework Applied to Large Production Weather Prediction Code","publication_year":2018,"publication_date":"2018-06-30","ids":{"openalex":"https://openalex.org/W2963721753","doi":"https://doi.org/10.1145/3291523","mag":"2963721753"},"language":"en","primary_location":{"id":"doi:10.1145/3291523","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3291523","pdf_url":null,"source":{"id":"https://openalex.org/S2483380313","display_name":"ACM Transactions on Parallel Computing","issn_l":"2329-4949","issn":["2329-4949","2329-4957"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Parallel Computing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5056055773","display_name":"Michel M\u00fcller","orcid":null},"institutions":[{"id":"https://openalex.org/I114531698","display_name":"Tokyo Institute of Technology","ror":"https://ror.org/0112mx960","country_code":"JP","type":"education","lineage":["https://openalex.org/I114531698"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Michel M\u00fcller","raw_affiliation_strings":["Tokyo Institute of Technology, Meguro-ku, Tokyo"],"affiliations":[{"raw_affiliation_string":"Tokyo Institute of Technology, Meguro-ku, Tokyo","institution_ids":["https://openalex.org/I114531698"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5083869087","display_name":"Takayuki Aoki","orcid":"https://orcid.org/0000-0003-1850-3469"},"institutions":[{"id":"https://openalex.org/I114531698","display_name":"Tokyo Institute of Technology","ror":"https://ror.org/0112mx960","country_code":"JP","type":"education","lineage":["https://openalex.org/I114531698"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Takayuki Aoki","raw_affiliation_strings":["Tokyo Institute of Technology, Meguro-ku, Tokyo"],"affiliations":[{"raw_affiliation_string":"Tokyo Institute of Technology, Meguro-ku, Tokyo","institution_ids":["https://openalex.org/I114531698"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5056055773"],"corresponding_institution_ids":["https://openalex.org/I114531698"],"apc_list":null,"apc_paid":null,"fwci":0.5049,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.66010755,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":96},"biblio":{"volume":"5","issue":"2","first_page":"1","last_page":"42"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9890999794006348,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9890999794006348,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10466","display_name":"Meteorological Phenomena and Simulations","score":0.9736999869346619,"subfield":{"id":"https://openalex.org/subfields/1902","display_name":"Atmospheric Science"},"field":{"id":"https://openalex.org/fields/19","display_name":"Earth and Planetary Sciences"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9686999917030334,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/fortran","display_name":"Fortran","score":0.8133790493011475},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7420498728752136},{"id":"https://openalex.org/keywords/xeon","display_name":"Xeon","score":0.675452709197998},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.6592637300491333},{"id":"https://openalex.org/keywords/supercomputer","display_name":"Supercomputer","score":0.5987821817398071},{"id":"https://openalex.org/keywords/general-purpose-computing-on-graphics-processing-units","display_name":"General-purpose computing on graphics processing units","score":0.5052629113197327},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.49516454339027405},{"id":"https://openalex.org/keywords/xeon-phi","display_name":"Xeon Phi","score":0.4850987195968628},{"id":"https://openalex.org/keywords/computational-science","display_name":"Computational science","score":0.4410952627658844},{"id":"https://openalex.org/keywords/grid","display_name":"Grid","score":0.4112374186515808},{"id":"https://openalex.org/keywords/graphics","display_name":"Graphics","score":0.34655728936195374},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.1819911003112793},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.09457576274871826}],"concepts":[{"id":"https://openalex.org/C2778241615","wikidata":"https://www.wikidata.org/wiki/Q83303","display_name":"Fortran","level":2,"score":0.8133790493011475},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7420498728752136},{"id":"https://openalex.org/C145108525","wikidata":"https://www.wikidata.org/wiki/Q656154","display_name":"Xeon","level":2,"score":0.675452709197998},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6592637300491333},{"id":"https://openalex.org/C83283714","wikidata":"https://www.wikidata.org/wiki/Q121117","display_name":"Supercomputer","level":2,"score":0.5987821817398071},{"id":"https://openalex.org/C50630238","wikidata":"https://www.wikidata.org/wiki/Q971505","display_name":"General-purpose computing on graphics processing units","level":3,"score":0.5052629113197327},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.49516454339027405},{"id":"https://openalex.org/C96972482","wikidata":"https://www.wikidata.org/wiki/Q1049168","display_name":"Xeon Phi","level":2,"score":0.4850987195968628},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.4410952627658844},{"id":"https://openalex.org/C187691185","wikidata":"https://www.wikidata.org/wiki/Q2020720","display_name":"Grid","level":2,"score":0.4112374186515808},{"id":"https://openalex.org/C21442007","wikidata":"https://www.wikidata.org/wiki/Q1027879","display_name":"Graphics","level":2,"score":0.34655728936195374},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.1819911003112793},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.09457576274871826},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3291523","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3291523","pdf_url":null,"source":{"id":"https://openalex.org/S2483380313","display_name":"ACM Transactions on Parallel Computing","issn_l":"2329-4949","issn":["2329-4949","2329-4957"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Parallel Computing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320320912","display_name":"Ministry of Education, Culture, Sports, Science and Technology","ror":"https://ror.org/048rj2z13"},{"id":"https://openalex.org/F4320334764","display_name":"Japan Society for the Promotion of Science","ror":"https://ror.org/00hhkn466"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":28,"referenced_works":["https://openalex.org/W76123042","https://openalex.org/W1774469134","https://openalex.org/W1820550104","https://openalex.org/W1964192298","https://openalex.org/W1999534369","https://openalex.org/W2002555321","https://openalex.org/W2022036382","https://openalex.org/W2032371590","https://openalex.org/W2058327612","https://openalex.org/W2058489233","https://openalex.org/W2074833026","https://openalex.org/W2075238266","https://openalex.org/W2078794610","https://openalex.org/W2099911225","https://openalex.org/W2111530316","https://openalex.org/W2112043279","https://openalex.org/W2114063275","https://openalex.org/W2117677968","https://openalex.org/W2127112348","https://openalex.org/W2153689314","https://openalex.org/W2166823841","https://openalex.org/W2167728712","https://openalex.org/W2482915108","https://openalex.org/W2559823574","https://openalex.org/W2766128385","https://openalex.org/W2963219561","https://openalex.org/W3021447659","https://openalex.org/W4285719527"],"related_works":["https://openalex.org/W2739740241","https://openalex.org/W1974923383","https://openalex.org/W2085105049","https://openalex.org/W2475524688","https://openalex.org/W2148563915","https://openalex.org/W2526069705","https://openalex.org/W2024016913","https://openalex.org/W2019153376","https://openalex.org/W2981664121","https://openalex.org/W2796552083"],"abstract_inverted_index":{"We":[0],"introduce":[1],"\u201cHybrid":[2],"Fortran,\u201d":[3],"a":[4,9,25,31,52,68,83,95,125],"new":[5],"approach":[6],"that":[7,72],"allows":[8],"high-performance":[10],"GPGPU":[11,179],"port":[12,156],"for":[13,24],"structured":[14],"grid":[15,132],"Fortran":[16,78,99],"codes.":[17],"This":[18],"technique":[19],"only":[20],"requires":[21],"minimal":[22,69],"changes":[23],"CPU":[26,121],"targeted":[27],"codebase,":[28],"which":[29],"is":[30,79,101],"significant":[32],"advancement":[33],"in":[34,144],"terms":[35],"of":[36,50,63,67,181],"productivity.":[37],"It":[38],"has":[39],"been":[40],"successfully":[41],"applied":[42],"to":[43,81,103,159,176],"both":[44,82,119],"dynamical":[45],"core":[46],"and":[47,112,122,140],"physical":[48],"processes":[49],"ASUCA,":[51],"Japanese":[53],"mesoscale":[54],"weather":[55,70,142,183],"prediction":[56],"model":[57,85,118],"with":[58,116,133],"more":[59,161,177],"than":[60,110,162],"150k":[61],"lines":[62],"code.":[64],"By":[65],"means":[66],"application":[71],"resembles":[73],"ASUCA\u2019s":[74],"code":[75],"structure,":[76],"Hybrid":[77,98,153],"compared":[80],"performance":[84,109,114],"as":[86,88],"well":[87],"today\u2019s":[89],"commonly":[90],"used":[91],"method,":[92],"OpenACC.":[93],"As":[94],"result,":[96],"the":[97,105,117,152,171],"implementation":[100],"shown":[102,158],"deliver":[104],"same":[106],"or":[107],"better":[108],"OpenACC,":[111],"its":[113],"agrees":[115],"on":[120],"GPU.":[123],"In":[124],"full-scale":[126],"production":[127],"run,":[128],"using":[129],"an":[130],"ASUCA":[131],"1581":[134],"\u00d7":[135,137],"1301":[136],"58":[138],"cells":[139],"real-world":[141],"data":[143],"2km":[145],"resolution,":[146],"24":[147],"NVIDIA":[148],"Tesla":[149],"P100":[150],"running":[151,170],"Fortran\u2013based":[154],"GPU":[155],"are":[157],"replace":[160],"fifty":[163],"18-core":[164],"Intel":[165],"Xeon":[166],"Broadwell":[167],"E5-2695":[168],"v4":[169],"reference":[172],"implementation\u2014an":[173],"achievement":[174],"comparable":[175],"invasive":[178],"rewrites":[180],"other":[182],"models.":[184]},"counts_by_year":[{"year":2022,"cited_by_count":2},{"year":2018,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
