{"id":"https://openalex.org/W2519479244","doi":"https://doi.org/10.1109/hpcsim.2016.7568453","title":"Energy consumption optimization of the Total-FETI solver and BLAS routines by changing the CPU frequency","display_name":"Energy consumption optimization of the Total-FETI solver and BLAS routines by changing the CPU frequency","publication_year":2016,"publication_date":"2016-07-01","ids":{"openalex":"https://openalex.org/W2519479244","doi":"https://doi.org/10.1109/hpcsim.2016.7568453","mag":"2519479244"},"language":"en","primary_location":{"id":"doi:10.1109/hpcsim.2016.7568453","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hpcsim.2016.7568453","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 International Conference on High Performance Computing &amp; Simulation (HPCS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://hdl.handle.net/10084/117100","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5010762974","display_name":"David Hor\u00e1k","orcid":"https://orcid.org/0000-0001-8825-1944"},"institutions":[{"id":"https://openalex.org/I142208455","display_name":"VSB - Technical University of Ostrava","ror":"https://ror.org/05x8mcb75","country_code":"CZ","type":"education","lineage":["https://openalex.org/I142208455"]}],"countries":["CZ"],"is_corresponding":true,"raw_author_name":"David Horak","raw_affiliation_strings":["IT4Innovations National Supercomputing Center, VSB-Technical University of Ostrava, Ostrava, Czech Republic"],"affiliations":[{"raw_affiliation_string":"IT4Innovations National Supercomputing Center, VSB-Technical University of Ostrava, Ostrava, Czech Republic","institution_ids":["https://openalex.org/I142208455"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021447319","display_name":"Lubom\u0131\u0301r \u0158\u0131\u0301ha","orcid":"https://orcid.org/0000-0002-1017-5766"},"institutions":[{"id":"https://openalex.org/I142208455","display_name":"VSB - Technical University of Ostrava","ror":"https://ror.org/05x8mcb75","country_code":"CZ","type":"education","lineage":["https://openalex.org/I142208455"]}],"countries":["CZ"],"is_corresponding":false,"raw_author_name":"Lubomir Riha","raw_affiliation_strings":["IT4Innovations National Supercomputing Center, VSB-Technical University of Ostrava, Ostrava, Czech Republic"],"affiliations":[{"raw_affiliation_string":"IT4Innovations National Supercomputing Center, VSB-Technical University of Ostrava, Ostrava, Czech Republic","institution_ids":["https://openalex.org/I142208455"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012842917","display_name":"Radim Sojka","orcid":null},"institutions":[{"id":"https://openalex.org/I142208455","display_name":"VSB - Technical University of Ostrava","ror":"https://ror.org/05x8mcb75","country_code":"CZ","type":"education","lineage":["https://openalex.org/I142208455"]}],"countries":["CZ"],"is_corresponding":false,"raw_author_name":"Radim Sojka","raw_affiliation_strings":["IT4Innovations National Supercomputing Center, VSB-Technical University of Ostrava, Ostrava, Czech Republic"],"affiliations":[{"raw_affiliation_string":"IT4Innovations National Supercomputing Center, VSB-Technical University of Ostrava, Ostrava, Czech Republic","institution_ids":["https://openalex.org/I142208455"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052455594","display_name":"Jakub Kru\u017e\u00edk","orcid":"https://orcid.org/0000-0001-5448-837X"},"institutions":[{"id":"https://openalex.org/I142208455","display_name":"VSB - Technical University of Ostrava","ror":"https://ror.org/05x8mcb75","country_code":"CZ","type":"education","lineage":["https://openalex.org/I142208455"]}],"countries":["CZ"],"is_corresponding":false,"raw_author_name":"Jakub Kruzik","raw_affiliation_strings":["IT4Innovations National Supercomputing Center, VSB-Technical University of Ostrava, Ostrava, Czech Republic"],"affiliations":[{"raw_affiliation_string":"IT4Innovations National Supercomputing Center, VSB-Technical University of Ostrava, Ostrava, Czech Republic","institution_ids":["https://openalex.org/I142208455"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5009660331","display_name":"Martin Beseda","orcid":"https://orcid.org/0000-0001-5792-2872"},"institutions":[{"id":"https://openalex.org/I142208455","display_name":"VSB - Technical University of Ostrava","ror":"https://ror.org/05x8mcb75","country_code":"CZ","type":"education","lineage":["https://openalex.org/I142208455"]}],"countries":["CZ"],"is_corresponding":false,"raw_author_name":"Martin Beseda","raw_affiliation_strings":["IT4Innovations National Supercomputing Center, VSB-Technical University of Ostrava, Ostrava, Czech Republic"],"affiliations":[{"raw_affiliation_string":"IT4Innovations National Supercomputing Center, VSB-Technical University of Ostrava, Ostrava, Czech Republic","institution_ids":["https://openalex.org/I142208455"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5010762974"],"corresponding_institution_ids":["https://openalex.org/I142208455"],"apc_list":null,"apc_paid":null,"fwci":0.7181,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.77648828,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":"2","issue":null,"first_page":"1031","last_page":"1032"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13612","display_name":"Advanced Scientific and Engineering Studies","score":0.9914000034332275,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T13612","display_name":"Advanced Scientific and Engineering Studies","score":0.9914000034332275,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9904000163078308,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11697","display_name":"Numerical Methods and Algorithms","score":0.977400004863739,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.814399242401123},{"id":"https://openalex.org/keywords/energy-consumption","display_name":"Energy consumption","score":0.7013192772865295},{"id":"https://openalex.org/keywords/solver","display_name":"Solver","score":0.5177023410797119},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.4878706932067871},{"id":"https://openalex.org/keywords/supercomputer","display_name":"Supercomputer","score":0.4751819670200348},{"id":"https://openalex.org/keywords/xeon-phi","display_name":"Xeon Phi","score":0.42055079340934753},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.4194554090499878},{"id":"https://openalex.org/keywords/computational-science","display_name":"Computational science","score":0.40165847539901733},{"id":"https://openalex.org/keywords/electrical-engineering","display_name":"Electrical engineering","score":0.11668014526367188},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.08337301015853882}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.814399242401123},{"id":"https://openalex.org/C2780165032","wikidata":"https://www.wikidata.org/wiki/Q16869822","display_name":"Energy consumption","level":2,"score":0.7013192772865295},{"id":"https://openalex.org/C2778770139","wikidata":"https://www.wikidata.org/wiki/Q1966904","display_name":"Solver","level":2,"score":0.5177023410797119},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.4878706932067871},{"id":"https://openalex.org/C83283714","wikidata":"https://www.wikidata.org/wiki/Q121117","display_name":"Supercomputer","level":2,"score":0.4751819670200348},{"id":"https://openalex.org/C96972482","wikidata":"https://www.wikidata.org/wiki/Q1049168","display_name":"Xeon Phi","level":2,"score":0.42055079340934753},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.4194554090499878},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.40165847539901733},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.11668014526367188},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.08337301015853882},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/hpcsim.2016.7568453","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hpcsim.2016.7568453","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 International Conference on High Performance Computing &amp; Simulation (HPCS)","raw_type":"proceedings-article"},{"id":"pmh:oai:dspace.vsb.cz:10084/117100","is_oa":true,"landing_page_url":"http://hdl.handle.net/10084/117100","pdf_url":null,"source":{"id":"https://openalex.org/S4306401668","display_name":"DSpace V\u0160B-TUO (V\u0160B-TUO)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I142208455","host_organization_name":"VSB - Technical University of Ostrava","host_organization_lineage":["https://openalex.org/I142208455"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"conferenceObject"}],"best_oa_location":{"id":"pmh:oai:dspace.vsb.cz:10084/117100","is_oa":true,"landing_page_url":"http://hdl.handle.net/10084/117100","pdf_url":null,"source":{"id":"https://openalex.org/S4306401668","display_name":"DSpace V\u0160B-TUO (V\u0160B-TUO)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I142208455","host_organization_name":"VSB - Technical University of Ostrava","host_organization_lineage":["https://openalex.org/I142208455"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"conferenceObject"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/7","score":0.9100000262260437,"display_name":"Affordable and clean energy"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320321005","display_name":"Ministerstvo \u0160kolstv\u00ed, Ml\u00e1de\u017ee a T\u011blov\u00fdchovy","ror":"https://ror.org/037n8p820"},{"id":"https://openalex.org/F4320321006","display_name":"Grantov\u00e1 Agentura \u010cesk\u00e9 Republiky","ror":"https://ror.org/01pv73b02"},{"id":"https://openalex.org/F4320337144","display_name":"National Supercomputing Center, Korea Institute of Science and Technology Information","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":5,"referenced_works":["https://openalex.org/W1964847500","https://openalex.org/W2076978869","https://openalex.org/W2140639233","https://openalex.org/W2245464624","https://openalex.org/W4388319564"],"related_works":["https://openalex.org/W1582436825","https://openalex.org/W1604758548","https://openalex.org/W1996803181","https://openalex.org/W4367553810","https://openalex.org/W2104142636","https://openalex.org/W1549048322","https://openalex.org/W2804126825","https://openalex.org/W2011940952","https://openalex.org/W2731831065","https://openalex.org/W4283162424"],"abstract_inverted_index":{"The":[0,17,79,110,129,159,286,359,380,435,456,547],"energy":[1,22,37,72,157,172,192,221,283,444,483,491,553,580],"consumption":[2,23,38,73,193,222,492,554],"of":[3,7,19,40,51,75,96,102,179,186,194,216,223,228,297,387,432,482,515,555],"supercomputers":[4],"is":[5,24,60,91,246,403,418],"one":[6,271,571],"the":[8,12,36,41,71,76,83,94,97,115,165,177,184,187,191,195,207,214,220,224,229,250,260,269,278,289,328,339,345,349,362,377,401,411,416,421,426,429,433,468,475,551],"critical":[9],"problems":[10],"for":[11,64,105,150,198,333,338,344,384,484,585],"upcoming":[13],"Exascale":[14],"supercomputing":[15],"era.":[16],"awareness":[18],"power":[20,139,155],"an":[21,61,137,368],"required":[25],"on":[26,114,190,219,568],"both":[27],"software":[28],"and":[29,45,69,152,156,175,241,254,257,262,268,281,314,318,335,343,393,407,499,505,534,563],"hardware":[30],"side.":[31],"This":[32,89],"poster":[33,84,381,436],"deals":[34],"with":[35,70,86,371,496],"evaluation":[39,74],"Total-Finite":[42],"Element":[43],"Tearing":[44],"Interconnect":[46],"(TFETI)":[47],"based":[48,122,486],"solvers":[49],"[2]":[50],"linear":[52,200],"systems":[53],"implemented":[54],"in":[55,82,93,237,471],"PERMON":[56],"toolbox":[57],"[1],":[58],"which":[59,295],"established":[62],"method":[63],"solving":[65],"real-world":[66],"engineering":[67],"problems,":[68],"BLAS":[77,501,556],"routines.":[78,507],"experiments":[80],"performed":[81,92,113],"deal":[85],"CPU":[87,188,450],"frequency.":[88],"work":[90],"scope":[95],"READEX":[98],"project":[99],"(Runtime":[100],"Exploitation":[101],"Application":[103],"Dynamism":[104],"Energy-efficient":[106],"eXascale":[107],"computing)":[108],"[6].":[109],"measurements":[111,160,173],"were":[112,494],"Intel":[116,541],"Xeon":[117],"E5-2680":[118],"(Intel":[119],"Haswell":[120],"micro-architecture)":[121],"Taurus":[123],"system":[124,130,427],"installed":[125],"at":[126],"TU":[127],"Dresden.":[128],"contains":[131],"over":[132],"1400":[133],"nodes":[134],"that":[135,148,438],"have":[136,182,212,511,523],"FPGA-based":[138],"instrumentation":[140],"called":[141],"HDEEM":[142,166],"(High":[143],"Definition":[144],"Energy":[145],"Efficiency":[146],"Monitoring),":[147],"allows":[149],"fine-grained":[151],"more":[153,586],"accurate":[154],"measurements.":[158],"can":[161,572],"be":[162],"accessed":[163],"through":[164],"library,":[167],"allowing":[168],"developers":[169],"to":[170,248,258,272,277,326,424,428,448,464,477,480,577,583],"take":[171],"before":[174,405],"after":[176],"region":[178],"interest.":[180],"We":[181,522],"evaluated":[183,213],"effect":[185,215],"frequency":[189,217,388,402,417,575],"TFETI":[196,230,238,485],"solver":[197,330],"a":[199,513],"elasticity":[201],"3D":[202],"cube":[203],"synthetic":[204],"benchmark.":[205],"On":[206],"dualized":[208],"problem":[209,347],"MPFX=MPd,":[210],"we":[211,324,510],"tuning":[218,392,399,440,458],"essential":[225],"processing":[226],"kernels":[227],"method.":[231],"There":[232],"are":[233,561,565],"two":[234,385],"main":[235],"phases":[236],"-":[239],"preprocessing":[240,244],"solve.":[242],"In":[243,321,466],"it":[245,256],"necessary":[247],"regularize":[249],"stiffness":[251],"matrix":[252,366],"K":[253],"factorize":[255],"assemble":[259],"G":[261],"GG":[263],"<sup":[264,351,355],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[265,306,311,352,356],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">T</sup>":[266,353],"matrices":[267,516],"second":[270],"factorize.":[273],"Both":[274],"operations":[275,560],"belong":[276],"most":[279],"time":[280],"also":[282],"consuming":[284],"operations.":[285],"solve":[287],"employs":[288],"Preconditioned":[290],"Conjugate":[291],"Gradient":[292],"(PCG)":[293],"algorithm,":[294],"consists":[296],"sparse":[298],"matrix-vector":[299],"multiplications":[300],"(by":[301],"F,":[302],"P,":[303],"M":[304,309],"<sub":[305,310],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">L</sub>":[307],",":[308],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">D</sub>":[312],"matrices)":[313],"vector":[315],"dot":[316],"products":[317],"AXPY":[319],"functions.":[320],"each":[322],"iteration,":[323],"need":[325],"apply":[327],"direct":[329],"twice,":[331],"i.e.,":[332],"forward":[334],"backward":[336],"solves":[337],"pseudoinverse":[340],"K+":[341],"action":[342],"coarse":[346],"solution,":[348],"(GG":[350],")":[354],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">-1</sup>":[357],"action.":[358],"multiplication":[360,538],"by":[361,462],"dense":[363],"Schur":[364],"complement":[365],"adds":[367],"additional":[369],"operator":[370],"different":[372,552],"computational":[373],"characteristics,":[374],"potentially":[375],"increasing":[376],"exploitable":[378],"dynamism.":[379],"provides":[382],"results":[383],"types":[386],"tuning:":[389],"(1)":[390],"static":[391,398,439],"(2)":[394],"dynamic":[395,414,457,574],"tuning.":[396],"For":[397,413,508],"experiments,":[400],"set":[404,514],"execution":[406,423],"kept":[408],"constant":[409],"during":[410,420],"runtime.":[412],"tuning,":[415],"changed":[419],"program":[422],"adapt":[425],"actual":[430],"needs":[431],"application.":[434],"shows":[437,474],"brings":[441],"up":[442,463,479,582],"11.84%":[443],"savings":[445,581],"when":[446],"compared":[447],"default":[449],"settings":[451],"(the":[452],"highest":[453],"clock":[454],"rate).":[455],"improves":[459],"this":[460,472],"further":[461],"2.68%.":[465],"total,":[467],"approach":[469],"presented":[470],"paper":[473],"potential":[476],"save":[478],"14.52%":[481],"solvers,":[487],"see":[488,588],"Table1.":[489],"Another":[490],"evaluations":[493],"done":[495],"selected":[497],"Sparse":[498,526,528,535],"Dense":[500,530,532],"Level":[502],"1,":[503],"2":[504],"3":[506],"benchmarking":[509],"used":[512],"from":[517,540],"University":[518],"Florida":[519],"collection":[520],"[4].":[521],"employed":[524],"AXPY,":[525],"Matrix-Vector,":[527,531],"MatrixMatrix,":[529],"Matrix-Matrix":[533],"Matrix-Dense":[536],"Matrix":[537],"routines":[539],"Math":[542],"Kernel":[543],"Library":[544],"(MKL)":[545],"[3].":[546],"measured":[548],"characteristics":[549],"illustrate":[550],"routines,":[557],"as":[558],"some":[559],"memory-bounded":[562],"others":[564],"compute-bounded.":[566],"Based":[567],"our":[569],"recommendations":[570],"explore":[573],"switching":[576],"achieve":[578],"significant":[579],"23%,":[584],"details":[587],"Table":[589],"2.":[590]},"counts_by_year":[{"year":2021,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2017,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
