{"id":"https://openalex.org/W4223535258","doi":"https://doi.org/10.1007/s11227-022-04473-9","title":"Investigating the effect of varying block size on power and energy consumption of GPU kernels","display_name":"Investigating the effect of varying block size on power and energy consumption of GPU kernels","publication_year":2022,"publication_date":"2022-04-10","ids":{"openalex":"https://openalex.org/W4223535258","doi":"https://doi.org/10.1007/s11227-022-04473-9"},"language":"en","primary_location":{"id":"doi:10.1007/s11227-022-04473-9","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s11227-022-04473-9","pdf_url":"https://link.springer.com/content/pdf/10.1007/s11227-022-04473-9.pdf","source":{"id":"https://openalex.org/S32326811","display_name":"The Journal of Supercomputing","issn_l":"0920-8542","issn":["0920-8542","1573-0484"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The Journal of Supercomputing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/s11227-022-04473-9.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5023977723","display_name":"Muhammad Jawad Ikram","orcid":"https://orcid.org/0000-0001-9340-9777"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Muhammad Jawad Ikram","raw_affiliation_strings":["Jeddah International College, Jeddah, 23831, Saudi Arabia"],"affiliations":[{"raw_affiliation_string":"Jeddah International College, Jeddah, 23831, Saudi Arabia","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111390714","display_name":"Mostafa Elsayed Saleh","orcid":null},"institutions":[{"id":"https://openalex.org/I185163786","display_name":"King Abdulaziz University","ror":"https://ror.org/02ma4wv74","country_code":"SA","type":"education","lineage":["https://openalex.org/I185163786"]}],"countries":["SA"],"is_corresponding":false,"raw_author_name":"Mostafa Elsayed Saleh","raw_affiliation_strings":["King Abdulaziz University, Jeddah, 21589, Saudi Arabia"],"affiliations":[{"raw_affiliation_string":"King Abdulaziz University, Jeddah, 21589, Saudi Arabia","institution_ids":["https://openalex.org/I185163786"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054076510","display_name":"Muhammad Al-Hashimi","orcid":null},"institutions":[{"id":"https://openalex.org/I185163786","display_name":"King Abdulaziz University","ror":"https://ror.org/02ma4wv74","country_code":"SA","type":"education","lineage":["https://openalex.org/I185163786"]}],"countries":["SA"],"is_corresponding":false,"raw_author_name":"Muhammad Abdulhamid Al-Hashimi","raw_affiliation_strings":["King Abdulaziz University, Jeddah, 21589, Saudi Arabia"],"affiliations":[{"raw_affiliation_string":"King Abdulaziz University, Jeddah, 21589, Saudi Arabia","institution_ids":["https://openalex.org/I185163786"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5009812781","display_name":"Osama Ahmed Abulnaja","orcid":"https://orcid.org/0000-0003-3431-6890"},"institutions":[{"id":"https://openalex.org/I185163786","display_name":"King Abdulaziz University","ror":"https://ror.org/02ma4wv74","country_code":"SA","type":"education","lineage":["https://openalex.org/I185163786"]}],"countries":["SA"],"is_corresponding":false,"raw_author_name":"Osama Ahmed Abulnaja","raw_affiliation_strings":["King Abdulaziz University, Jeddah, 21589, Saudi Arabia"],"affiliations":[{"raw_affiliation_string":"King Abdulaziz University, Jeddah, 21589, Saudi Arabia","institution_ids":["https://openalex.org/I185163786"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5023977723"],"corresponding_institution_ids":[],"apc_list":{"value":2390,"currency":"EUR","value_usd":2990},"apc_paid":{"value":2390,"currency":"EUR","value_usd":2990},"fwci":1.4004,"has_fulltext":true,"cited_by_count":6,"citation_normalized_percentile":{"value":0.7884719,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":"78","issue":"13","first_page":"14919","last_page":"14939"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9955000281333923,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9944000244140625,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8929965496063232},{"id":"https://openalex.org/keywords/exascale-computing","display_name":"Exascale computing","score":0.6566565036773682},{"id":"https://openalex.org/keywords/block","display_name":"Block (permutation group theory)","score":0.6521451473236084},{"id":"https://openalex.org/keywords/efficient-energy-use","display_name":"Efficient energy use","score":0.6185050010681152},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6099605560302734},{"id":"https://openalex.org/keywords/energy-consumption","display_name":"Energy consumption","score":0.6058525443077087},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.5731731057167053},{"id":"https://openalex.org/keywords/kernel","display_name":"Kernel (algebra)","score":0.46997660398483276},{"id":"https://openalex.org/keywords/power-consumption","display_name":"Power consumption","score":0.46747586131095886},{"id":"https://openalex.org/keywords/power","display_name":"Power (physics)","score":0.463125079870224},{"id":"https://openalex.org/keywords/block-size","display_name":"Block size","score":0.46279263496398926},{"id":"https://openalex.org/keywords/general-purpose-computing-on-graphics-processing-units","display_name":"General-purpose computing on graphics processing units","score":0.4450989365577698},{"id":"https://openalex.org/keywords/graphics-processing-unit","display_name":"Graphics processing unit","score":0.4262595772743225},{"id":"https://openalex.org/keywords/graphics","display_name":"Graphics","score":0.3749004602432251},{"id":"https://openalex.org/keywords/supercomputer","display_name":"Supercomputer","score":0.27003049850463867},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.12238302826881409},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.06724774837493896}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8929965496063232},{"id":"https://openalex.org/C2778837361","wikidata":"https://www.wikidata.org/wiki/Q2450880","display_name":"Exascale computing","level":3,"score":0.6566565036773682},{"id":"https://openalex.org/C2777210771","wikidata":"https://www.wikidata.org/wiki/Q4927124","display_name":"Block (permutation group theory)","level":2,"score":0.6521451473236084},{"id":"https://openalex.org/C2742236","wikidata":"https://www.wikidata.org/wiki/Q924713","display_name":"Efficient energy use","level":2,"score":0.6185050010681152},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6099605560302734},{"id":"https://openalex.org/C2780165032","wikidata":"https://www.wikidata.org/wiki/Q16869822","display_name":"Energy consumption","level":2,"score":0.6058525443077087},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.5731731057167053},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.46997660398483276},{"id":"https://openalex.org/C2984118289","wikidata":"https://www.wikidata.org/wiki/Q29954","display_name":"Power consumption","level":3,"score":0.46747586131095886},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.463125079870224},{"id":"https://openalex.org/C41431624","wikidata":"https://www.wikidata.org/wiki/Q1053357","display_name":"Block size","level":3,"score":0.46279263496398926},{"id":"https://openalex.org/C50630238","wikidata":"https://www.wikidata.org/wiki/Q971505","display_name":"General-purpose computing on graphics processing units","level":3,"score":0.4450989365577698},{"id":"https://openalex.org/C2779851693","wikidata":"https://www.wikidata.org/wiki/Q183484","display_name":"Graphics processing unit","level":2,"score":0.4262595772743225},{"id":"https://openalex.org/C21442007","wikidata":"https://www.wikidata.org/wiki/Q1027879","display_name":"Graphics","level":2,"score":0.3749004602432251},{"id":"https://openalex.org/C83283714","wikidata":"https://www.wikidata.org/wiki/Q121117","display_name":"Supercomputer","level":2,"score":0.27003049850463867},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.12238302826881409},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.06724774837493896},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0},{"id":"https://openalex.org/C18903297","wikidata":"https://www.wikidata.org/wiki/Q7150","display_name":"Ecology","level":1,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/s11227-022-04473-9","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s11227-022-04473-9","pdf_url":"https://link.springer.com/content/pdf/10.1007/s11227-022-04473-9.pdf","source":{"id":"https://openalex.org/S32326811","display_name":"The Journal of Supercomputing","issn_l":"0920-8542","issn":["0920-8542","1573-0484"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The Journal of Supercomputing","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1007/s11227-022-04473-9","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s11227-022-04473-9","pdf_url":"https://link.springer.com/content/pdf/10.1007/s11227-022-04473-9.pdf","source":{"id":"https://openalex.org/S32326811","display_name":"The Journal of Supercomputing","issn_l":"0920-8542","issn":["0920-8542","1573-0484"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The Journal of Supercomputing","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.9100000262260437,"display_name":"Affordable and clean energy","id":"https://metadata.un.org/sdg/7"}],"awards":[{"id":"https://openalex.org/G3396093235","display_name":null,"funder_award_id":"1-611-1433/HiCi","funder_id":"https://openalex.org/F4320322322","funder_display_name":"King Abdulaziz University"},{"id":"https://openalex.org/G6371580928","display_name":null,"funder_award_id":"1-611-1433/HiCi.","funder_id":"https://openalex.org/F4320335726","funder_display_name":"Deanship of Scientific Research, King Saud University"}],"funders":[{"id":"https://openalex.org/F4320322322","display_name":"King Abdulaziz University","ror":"https://ror.org/02ma4wv74"},{"id":"https://openalex.org/F4320335726","display_name":"Deanship of Scientific Research, King Saud University","ror":null}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4223535258.pdf","grobid_xml":"https://content.openalex.org/works/W4223535258.grobid-xml"},"referenced_works_count":38,"referenced_works":["https://openalex.org/W1549218039","https://openalex.org/W1859126261","https://openalex.org/W1978969737","https://openalex.org/W2014555481","https://openalex.org/W2029822446","https://openalex.org/W2034140701","https://openalex.org/W2038122178","https://openalex.org/W2043083835","https://openalex.org/W2045231673","https://openalex.org/W2066804546","https://openalex.org/W2078237010","https://openalex.org/W2081871260","https://openalex.org/W2083117011","https://openalex.org/W2091543319","https://openalex.org/W2095909712","https://openalex.org/W2102074146","https://openalex.org/W2106938618","https://openalex.org/W2122297544","https://openalex.org/W2135120170","https://openalex.org/W2141389982","https://openalex.org/W2144293278","https://openalex.org/W2149921618","https://openalex.org/W2282141805","https://openalex.org/W2479666647","https://openalex.org/W2522820499","https://openalex.org/W2609709374","https://openalex.org/W2727655179","https://openalex.org/W2743822064","https://openalex.org/W2792743882","https://openalex.org/W2886926031","https://openalex.org/W2903597723","https://openalex.org/W2936165747","https://openalex.org/W2972074918","https://openalex.org/W3007482080","https://openalex.org/W3081880813","https://openalex.org/W3134760666","https://openalex.org/W3206283723","https://openalex.org/W4239291609"],"related_works":["https://openalex.org/W2151046618","https://openalex.org/W1972148443","https://openalex.org/W1969233021","https://openalex.org/W2167646277","https://openalex.org/W2063573318","https://openalex.org/W2388314963","https://openalex.org/W3158047141","https://openalex.org/W1656096860","https://openalex.org/W2027443981","https://openalex.org/W151175334"],"abstract_inverted_index":{"Abstract":[0],"Power":[1],"consumption":[2],"is":[3],"likely":[4],"to":[5,33,121],"remain":[6],"a":[7,41,50,114],"significant":[8],"concern":[9],"for":[10,29,140],"exascale":[11,30,142],"performance":[12,36],"in":[13,82,144],"the":[14,60,79,83,97,103,123],"foreseeable":[15],"future.":[16],"In":[17,40,64],"addition,":[18],"graphics":[19],"processing":[20],"units":[21],"(GPUs)":[22],"have":[23],"become":[24],"an":[25],"accepted":[26],"architectural":[27],"feature":[28],"computing":[31],"due":[32],"their":[34],"scalable":[35],"and":[37,55,75,117,132,148],"power":[38,54,74,131,147],"efficiency.":[39,150],"recent":[42],"study,":[43],"we":[44,47,67,70,90],"found":[45],"that":[46,69,89],"can":[48,71],"achieve":[49],"reasonable":[51],"amount":[52],"of":[53,62,125,146],"energy":[56,76,133,149],"savings":[57,94],"based":[58],"on":[59,109,129],"selection":[61],"algorithms.":[63],"this":[65],"research,":[66],"suggest":[68],"save":[72],"more":[73,93],"by":[77,95],"varying":[78,126],"block":[80,99,127],"size":[81,100],"kernel":[84],"configuration":[85],".":[86],"We":[87,105],"show":[88],"may":[91],"attain":[92],"selecting":[96],"optimum":[98],"while":[101],"executing":[102],"workload.":[104],"investigated":[106],"two":[107],"kernels":[108],"NVIDIA":[110],"Tesla":[111],"K40":[112],"GPU,":[113],"Bitonic":[115],"Mergesort":[116],"Vector":[118],"Addition":[119],"kernels,":[120],"study":[122,136],"effect":[124],"sizes":[128],"GPU":[130],"consumption.":[134],"The":[135],"should":[137],"offer":[138],"insights":[139],"upcoming":[141],"systems":[143],"terms":[145]},"counts_by_year":[{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":1}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
