{"id":"https://openalex.org/W2508492666","doi":"https://doi.org/10.1109/tpds.2016.2599527","title":"Model-Based Optimization of EULAG Kernel on Intel Xeon Phi Through Load Imbalancing","display_name":"Model-Based Optimization of EULAG Kernel on Intel Xeon Phi Through Load Imbalancing","publication_year":2016,"publication_date":"2016-08-11","ids":{"openalex":"https://openalex.org/W2508492666","doi":"https://doi.org/10.1109/tpds.2016.2599527","mag":"2508492666"},"language":"en","primary_location":{"id":"doi:10.1109/tpds.2016.2599527","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpds.2016.2599527","pdf_url":null,"source":{"id":"https://openalex.org/S97130795","display_name":"IEEE Transactions on Parallel and Distributed Systems","issn_l":"1045-9219","issn":["1045-9219","1558-2183","2161-9883"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Parallel and Distributed Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5084068586","display_name":"Alexey Lastovetsky","orcid":"https://orcid.org/0000-0001-9460-3897"},"institutions":[{"id":"https://openalex.org/I100930933","display_name":"University College Dublin","ror":"https://ror.org/05m7pjf47","country_code":"IE","type":"education","lineage":["https://openalex.org/I100930933"]}],"countries":["IE"],"is_corresponding":true,"raw_author_name":"Alexey Lastovetsky","raw_affiliation_strings":["School of Computer Science, University College Dublin, Belfield, Dublin 4, Ireland"],"affiliations":[{"raw_affiliation_string":"School of Computer Science, University College Dublin, Belfield, Dublin 4, Ireland","institution_ids":["https://openalex.org/I100930933"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033643387","display_name":"\u0141ukasz Szustak","orcid":"https://orcid.org/0000-0001-7429-6981"},"institutions":[{"id":"https://openalex.org/I130294970","display_name":"Cz\u0119stochowa University of Technology","ror":"https://ror.org/046awyn59","country_code":"PL","type":"education","lineage":["https://openalex.org/I130294970"]}],"countries":["PL"],"is_corresponding":false,"raw_author_name":"Lukasz Szustak","raw_affiliation_strings":["Czestochowa University of Technology, Dabrowskiego 69, Czestochowa, Poland"],"affiliations":[{"raw_affiliation_string":"Czestochowa University of Technology, Dabrowskiego 69, Czestochowa, Poland","institution_ids":["https://openalex.org/I130294970"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5001502834","display_name":"Roman Wyrzykowski","orcid":"https://orcid.org/0000-0003-0328-2034"},"institutions":[{"id":"https://openalex.org/I130294970","display_name":"Cz\u0119stochowa University of Technology","ror":"https://ror.org/046awyn59","country_code":"PL","type":"education","lineage":["https://openalex.org/I130294970"]}],"countries":["PL"],"is_corresponding":false,"raw_author_name":"Roman Wyrzykowski","raw_affiliation_strings":["Czestochowa University of Technology, Dabrowskiego 69, Czestochowa, Poland"],"affiliations":[{"raw_affiliation_string":"Czestochowa University of Technology, Dabrowskiego 69, Czestochowa, Poland","institution_ids":["https://openalex.org/I130294970"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5084068586"],"corresponding_institution_ids":["https://openalex.org/I100930933"],"apc_list":null,"apc_paid":null,"fwci":8.1987,"has_fulltext":false,"cited_by_count":42,"citation_normalized_percentile":{"value":0.98222682,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":100},"biblio":{"volume":"28","issue":"3","first_page":"787","last_page":"797"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10715","display_name":"Distributed and Parallel Computing Systems","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8692834377288818},{"id":"https://openalex.org/keywords/xeon-phi","display_name":"Xeon Phi","score":0.8052355647087097},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.7342981696128845},{"id":"https://openalex.org/keywords/load-balancing","display_name":"Load balancing (electrical power)","score":0.5969763994216919},{"id":"https://openalex.org/keywords/kernel","display_name":"Kernel (algebra)","score":0.5568340420722961},{"id":"https://openalex.org/keywords/synchronization","display_name":"Synchronization (alternating current)","score":0.5149484276771545},{"id":"https://openalex.org/keywords/xeon","display_name":"Xeon","score":0.49324434995651245},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.4332638382911682},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.1673029065132141},{"id":"https://openalex.org/keywords/grid","display_name":"Grid","score":0.15893927216529846}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8692834377288818},{"id":"https://openalex.org/C96972482","wikidata":"https://www.wikidata.org/wiki/Q1049168","display_name":"Xeon Phi","level":2,"score":0.8052355647087097},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.7342981696128845},{"id":"https://openalex.org/C138959212","wikidata":"https://www.wikidata.org/wiki/Q1806783","display_name":"Load balancing (electrical power)","level":3,"score":0.5969763994216919},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.5568340420722961},{"id":"https://openalex.org/C2778562939","wikidata":"https://www.wikidata.org/wiki/Q1298791","display_name":"Synchronization (alternating current)","level":3,"score":0.5149484276771545},{"id":"https://openalex.org/C145108525","wikidata":"https://www.wikidata.org/wiki/Q656154","display_name":"Xeon","level":2,"score":0.49324434995651245},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.4332638382911682},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.1673029065132141},{"id":"https://openalex.org/C187691185","wikidata":"https://www.wikidata.org/wiki/Q2020720","display_name":"Grid","level":2,"score":0.15893927216529846},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tpds.2016.2599527","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpds.2016.2599527","pdf_url":null,"source":{"id":"https://openalex.org/S97130795","display_name":"IEEE Transactions on Parallel and Distributed Systems","issn_l":"1045-9219","issn":["1045-9219","1558-2183","2161-9883"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Parallel and Distributed Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1766076957","display_name":null,"funder_award_id":"14/IA/2474","funder_id":"https://openalex.org/F4320320847","funder_display_name":"Science Foundation Ireland"},{"id":"https://openalex.org/G2305785772","display_name":null,"funder_award_id":"UMO-2015/17/D/ST6/04059","funder_id":"https://openalex.org/F4320322511","funder_display_name":"Narodowe Centrum Nauki"},{"id":"https://openalex.org/G4455644330","display_name":null,"funder_award_id":"IC1305","funder_id":"https://openalex.org/F4320320366","funder_display_name":"European Cooperation in Science and Technology"},{"id":"https://openalex.org/G7539838387","display_name":null,"funder_award_id":"UMO-2011/03/B/ST6/03500","funder_id":"https://openalex.org/F4320322511","funder_display_name":"Narodowe Centrum Nauki"}],"funders":[{"id":"https://openalex.org/F4320320366","display_name":"European Cooperation in Science and Technology","ror":"https://ror.org/01bstzn19"},{"id":"https://openalex.org/F4320320847","display_name":"Science Foundation Ireland","ror":"https://ror.org/0271asj38"},{"id":"https://openalex.org/F4320322511","display_name":"Narodowe Centrum Nauki","ror":"https://ror.org/03ha2q922"},{"id":"https://openalex.org/F4320322691","display_name":"Politechnika Czestochowska","ror":"https://ror.org/046awyn59"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":56,"referenced_works":["https://openalex.org/W289665274","https://openalex.org/W1522241184","https://openalex.org/W1528000468","https://openalex.org/W1573276610","https://openalex.org/W1650934639","https://openalex.org/W1794165208","https://openalex.org/W1795008753","https://openalex.org/W1865195249","https://openalex.org/W1908022351","https://openalex.org/W1972883104","https://openalex.org/W1972922682","https://openalex.org/W1992326621","https://openalex.org/W1997147891","https://openalex.org/W2003094427","https://openalex.org/W2028798345","https://openalex.org/W2032906028","https://openalex.org/W2037274813","https://openalex.org/W2040015943","https://openalex.org/W2067052471","https://openalex.org/W2075022716","https://openalex.org/W2081422957","https://openalex.org/W2093326633","https://openalex.org/W2102624126","https://openalex.org/W2109426995","https://openalex.org/W2113119840","https://openalex.org/W2116367043","https://openalex.org/W2119042753","https://openalex.org/W2122570236","https://openalex.org/W2122619936","https://openalex.org/W2123031400","https://openalex.org/W2125980577","https://openalex.org/W2142421493","https://openalex.org/W2150476673","https://openalex.org/W2152509970","https://openalex.org/W2154786353","https://openalex.org/W2154790372","https://openalex.org/W2170611190","https://openalex.org/W2171473263","https://openalex.org/W2278129015","https://openalex.org/W2286735113","https://openalex.org/W2397581384","https://openalex.org/W2397644582","https://openalex.org/W2401335561","https://openalex.org/W2964101311","https://openalex.org/W3099022356","https://openalex.org/W3137957122","https://openalex.org/W3152199537","https://openalex.org/W4244789640","https://openalex.org/W4249968602","https://openalex.org/W4256084543","https://openalex.org/W4294628664","https://openalex.org/W6676762588","https://openalex.org/W6684857869","https://openalex.org/W6695135304","https://openalex.org/W6712610075","https://openalex.org/W6842480490"],"related_works":["https://openalex.org/W1974923383","https://openalex.org/W2475524688","https://openalex.org/W2739740241","https://openalex.org/W2085105049","https://openalex.org/W2526069705","https://openalex.org/W2024016913","https://openalex.org/W2019153376","https://openalex.org/W2981664121","https://openalex.org/W2796552083","https://openalex.org/W2949197156"],"abstract_inverted_index":{"Load":[0],"balancing":[1],"is":[2],"a":[3,90,104,122],"widely":[4],"accepted":[5],"technique":[6],"for":[7,76],"performance":[8,55,69,83,101,125,144,182],"optimization":[9,52,126,170],"of":[10,28,38,47,53,56,71,124,127,136,146,163,171,183],"scientific":[11,92,128],"applications":[12,18,129],"on":[13,24,103,117,173],"parallel":[14,57,106,138],"architectures.":[15],"Indeed,":[16],"balanced":[17],"do":[19],"not":[20,158],"waste":[21],"processor":[22],"cycles":[23],"waiting":[25],"at":[26],"points":[27],"synchronization":[29],"and":[30],"data":[31,137],"exchange,":[32],"maximizing":[33],"this":[34,41,118,167,184],"way":[35],"the":[36,45,48,54,68,77,134,140,147,161,181,196],"utilization":[37],"processors.":[39,164],"In":[40,133],"paper,":[42],"we":[43,60,88,120],"challenge":[44],"universality":[46],"load-balancing":[49],"approach":[50],"to":[51,79,97,149,169],"applications.":[58],"First,":[59],"formulate":[61],"conditions":[62],"that":[63,99,152,180],"should":[64],"be":[65,190],"satisfied":[66],"by":[67,193],"profile":[70,102],"an":[72],"application":[73,78,148,188],"in":[74],"order":[75],"achieve":[80],"its":[81,100,154],"best":[82],"via":[84],"load":[85,131,162],"balancing.":[86],"Then":[87],"use":[89],"real-life":[91],"application,":[93,139],"EULAG":[94],"MPDATA":[95,172],"kernel,":[96],"demonstrate":[98,179],"modern":[105],"architecture,":[107],"Intel":[108,174],"Xeon":[109,175],"Phi,":[110],"significantly":[111],"deviates":[112],"from":[113],"these":[114],"conditions.":[115],"Based":[116],"observation,":[119],"propose":[121],"method":[123,141,168],"through":[130],"imbalancing.":[132],"case":[135],"uses":[142],"functional":[143],"models":[145],"find":[150],"partitioning":[151],"minimizes":[153],"computation":[155],"time":[156],"but":[157],"necessarily":[159],"balances":[160],"We":[165],"apply":[166],"Phi.":[176],"Experimental":[177],"results":[178],"carefully":[185],"optimized":[186],"load-balanced":[187],"can":[189],"further":[191],"improved":[192],"15percent":[194],"using":[195],"proposed":[197],"load-imbalancing":[198],"technique.":[199]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":4},{"year":2020,"cited_by_count":8},{"year":2019,"cited_by_count":7},{"year":2018,"cited_by_count":15},{"year":2017,"cited_by_count":3},{"year":2016,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
