{"id":"https://openalex.org/W2170507620","doi":"https://doi.org/10.1002/cpe.3248","title":"Initial results on computational performance of Intel many integrated core, sandy bridge, and graphical processing unit architectures: implementation of a 1D c++/OpenMP electrostatic particle\u2010in\u2010cell code","display_name":"Initial results on computational performance of Intel many integrated core, sandy bridge, and graphical processing unit architectures: implementation of a 1D c++/OpenMP electrostatic particle\u2010in\u2010cell code","publication_year":2014,"publication_date":"2014-03-06","ids":{"openalex":"https://openalex.org/W2170507620","doi":"https://doi.org/10.1002/cpe.3248","mag":"2170507620"},"language":"en","primary_location":{"id":"doi:10.1002/cpe.3248","is_oa":false,"landing_page_url":"https://doi.org/10.1002/cpe.3248","pdf_url":null,"source":{"id":"https://openalex.org/S11065456","display_name":"Concurrency and Computation Practice and Experience","issn_l":"1532-0626","issn":["1532-0626","1532-0634"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320595","host_organization_name":"Wiley","host_organization_lineage":["https://openalex.org/P4310320595"],"host_organization_lineage_names":["Wiley"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Concurrency and Computation: Practice and Experience","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5041579136","display_name":"A. Vapirev","orcid":null},"institutions":[{"id":"https://openalex.org/I99464096","display_name":"KU Leuven","ror":"https://ror.org/05f950310","country_code":"BE","type":"education","lineage":["https://openalex.org/I99464096"]},{"id":"https://openalex.org/I4210116480","display_name":"Flanders Make (Belgium)","ror":"https://ror.org/02ndjfz59","country_code":"BE","type":"company","lineage":["https://openalex.org/I4210116480"]}],"countries":["BE"],"is_corresponding":true,"raw_author_name":"A. Vapirev","raw_affiliation_strings":["Department of Mathematics KU Leuven  Celestijnenlaan 200b bus 2400 Heverlee 3001 Belgium","Intel ExaScience Lab  Kapeldreef 75 B\u20103001 Leuven Belgium","Department of Mathematics, KU Leuven, Celestijnenlaan 200b bus 2400, Heverlee 3001, Belgium","Intel ExaScience Lab, Kapeldreef 75, B-3001 Leuven, Belgium"],"affiliations":[{"raw_affiliation_string":"Department of Mathematics KU Leuven  Celestijnenlaan 200b bus 2400 Heverlee 3001 Belgium","institution_ids":["https://openalex.org/I99464096","https://openalex.org/I4210116480"]},{"raw_affiliation_string":"Intel ExaScience Lab  Kapeldreef 75 B\u20103001 Leuven Belgium","institution_ids":["https://openalex.org/I99464096"]},{"raw_affiliation_string":"Department of Mathematics, KU Leuven, Celestijnenlaan 200b bus 2400, Heverlee 3001, Belgium","institution_ids":["https://openalex.org/I99464096"]},{"raw_affiliation_string":"Intel ExaScience Lab, Kapeldreef 75, B-3001 Leuven, Belgium","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087550900","display_name":"Jan Deca","orcid":"https://orcid.org/0000-0002-2272-9818"},"institutions":[{"id":"https://openalex.org/I4210116480","display_name":"Flanders Make (Belgium)","ror":"https://ror.org/02ndjfz59","country_code":"BE","type":"company","lineage":["https://openalex.org/I4210116480"]},{"id":"https://openalex.org/I99464096","display_name":"KU Leuven","ror":"https://ror.org/05f950310","country_code":"BE","type":"education","lineage":["https://openalex.org/I99464096"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"J. Deca","raw_affiliation_strings":["Department of Mathematics KU Leuven  Celestijnenlaan 200b bus 2400 Heverlee 3001 Belgium","Department of Mathematics, KU Leuven, Celestijnenlaan 200b bus 2400, Heverlee 3001, Belgium"],"affiliations":[{"raw_affiliation_string":"Department of Mathematics KU Leuven  Celestijnenlaan 200b bus 2400 Heverlee 3001 Belgium","institution_ids":["https://openalex.org/I99464096","https://openalex.org/I4210116480"]},{"raw_affiliation_string":"Department of Mathematics, KU Leuven, Celestijnenlaan 200b bus 2400, Heverlee 3001, Belgium","institution_ids":["https://openalex.org/I99464096"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065740298","display_name":"Giovanni Lapenta","orcid":"https://orcid.org/0000-0002-3123-4024"},"institutions":[{"id":"https://openalex.org/I4210116480","display_name":"Flanders Make (Belgium)","ror":"https://ror.org/02ndjfz59","country_code":"BE","type":"company","lineage":["https://openalex.org/I4210116480"]},{"id":"https://openalex.org/I99464096","display_name":"KU Leuven","ror":"https://ror.org/05f950310","country_code":"BE","type":"education","lineage":["https://openalex.org/I99464096"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"G. Lapenta","raw_affiliation_strings":["Department of Mathematics KU Leuven  Celestijnenlaan 200b bus 2400 Heverlee 3001 Belgium","Department of Mathematics, KU Leuven, Celestijnenlaan 200b bus 2400, Heverlee 3001, Belgium"],"affiliations":[{"raw_affiliation_string":"Department of Mathematics KU Leuven  Celestijnenlaan 200b bus 2400 Heverlee 3001 Belgium","institution_ids":["https://openalex.org/I99464096","https://openalex.org/I4210116480"]},{"raw_affiliation_string":"Department of Mathematics, KU Leuven, Celestijnenlaan 200b bus 2400, Heverlee 3001, Belgium","institution_ids":["https://openalex.org/I99464096"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085178088","display_name":"Stefano Markidis","orcid":"https://orcid.org/0000-0003-0639-0639"},"institutions":[{"id":"https://openalex.org/I86987016","display_name":"KTH Royal Institute of Technology","ror":"https://ror.org/026vcq606","country_code":"SE","type":"education","lineage":["https://openalex.org/I86987016"]}],"countries":["SE"],"is_corresponding":false,"raw_author_name":"S. Markidis","raw_affiliation_strings":["PDC Centre, KTH Royal Institute of Technology  Stockholm Sweden","PDC Centre, KTH Royal Institute of Technology, Stockholm, Sweden"],"affiliations":[{"raw_affiliation_string":"PDC Centre, KTH Royal Institute of Technology  Stockholm Sweden","institution_ids":["https://openalex.org/I86987016"]},{"raw_affiliation_string":"PDC Centre, KTH Royal Institute of Technology, Stockholm, Sweden","institution_ids":["https://openalex.org/I86987016"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047397553","display_name":"Ibrahim Hur","orcid":"https://orcid.org/0009-0003-8375-3963"},"institutions":[{"id":"https://openalex.org/I99464096","display_name":"KU Leuven","ror":"https://ror.org/05f950310","country_code":"BE","type":"education","lineage":["https://openalex.org/I99464096"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"I. Hur","raw_affiliation_strings":["Intel ExaScience Lab  Kapeldreef 75 B\u20103001 Leuven Belgium","Intel ExaScience Lab, Kapeldreef 75, B-3001 Leuven, Belgium"],"affiliations":[{"raw_affiliation_string":"Intel ExaScience Lab  Kapeldreef 75 B\u20103001 Leuven Belgium","institution_ids":["https://openalex.org/I99464096"]},{"raw_affiliation_string":"Intel ExaScience Lab, Kapeldreef 75, B-3001 Leuven, Belgium","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5109159644","display_name":"J.\u2010L. Cambier","orcid":null},"institutions":[{"id":"https://openalex.org/I4210089296","display_name":"Edwards Air Force Base","ror":"https://ror.org/0079vgv93","country_code":"US","type":"other","lineage":["https://openalex.org/I1330347796","https://openalex.org/I4210089296","https://openalex.org/I4210089612","https://openalex.org/I4210102105"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"J.\u2010L. Cambier","raw_affiliation_strings":["AFRL/PRSA, Edwards AFB  California 93524 USA","AFRL/PRSA, Edwards AFB, California 93524, USA"],"affiliations":[{"raw_affiliation_string":"AFRL/PRSA, Edwards AFB  California 93524 USA","institution_ids":["https://openalex.org/I4210089296"]},{"raw_affiliation_string":"AFRL/PRSA, Edwards AFB, California 93524, USA","institution_ids":["https://openalex.org/I4210089296"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5041579136"],"corresponding_institution_ids":["https://openalex.org/I4210116480","https://openalex.org/I99464096"],"apc_list":{"value":4740,"currency":"USD","value_usd":4740},"apc_paid":null,"fwci":0.613,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.71509668,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":"27","issue":"3","first_page":"581","last_page":"593"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10346","display_name":"Magnetic confinement fusion research","score":0.9950000047683716,"subfield":{"id":"https://openalex.org/subfields/3106","display_name":"Nuclear and High Energy Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.8976446390151978},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.8359737396240234},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7843754887580872},{"id":"https://openalex.org/keywords/thread","display_name":"Thread (computing)","score":0.7381873726844788},{"id":"https://openalex.org/keywords/cuda","display_name":"CUDA","score":0.6569817662239075},{"id":"https://openalex.org/keywords/compiler","display_name":"Compiler","score":0.6499764323234558},{"id":"https://openalex.org/keywords/coprocessor","display_name":"Coprocessor","score":0.6022130250930786},{"id":"https://openalex.org/keywords/multi-core-processor","display_name":"Multi-core processor","score":0.4733175039291382},{"id":"https://openalex.org/keywords/xeon-phi","display_name":"Xeon Phi","score":0.457516610622406},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.4434537887573242},{"id":"https://openalex.org/keywords/vectorization","display_name":"Vectorization (mathematics)","score":0.4154356122016907},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.15077131986618042},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.12538611888885498}],"concepts":[{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.8976446390151978},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.8359737396240234},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7843754887580872},{"id":"https://openalex.org/C138101251","wikidata":"https://www.wikidata.org/wiki/Q213092","display_name":"Thread (computing)","level":2,"score":0.7381873726844788},{"id":"https://openalex.org/C2778119891","wikidata":"https://www.wikidata.org/wiki/Q477690","display_name":"CUDA","level":2,"score":0.6569817662239075},{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.6499764323234558},{"id":"https://openalex.org/C86111242","wikidata":"https://www.wikidata.org/wiki/Q859595","display_name":"Coprocessor","level":2,"score":0.6022130250930786},{"id":"https://openalex.org/C78766204","wikidata":"https://www.wikidata.org/wiki/Q555032","display_name":"Multi-core processor","level":2,"score":0.4733175039291382},{"id":"https://openalex.org/C96972482","wikidata":"https://www.wikidata.org/wiki/Q1049168","display_name":"Xeon Phi","level":2,"score":0.457516610622406},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.4434537887573242},{"id":"https://openalex.org/C41681595","wikidata":"https://www.wikidata.org/wiki/Q7917855","display_name":"Vectorization (mathematics)","level":2,"score":0.4154356122016907},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.15077131986618042},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.12538611888885498}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1002/cpe.3248","is_oa":false,"landing_page_url":"https://doi.org/10.1002/cpe.3248","pdf_url":null,"source":{"id":"https://openalex.org/S11065456","display_name":"Concurrency and Computation Practice and Experience","issn_l":"1532-0626","issn":["1532-0626","1532-0634"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320595","host_organization_name":"Wiley","host_organization_lineage":["https://openalex.org/P4310320595"],"host_organization_lineage_names":["Wiley"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Concurrency and Computation: Practice and Experience","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W50182133","https://openalex.org/W1532125006","https://openalex.org/W1539676025","https://openalex.org/W1558008742","https://openalex.org/W1609496979","https://openalex.org/W1619439060","https://openalex.org/W1629852946","https://openalex.org/W1672666614","https://openalex.org/W1988888548","https://openalex.org/W2041978216","https://openalex.org/W2046020177","https://openalex.org/W2060096673","https://openalex.org/W2061296035","https://openalex.org/W2079227192","https://openalex.org/W2079777558","https://openalex.org/W2105901579","https://openalex.org/W2108694808","https://openalex.org/W2138782497","https://openalex.org/W2147743629","https://openalex.org/W2165805492","https://openalex.org/W2166298995","https://openalex.org/W2264044109","https://openalex.org/W3048087219","https://openalex.org/W3094616800","https://openalex.org/W3103487675","https://openalex.org/W4285719527"],"related_works":["https://openalex.org/W1908180445","https://openalex.org/W2213533160","https://openalex.org/W2035419609","https://openalex.org/W3203561460","https://openalex.org/W4252450863","https://openalex.org/W2467043670","https://openalex.org/W187726678","https://openalex.org/W2051078434","https://openalex.org/W4294342484","https://openalex.org/W2022867993"],"abstract_inverted_index":{"Summary":[0],"We":[1,36,79],"present":[2],"initial":[3,180],"comparison":[4],"performance":[5],"results":[6,93],"for":[7,41,75,104,127,141,153,164,171],"Intel":[8],"many":[9],"integrated":[10],"core":[11],"(MIC),":[12],"Sandy":[13],"Bridge":[14],"(SB),":[15],"and":[16,46,63,87,108,157,173],"graphical":[17],"processing":[18],"unit":[19],"(GPU).":[20],"A":[21],"1D":[22],"explicit":[23],"electrostatic":[24],"particle\u2010in\u2010cell":[25],"code":[26,73,187],"is":[27,51,68,98,148,195],"used":[28],"to":[29,84,134,182,188],"simulate":[30],"a":[31,56,105,154,205],"two\u2010stream":[32],"instability":[33],"in":[34],"plasma.":[35],"compare":[37],"the":[38,66,72,81,96,115,128,139,146,177,186,189,202],"computation":[39],"times":[40,100,126,136,151],"various":[42,85],"number":[43,59,116,198],"of":[44,60,117,161,185,199],"cores/threads":[45],"compiler":[47,90],"options.":[48,91],"The":[49,124,167],"parallelization":[50],"implemented":[52],"via":[53],"OpenMP":[54],"with":[55,70,77,120,144],"maximum":[57],"thread":[58,156],"128.":[61],"Parallelization":[62],"vectorization":[64,121],"on":[65],"GPU":[67,129,147,174],"achieved":[69],"modifying":[71],"syntax":[74],"compatibility":[76],"CUDA.":[78],"assess":[80],"speedup":[82,203],"due":[83],"auto\u2010vectorization":[86],"optimization":[88],"level":[89],"Our":[92],"show":[94],"that":[95,193],"MIC":[97,172,190],"several":[99],"slower":[101],"than":[102,112,138],"SB":[103,113],"single":[106,155],"thread,":[107],"it":[109],"becomes":[110],"faster":[111,137,152,163],"when":[114],"cores":[118],"increases":[119],"switched":[122],"on.":[123],"compute":[125],"are":[130,175],"consistently":[131],"about":[132,149,158],"six":[133],"seven":[135],"ones":[140],"MIC.":[142],"Compared":[143],"SB,":[145],"two":[150],"an":[159,196],"order":[160],"magnitude":[162],"128":[165],"threads.":[166],"net":[168],"speedup,":[169],"however,":[170],"almost":[176],"same.":[178],"An":[179],"attempt":[181],"offload":[183],"parts":[184],"coprocessor":[191],"shows":[192],"there":[194],"optimal":[197],"threads":[200],"where":[201],"reaches":[204],"maximum.":[206],"Copyright":[207],"\u00a9":[208],"2014":[209],"John":[210],"Wiley":[211],"&amp;":[212],"Sons,":[213],"Ltd.":[214]},"counts_by_year":[{"year":2020,"cited_by_count":1},{"year":2016,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
