{"id":"https://openalex.org/W4233727745","doi":"https://doi.org/10.1177/1094342009359258","title":"The Importance of Non-Data-Communication Overheads in MPI","display_name":"The Importance of Non-Data-Communication Overheads in MPI","publication_year":2010,"publication_date":"2010-02-01","ids":{"openalex":"https://openalex.org/W4233727745","doi":"https://doi.org/10.1177/1094342009359258"},"language":"en","primary_location":{"id":"doi:10.1177/1094342009359258","is_oa":false,"landing_page_url":"https://doi.org/10.1177/1094342009359258","pdf_url":null,"source":{"id":"https://openalex.org/S60606485","display_name":"The International Journal of High Performance Computing Applications","issn_l":"1094-3420","issn":["1094-3420","1741-2846"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320017","host_organization_name":"SAGE Publishing","host_organization_lineage":["https://openalex.org/P4310320017"],"host_organization_lineage_names":["SAGE Publishing"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of High Performance Computing Applications","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5050531633","display_name":"Pavan Balaji","orcid":null},"institutions":[{"id":"https://openalex.org/I1282105669","display_name":"Argonne National Laboratory","ror":"https://ror.org/05gvnxz63","country_code":"US","type":"facility","lineage":["https://openalex.org/I1282105669","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I40347166"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"P. Balaji","raw_affiliation_strings":["MATHEMATICS AND COMPUTER SCIENCE DIVISION, ARGONNE NATIONAL LABORATORY, ARGONNE, IL 60439, USA, [email\u00a0protected]"],"affiliations":[{"raw_affiliation_string":"MATHEMATICS AND COMPUTER SCIENCE DIVISION, ARGONNE NATIONAL LABORATORY, ARGONNE, IL 60439, USA, [email\u00a0protected]","institution_ids":["https://openalex.org/I1282105669"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032472515","display_name":"Anthony Chan","orcid":"https://orcid.org/0000-0002-4574-5685"},"institutions":[{"id":"https://openalex.org/I1282105669","display_name":"Argonne National Laboratory","ror":"https://ror.org/05gvnxz63","country_code":"US","type":"facility","lineage":["https://openalex.org/I1282105669","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I40347166"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"A. Chan","raw_affiliation_strings":["MATHEMATICS AND COMPUTER SCIENCE DIVISION, ARGONNE NATIONAL LABORATORY, ARGONNE, IL 60439, USA,. [email\u00a0protected]"],"affiliations":[{"raw_affiliation_string":"MATHEMATICS AND COMPUTER SCIENCE DIVISION, ARGONNE NATIONAL LABORATORY, ARGONNE, IL 60439, USA,. [email\u00a0protected]","institution_ids":["https://openalex.org/I1282105669"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017241944","display_name":"William Gropp","orcid":"https://orcid.org/0000-0003-2905-3029"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"W. Gropp","raw_affiliation_strings":["DEPARTMENT OF COMPUTER SCIENCE, UNIVERSITY OF ILLINOIS, URBANA, IL 61801, USA, [email\u00a0protected]"],"affiliations":[{"raw_affiliation_string":"DEPARTMENT OF COMPUTER SCIENCE, UNIVERSITY OF ILLINOIS, URBANA, IL 61801, USA, [email\u00a0protected]","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014920685","display_name":"Rajeev Thakur","orcid":"https://orcid.org/0000-0002-5532-3048"},"institutions":[{"id":"https://openalex.org/I1282105669","display_name":"Argonne National Laboratory","ror":"https://ror.org/05gvnxz63","country_code":"US","type":"facility","lineage":["https://openalex.org/I1282105669","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I40347166"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"R. Thakur","raw_affiliation_strings":["MATHEMATICS AND COMPUTER SCIENCE DIVISION, ARGONNE NATIONAL LABORATORY, ARGONNE, IL 60439, USA,[email\u00a0protected]"],"affiliations":[{"raw_affiliation_string":"MATHEMATICS AND COMPUTER SCIENCE DIVISION, ARGONNE NATIONAL LABORATORY, ARGONNE, IL 60439, USA,[email\u00a0protected]","institution_ids":["https://openalex.org/I1282105669"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5111494129","display_name":"Ewing Lusk","orcid":null},"institutions":[{"id":"https://openalex.org/I1282105669","display_name":"Argonne National Laboratory","ror":"https://ror.org/05gvnxz63","country_code":"US","type":"facility","lineage":["https://openalex.org/I1282105669","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I40347166"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"E. Lusk","raw_affiliation_strings":["MATHEMATICS AND COMPUTER SCIENCE DIVISION, ARGONNE NATIONAL LABORATORY, ARGONNE, IL 60439, USA,[email\u00a0protected]"],"affiliations":[{"raw_affiliation_string":"MATHEMATICS AND COMPUTER SCIENCE DIVISION, ARGONNE NATIONAL LABORATORY, ARGONNE, IL 60439, USA,[email\u00a0protected]","institution_ids":["https://openalex.org/I1282105669"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5014920685","https://openalex.org/A5017241944","https://openalex.org/A5032472515","https://openalex.org/A5050531633","https://openalex.org/A5111494129"],"corresponding_institution_ids":["https://openalex.org/I1282105669"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.37766214,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"24","issue":"1","first_page":"5","last_page":"15"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10772","display_name":"Distributed systems and fault tolerance","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12326","display_name":"Network Packet Processing and Optimization","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8534855842590332},{"id":"https://openalex.org/keywords/serialization","display_name":"Serialization","score":0.679577112197876},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.6106348633766174},{"id":"https://openalex.org/keywords/message-passing-interface","display_name":"Message Passing Interface","score":0.5717374086380005},{"id":"https://openalex.org/keywords/stack","display_name":"Stack (abstract data type)","score":0.5224629640579224},{"id":"https://openalex.org/keywords/queue","display_name":"Queue","score":0.5023467540740967},{"id":"https://openalex.org/keywords/message-queue","display_name":"Message queue","score":0.4900778532028198},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.4880024492740631},{"id":"https://openalex.org/keywords/massively-parallel","display_name":"Massively parallel","score":0.4771439731121063},{"id":"https://openalex.org/keywords/interface","display_name":"Interface (matter)","score":0.4111071825027466},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.3740115761756897},{"id":"https://openalex.org/keywords/message-passing","display_name":"Message passing","score":0.3634995222091675},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.30996960401535034},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.22682660818099976}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8534855842590332},{"id":"https://openalex.org/C52723943","wikidata":"https://www.wikidata.org/wiki/Q1127410","display_name":"Serialization","level":2,"score":0.679577112197876},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.6106348633766174},{"id":"https://openalex.org/C166782233","wikidata":"https://www.wikidata.org/wiki/Q127879","display_name":"Message Passing Interface","level":3,"score":0.5717374086380005},{"id":"https://openalex.org/C9395851","wikidata":"https://www.wikidata.org/wiki/Q177929","display_name":"Stack (abstract data type)","level":2,"score":0.5224629640579224},{"id":"https://openalex.org/C160403385","wikidata":"https://www.wikidata.org/wiki/Q220543","display_name":"Queue","level":2,"score":0.5023467540740967},{"id":"https://openalex.org/C26324664","wikidata":"https://www.wikidata.org/wiki/Q1065525","display_name":"Message queue","level":2,"score":0.4900778532028198},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.4880024492740631},{"id":"https://openalex.org/C190475519","wikidata":"https://www.wikidata.org/wiki/Q544384","display_name":"Massively parallel","level":2,"score":0.4771439731121063},{"id":"https://openalex.org/C113843644","wikidata":"https://www.wikidata.org/wiki/Q901882","display_name":"Interface (matter)","level":4,"score":0.4111071825027466},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.3740115761756897},{"id":"https://openalex.org/C854659","wikidata":"https://www.wikidata.org/wiki/Q1859284","display_name":"Message passing","level":2,"score":0.3634995222091675},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.30996960401535034},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.22682660818099976},{"id":"https://openalex.org/C129307140","wikidata":"https://www.wikidata.org/wiki/Q6795880","display_name":"Maximum bubble pressure method","level":3,"score":0.0},{"id":"https://openalex.org/C157915830","wikidata":"https://www.wikidata.org/wiki/Q2928001","display_name":"Bubble","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1177/1094342009359258","is_oa":false,"landing_page_url":"https://doi.org/10.1177/1094342009359258","pdf_url":null,"source":{"id":"https://openalex.org/S60606485","display_name":"The International Journal of High Performance Computing Applications","issn_l":"1094-3420","issn":["1094-3420","1741-2846"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320017","host_organization_name":"SAGE Publishing","host_organization_lineage":["https://openalex.org/P4310320017"],"host_organization_lineage_names":["SAGE Publishing"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of High Performance Computing Applications","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.8700000047683716,"id":"https://metadata.un.org/sdg/7","display_name":"Affordable and clean energy"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2355322892","https://openalex.org/W2124048060","https://openalex.org/W1902983110","https://openalex.org/W2378910916","https://openalex.org/W4386915331","https://openalex.org/W2116006827","https://openalex.org/W2086666199","https://openalex.org/W1511717675","https://openalex.org/W2361929291","https://openalex.org/W2893723147"],"abstract_inverted_index":{"With":[0],"processor":[1],"speeds":[2],"no":[3],"longer":[4],"doubling":[5],"every":[6],"18\u201424":[7],"months":[8],"owing":[9],"to":[10,25,157],"the":[11,29,44,74,86,108,113,117,130,144,161,167,171,181],"exponential":[12],"increase":[13],"in":[14,103,166,180],"power":[15],"consumption":[16],"and":[17,35,65,138,149],"heat":[18],"dissipation,":[19],"modern":[20],"high-end":[21],"computing":[22],"systems":[23,94],"tend":[24],"rely":[26,37],"less":[27],"on":[28,38,62,92,98,116,196],"performance":[30,41],"of":[31,46,50,83,127,136,160,170],"single":[32],"processing":[33,52,67],"units":[34],"instead":[36],"achieving":[39],"high":[40],"by":[42],"using":[43],"parallelism":[45],"a":[47,60,193],"massive":[48,198],"number":[49],"low-frequency/low-power":[51],"cores.":[53],"Using":[54],"such":[55,72,197],"low-frequency":[56],"cores,":[57],"however,":[58],"puts":[59],"premium":[61],"end-host":[63],"pre-":[64],"post-communication":[66],"required":[68],"within":[69,85,112,143],"communication":[70,87],"stacks,":[71],"as":[73],"Message":[75],"Passing":[76],"Interface":[77],"(MPI)":[78],"implementation.":[79],"Similarly,":[80],"small":[81],"amounts":[82],"serialization":[84],"stack":[88,132],"that":[89,154],"were":[90,185],"acceptable":[91],"small/medium":[93],"can":[95,191],"be":[96],"brutal":[97],"massively":[99],"parallel":[100],"systems.":[101,199],"Thus,":[102],"this":[104],"paper,":[105],"we":[106,123],"study":[107],"different":[109],"non-data-communication":[110],"overheads":[111,179],"MPI":[114,131,145,182],"implementation":[115],"IBM":[118],"Blue":[119,163],"Gene/P":[120,164],"system.":[121],"Specifically,":[122],"analyze":[124],"various":[125,150],"aspects":[126],"MPI,":[128],"including":[129],"overhead":[133,135],"itself,":[134],"allocating":[137],"queueing":[139],"requests,":[140],"queue":[141],"searches":[142],"stack,":[146,183],"multi-request":[147],"operations,":[148],"others.":[151],"Our":[152],"experiments,":[153],"scale":[155],"up":[156],"131,072":[158],"cores":[159],"largest":[162],"system":[165,173],"world":[168],"(80%":[169],"total":[172],"size),":[174],"reveal":[175],"several":[176],"insights":[177],"into":[178],"which":[184],"not":[186],"previously":[187],"considered":[188],"significant,":[189],"but":[190],"have":[192],"substantial":[194],"impact":[195]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
