{"id":"https://openalex.org/W2099032432","doi":"https://doi.org/10.1109/ipdps.2009.5161092","title":"Application profiling on Cell-based clusters","display_name":"Application profiling on Cell-based clusters","publication_year":2009,"publication_date":"2009-05-01","ids":{"openalex":"https://openalex.org/W2099032432","doi":"https://doi.org/10.1109/ipdps.2009.5161092","mag":"2099032432"},"language":"en","primary_location":{"id":"doi:10.1109/ipdps.2009.5161092","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ipdps.2009.5161092","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2009 IEEE International Symposium on Parallel &amp; Distributed Processing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5072389428","display_name":"Hikmet Dursun","orcid":null},"institutions":[{"id":"https://openalex.org/I1343871089","display_name":"Los Alamos National Laboratory","ror":"https://ror.org/01e41cf67","country_code":"US","type":"facility","lineage":["https://openalex.org/I1330989302","https://openalex.org/I1343871089","https://openalex.org/I198811213","https://openalex.org/I4210120050"]},{"id":"https://openalex.org/I1174212","display_name":"University of Southern California","ror":"https://ror.org/03taz7m60","country_code":"US","type":"education","lineage":["https://openalex.org/I1174212"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Hikmet Dursun","raw_affiliation_strings":["Collaboratory for Advanced Computing and Simulations, Department of Computer Science, University of Southern California, CA, USA","Performance and Architecture Laboratory (PAL), Computer Science for HPC (CCS-1), Los Alamos National Laboratory, NM, USA"],"affiliations":[{"raw_affiliation_string":"Collaboratory for Advanced Computing and Simulations, Department of Computer Science, University of Southern California, CA, USA","institution_ids":["https://openalex.org/I1174212"]},{"raw_affiliation_string":"Performance and Architecture Laboratory (PAL), Computer Science for HPC (CCS-1), Los Alamos National Laboratory, NM, USA","institution_ids":["https://openalex.org/I1343871089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038062469","display_name":"Kevin Barker","orcid":"https://orcid.org/0000-0003-4947-0559"},"institutions":[{"id":"https://openalex.org/I1343871089","display_name":"Los Alamos National Laboratory","ror":"https://ror.org/01e41cf67","country_code":"US","type":"facility","lineage":["https://openalex.org/I1330989302","https://openalex.org/I1343871089","https://openalex.org/I198811213","https://openalex.org/I4210120050"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Kevin J. Barker","raw_affiliation_strings":["Performance and Architecture Laboratory (PAL), Computer Science for HPC (CCS-1), Los Alamos National Laboratory, NM, USA"],"affiliations":[{"raw_affiliation_string":"Performance and Architecture Laboratory (PAL), Computer Science for HPC (CCS-1), Los Alamos National Laboratory, NM, USA","institution_ids":["https://openalex.org/I1343871089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064935199","display_name":"Darren J. Kerbyson","orcid":null},"institutions":[{"id":"https://openalex.org/I1343871089","display_name":"Los Alamos National Laboratory","ror":"https://ror.org/01e41cf67","country_code":"US","type":"facility","lineage":["https://openalex.org/I1330989302","https://openalex.org/I1343871089","https://openalex.org/I198811213","https://openalex.org/I4210120050"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Darren J. Kerbyson","raw_affiliation_strings":["Performance and Architecture Laboratory (PAL), Computer Science for HPC (CCS-1), Los Alamos National Laboratory, NM, USA"],"affiliations":[{"raw_affiliation_string":"Performance and Architecture Laboratory (PAL), Computer Science for HPC (CCS-1), Los Alamos National Laboratory, NM, USA","institution_ids":["https://openalex.org/I1343871089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5060855642","display_name":"Scott Pakin","orcid":"https://orcid.org/0000-0002-5220-1985"},"institutions":[{"id":"https://openalex.org/I1343871089","display_name":"Los Alamos National Laboratory","ror":"https://ror.org/01e41cf67","country_code":"US","type":"facility","lineage":["https://openalex.org/I1330989302","https://openalex.org/I1343871089","https://openalex.org/I198811213","https://openalex.org/I4210120050"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Scott Pakin","raw_affiliation_strings":["Performance and Architecture Laboratory (PAL), Computer Science for HPC (CCS-1), Los Alamos National Laboratory, NM, USA"],"affiliations":[{"raw_affiliation_string":"Performance and Architecture Laboratory (PAL), Computer Science for HPC (CCS-1), Los Alamos National Laboratory, NM, USA","institution_ids":["https://openalex.org/I1343871089"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5072389428"],"corresponding_institution_ids":["https://openalex.org/I1174212","https://openalex.org/I1343871089"],"apc_list":null,"apc_paid":null,"fwci":0.5355,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.67600038,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":"1225","issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10772","display_name":"Distributed systems and fault tolerance","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8566921949386597},{"id":"https://openalex.org/keywords/profiling","display_name":"Profiling (computer programming)","score":0.8281441926956177},{"id":"https://openalex.org/keywords/suite","display_name":"Suite","score":0.721708357334137},{"id":"https://openalex.org/keywords/petascale-computing","display_name":"Petascale computing","score":0.6660453081130981},{"id":"https://openalex.org/keywords/ibm","display_name":"IBM","score":0.6288074851036072},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.5065594911575317},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.48798054456710815},{"id":"https://openalex.org/keywords/supercomputer","display_name":"Supercomputer","score":0.4666927456855774},{"id":"https://openalex.org/keywords/cluster","display_name":"Cluster (spacecraft)","score":0.46553292870521545},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.45335283875465393}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8566921949386597},{"id":"https://openalex.org/C187191949","wikidata":"https://www.wikidata.org/wiki/Q1138496","display_name":"Profiling (computer programming)","level":2,"score":0.8281441926956177},{"id":"https://openalex.org/C79581498","wikidata":"https://www.wikidata.org/wiki/Q1367530","display_name":"Suite","level":2,"score":0.721708357334137},{"id":"https://openalex.org/C185410017","wikidata":"https://www.wikidata.org/wiki/Q7171778","display_name":"Petascale computing","level":3,"score":0.6660453081130981},{"id":"https://openalex.org/C70388272","wikidata":"https://www.wikidata.org/wiki/Q5968558","display_name":"IBM","level":2,"score":0.6288074851036072},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.5065594911575317},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.48798054456710815},{"id":"https://openalex.org/C83283714","wikidata":"https://www.wikidata.org/wiki/Q121117","display_name":"Supercomputer","level":2,"score":0.4666927456855774},{"id":"https://openalex.org/C164866538","wikidata":"https://www.wikidata.org/wiki/Q367351","display_name":"Cluster (spacecraft)","level":2,"score":0.46553292870521545},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.45335283875465393},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0},{"id":"https://openalex.org/C95457728","wikidata":"https://www.wikidata.org/wiki/Q309","display_name":"History","level":0,"score":0.0},{"id":"https://openalex.org/C171250308","wikidata":"https://www.wikidata.org/wiki/Q11468","display_name":"Nanotechnology","level":1,"score":0.0},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/ipdps.2009.5161092","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ipdps.2009.5161092","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2009 IEEE International Symposium on Parallel &amp; Distributed Processing","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.226.2402","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.226.2402","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.c3.lanl.gov/PAL/publications/papers/Dursun2009%3Aapp-profiling.pdf","raw_type":"text"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.406.9483","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.406.9483","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://cacs.usc.edu/papers/hdursun_LSPP_ID2030.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320306084","display_name":"U.S. Department of Energy","ror":"https://ror.org/01bj3aw27"},{"id":"https://openalex.org/F4320338304","display_name":"Los Alamos National Laboratory","ror":"https://ror.org/01e41cf67"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":18,"referenced_works":["https://openalex.org/W26331760","https://openalex.org/W566145378","https://openalex.org/W1480147318","https://openalex.org/W1567629145","https://openalex.org/W1580800534","https://openalex.org/W2039765803","https://openalex.org/W2051598123","https://openalex.org/W2088943630","https://openalex.org/W2099148634","https://openalex.org/W2134693673","https://openalex.org/W2137963118","https://openalex.org/W2165231728","https://openalex.org/W2165366735","https://openalex.org/W2472793493","https://openalex.org/W3148190289","https://openalex.org/W6628691834","https://openalex.org/W6634863147","https://openalex.org/W6720614728"],"related_works":["https://openalex.org/W2021702679","https://openalex.org/W3038449658","https://openalex.org/W1582746211","https://openalex.org/W2251285835","https://openalex.org/W3129378740","https://openalex.org/W2607572736","https://openalex.org/W2266027327","https://openalex.org/W2278366184","https://openalex.org/W1486544172","https://openalex.org/W4206324154"],"abstract_inverted_index":{"In":[0],"this":[1],"paper,":[2],"we":[3,25],"present":[4],"a":[5,82,88],"methodology":[6],"for":[7],"profiling":[8],"parallel":[9],"applications":[10],"executing":[11],"on":[12,30,81],"the":[13,21,46,65,70,76,99],"IBM":[14],"PowerXCell":[15],"8i":[16],"(commonly":[17],"referred":[18],"to":[19,113],"as":[20,42],"ldquoCellrdquo":[22],"processor).":[23],"Specifically,":[24],"examine":[26],"Cell-centric":[27],"MPI":[28],"programs":[29],"hybrid":[31,85],"clusters":[32],"containing":[33],"multiple":[34],"Opteron":[35],"and":[36,102],"Cell":[37],"processors":[38],"per":[39,59],"node":[40],"such":[41],"those":[43],"used":[44,112],"in":[45],"petascale":[47],"Roadrunner":[48],"system.":[49],"Our":[50,93],"implementation":[51],"incurs":[52],"less":[53],"than":[54],"3.2":[55],"mus":[56],"of":[57,69,78,84,90,95],"overhead":[58],"profile":[60],"call":[61,104],"while":[62],"efficiently":[63],"utilizing":[64],"limited":[66],"local":[67],"store":[68],"Cell's":[71],"SPE":[72],"cores.":[73],"We":[74],"demonstrate":[75],"use":[77],"our":[79],"profiler":[80],"cluster":[83],"nodes":[86],"running":[87],"suite":[89],"scientific":[91],"applications.":[92],"analyses":[94],"inter-SPE":[96],"communication":[97],"(across":[98],"entire":[100],"cluster)":[101],"function":[103],"patterns":[105],"provide":[106],"valuable":[107],"information":[108],"that":[109],"can":[110],"be":[111],"optimize":[114],"application":[115],"performance.":[116]},"counts_by_year":[{"year":2016,"cited_by_count":1}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
