{"id":"https://openalex.org/W4252470283","doi":"https://doi.org/10.1109/ipdps.2006.1639595","title":"Conjugate gradient sparse solvers: performance-power characteristics","display_name":"Conjugate gradient sparse solvers: performance-power characteristics","publication_year":2006,"publication_date":"2006-01-01","ids":{"openalex":"https://openalex.org/W4252470283","doi":"https://doi.org/10.1109/ipdps.2006.1639595"},"language":"en","primary_location":{"id":"doi:10.1109/ipdps.2006.1639595","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ipdps.2006.1639595","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings 20th IEEE International Parallel &amp; Distributed Processing Symposium","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5113655168","display_name":"Konrad Malkowski","orcid":null},"institutions":[{"id":"https://openalex.org/I130769515","display_name":"Pennsylvania State University","ror":"https://ror.org/04p491231","country_code":"US","type":"education","lineage":["https://openalex.org/I130769515"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"K. Malkowski","raw_affiliation_strings":["Department of Computer Science and Engineering, Pennsylvania State University, University Park, PA, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Pennsylvania State University, University Park, PA, USA","institution_ids":["https://openalex.org/I130769515"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008180707","display_name":"Ingyu Lee","orcid":"https://orcid.org/0000-0002-9838-6428"},"institutions":[{"id":"https://openalex.org/I130769515","display_name":"Pennsylvania State University","ror":"https://ror.org/04p491231","country_code":"US","type":"education","lineage":["https://openalex.org/I130769515"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ingyu Lee","raw_affiliation_strings":["Department of Computer Science and Engineering, Pennsylvania State University, University Park, PA, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Pennsylvania State University, University Park, PA, USA","institution_ids":["https://openalex.org/I130769515"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102868534","display_name":"Padma Raghavan","orcid":"https://orcid.org/0009-0002-6785-2112"},"institutions":[{"id":"https://openalex.org/I130769515","display_name":"Pennsylvania State University","ror":"https://ror.org/04p491231","country_code":"US","type":"education","lineage":["https://openalex.org/I130769515"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"P. Raghavan","raw_affiliation_strings":["Department of Computer Science and Engineering, Pennsylvania State University, University Park, PA, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Pennsylvania State University, University Park, PA, USA","institution_ids":["https://openalex.org/I130769515"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5110890725","display_name":"M.J. Irwin","orcid":null},"institutions":[{"id":"https://openalex.org/I130769515","display_name":"Pennsylvania State University","ror":"https://ror.org/04p491231","country_code":"US","type":"education","lineage":["https://openalex.org/I130769515"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"M.J. Irwin","raw_affiliation_strings":["Department of Computer Science and Engineering, Pennsylvania State University, University Park, PA, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Pennsylvania State University, University Park, PA, USA","institution_ids":["https://openalex.org/I130769515"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5113655168"],"corresponding_institution_ids":["https://openalex.org/I130769515"],"apc_list":null,"apc_paid":null,"fwci":1.1283,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.81455286,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":"12","issue":null,"first_page":"8 pp.","last_page":"8 pp."},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.996399998664856,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12808","display_name":"Ferroelectric and Negative Capacitance Devices","score":0.9955000281333923,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.815201997756958},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.770655632019043},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.7486937046051025},{"id":"https://openalex.org/keywords/power","display_name":"Power (physics)","score":0.5774357914924622},{"id":"https://openalex.org/keywords/conjugate-gradient-method","display_name":"Conjugate gradient method","score":0.5401678085327148},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5194346904754639},{"id":"https://openalex.org/keywords/frequency-scaling","display_name":"Frequency scaling","score":0.5074967741966248},{"id":"https://openalex.org/keywords/energy","display_name":"Energy (signal processing)","score":0.48302826285362244},{"id":"https://openalex.org/keywords/solver","display_name":"Solver","score":0.44835951924324036},{"id":"https://openalex.org/keywords/sparse-matrix","display_name":"Sparse matrix","score":0.4451194107532501},{"id":"https://openalex.org/keywords/cache","display_name":"Cache","score":0.4447018504142761},{"id":"https://openalex.org/keywords/computer-engineering","display_name":"Computer engineering","score":0.3596733510494232},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.34468770027160645},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.23232170939445496}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.815201997756958},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.770655632019043},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.7486937046051025},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.5774357914924622},{"id":"https://openalex.org/C81184566","wikidata":"https://www.wikidata.org/wiki/Q1191895","display_name":"Conjugate gradient method","level":2,"score":0.5401678085327148},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5194346904754639},{"id":"https://openalex.org/C157742956","wikidata":"https://www.wikidata.org/wiki/Q3237776","display_name":"Frequency scaling","level":3,"score":0.5074967741966248},{"id":"https://openalex.org/C186370098","wikidata":"https://www.wikidata.org/wiki/Q442787","display_name":"Energy (signal processing)","level":2,"score":0.48302826285362244},{"id":"https://openalex.org/C2778770139","wikidata":"https://www.wikidata.org/wiki/Q1966904","display_name":"Solver","level":2,"score":0.44835951924324036},{"id":"https://openalex.org/C56372850","wikidata":"https://www.wikidata.org/wiki/Q1050404","display_name":"Sparse matrix","level":3,"score":0.4451194107532501},{"id":"https://openalex.org/C115537543","wikidata":"https://www.wikidata.org/wiki/Q165596","display_name":"Cache","level":2,"score":0.4447018504142761},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.3596733510494232},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.34468770027160645},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.23232170939445496},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ipdps.2006.1639595","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ipdps.2006.1639595","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings 20th IEEE International Parallel &amp; Distributed Processing Symposium","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/7","display_name":"Affordable and clean energy","score":0.9100000262260437}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":20,"referenced_works":["https://openalex.org/W826415870","https://openalex.org/W1575701986","https://openalex.org/W1609496979","https://openalex.org/W1624897526","https://openalex.org/W1981885118","https://openalex.org/W1987393840","https://openalex.org/W2095957868","https://openalex.org/W2104225326","https://openalex.org/W2116334158","https://openalex.org/W2137541800","https://openalex.org/W2140731293","https://openalex.org/W2143011780","https://openalex.org/W2166122567","https://openalex.org/W2169046973","https://openalex.org/W3140903683","https://openalex.org/W4237281620","https://openalex.org/W4247641071","https://openalex.org/W6681456407","https://openalex.org/W6684183497","https://openalex.org/W6792941224"],"related_works":["https://openalex.org/W1967088250","https://openalex.org/W2034060070","https://openalex.org/W2054730497","https://openalex.org/W4229957265","https://openalex.org/W2544771389","https://openalex.org/W2386899346","https://openalex.org/W3082608044","https://openalex.org/W2375597358","https://openalex.org/W2369649360","https://openalex.org/W309072591"],"abstract_inverted_index":{"We":[0,21,45,67,96,110,166],"characterize":[1],"the":[2,8,37,43,91,153,161,172,192],"performance":[3,56,94,126,180],"and":[4,27,32,80,106,115,135,148,171,181,191],"power":[5,50,60,79,117,134,145,182],"attributes":[6],"of":[7,39,42,62,93,119,194,214],"conjugate":[9],"gradient":[10],"(CG)":[11],"sparse":[12],"solver":[13],"which":[14],"is":[15,141],"widely":[16],"used":[17,122],"in":[18,133,152],"scientific":[19,216],"applications.":[20,217],"use":[22,168],"cycle-accurate":[23],"simulations":[24],"with":[25,123,131,210],"SimpleScalar":[26],"Wattch,":[28],"on":[29,188],"a":[30,40],"processor":[31],"memory":[33,101,105],"architecture":[34],"similar":[35],"to":[36,160,177],"configuration":[38,155],"node":[41],"BlueGene/L.":[44],"first":[46],"demonstrate":[47,111,178],"that":[48,70,112,179,200],"substantial":[49],"savings":[51,82],"can":[52,64,76,127,184,203],"be":[53,65,77,128],"obtained":[54],"without":[55],"degradation":[57],"if":[58,71,205],"low":[59,116],"modes":[61,118],"caches":[63,120],"utilized.":[66],"next":[68],"show":[69],"Dynamic":[72],"Voltage":[73],"Scaling":[74],"(DVS)":[75],"used,":[78],"energy":[81,149],"are":[83,87,121,208],"possible,":[84],"but":[85],"these":[86,124],"realized":[88],"only":[89],"at":[90,156,163],"expense":[92],"penalties.":[95],"then":[97],"consider":[98],"two":[99],"simple":[100],"subsystem":[102],"optimizations,":[103,125],"namely":[104],"level-2":[107],"cache":[108],"prefetching.":[109],"when":[113],"DVS":[114],"improved":[129],"significantly":[130,186],"reductions":[132],"energy.":[136],"For":[137],"example,":[138],"execution":[139],"time":[140],"reduced":[142],"by":[143,146,150],"23%,":[144],"55%":[147],"65%":[151],"final":[154],"500":[157],"MHz":[158],"relative":[159],"original":[162],"1":[164],"GHz.":[165],"also":[167],"our":[169],"codes":[170,211],"CG":[173],"NAS":[174],"benchmark":[175],"code":[176,195],"profiles":[183],"vary":[185],"depending":[187],"matrix":[189],"properties":[190],"level":[193],"tuning.":[196],"These":[197],"results":[198],"indicate":[199],"architectural":[201],"evaluations":[202],"benefit":[204],"traditional":[206],"benchmarks":[207],"augmented":[209],"more":[212],"representative":[213],"tuned":[215]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2016,"cited_by_count":1},{"year":2013,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
