{"id":"https://openalex.org/W2071055701","doi":"https://doi.org/10.1145/2304576.2304583","title":"One stone two birds","display_name":"One stone two birds","publication_year":2012,"publication_date":"2012-06-25","ids":{"openalex":"https://openalex.org/W2071055701","doi":"https://doi.org/10.1145/2304576.2304583","mag":"2071055701"},"language":"en","primary_location":{"id":"doi:10.1145/2304576.2304583","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2304576.2304583","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 26th ACM international conference on Supercomputing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5053834265","display_name":"Ziyu Guo","orcid":"https://orcid.org/0000-0002-4792-1398"},"institutions":[{"id":"https://openalex.org/I4210087596","display_name":"Qualcomm (United States)","ror":"https://ror.org/002zrf773","country_code":"US","type":"company","lineage":["https://openalex.org/I4210087596"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Ziyu Guo","raw_affiliation_strings":["Qualcomm CDMA Technologies, San Diego, CA, USA","Qualcomm CDMA Technologies, San Diego, CA, USA#TAB#"],"affiliations":[{"raw_affiliation_string":"Qualcomm CDMA Technologies, San Diego, CA, USA","institution_ids":["https://openalex.org/I4210087596"]},{"raw_affiliation_string":"Qualcomm CDMA Technologies, San Diego, CA, USA#TAB#","institution_ids":["https://openalex.org/I4210087596"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059368105","display_name":"Bo Wu","orcid":"https://orcid.org/0000-0001-6658-6452"},"institutions":[{"id":"https://openalex.org/I16285277","display_name":"William & Mary","ror":"https://ror.org/03hsf0573","country_code":"US","type":"education","lineage":["https://openalex.org/I16285277"]},{"id":"https://openalex.org/I267592682","display_name":"Williams (United States)","ror":"https://ror.org/007zhvp17","country_code":"US","type":"company","lineage":["https://openalex.org/I267592682"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Bo Wu","raw_affiliation_strings":["College of William and Mary, Williamsburg, VA, USA","[College of William & Mary, Williamsburg, VA, USA]"],"affiliations":[{"raw_affiliation_string":"College of William and Mary, Williamsburg, VA, USA","institution_ids":["https://openalex.org/I16285277","https://openalex.org/I267592682"]},{"raw_affiliation_string":"[College of William & Mary, Williamsburg, VA, USA]","institution_ids":["https://openalex.org/I16285277"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100624451","display_name":"Xipeng Shen","orcid":"https://orcid.org/0000-0003-3599-8010"},"institutions":[{"id":"https://openalex.org/I16285277","display_name":"William & Mary","ror":"https://ror.org/03hsf0573","country_code":"US","type":"education","lineage":["https://openalex.org/I16285277"]},{"id":"https://openalex.org/I267592682","display_name":"Williams (United States)","ror":"https://ror.org/007zhvp17","country_code":"US","type":"company","lineage":["https://openalex.org/I267592682"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xipeng Shen","raw_affiliation_strings":["College of William and Mary, Williamsburg, VA, USA","[College of William & Mary, Williamsburg, VA, USA]"],"affiliations":[{"raw_affiliation_string":"College of William and Mary, Williamsburg, VA, USA","institution_ids":["https://openalex.org/I16285277","https://openalex.org/I267592682"]},{"raw_affiliation_string":"[College of William & Mary, Williamsburg, VA, USA]","institution_ids":["https://openalex.org/I16285277"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5053834265"],"corresponding_institution_ids":["https://openalex.org/I4210087596"],"apc_list":null,"apc_paid":null,"fwci":0.2901,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.57551059,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"25","last_page":"36"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10829","display_name":"Interconnection Networks and Systems","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10904","display_name":"Embedded Systems Design Techniques","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8561913371086121},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.7741910219192505},{"id":"https://openalex.org/keywords/thread","display_name":"Thread (computing)","score":0.6951860785484314},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.6533777117729187},{"id":"https://openalex.org/keywords/inefficiency","display_name":"Inefficiency","score":0.5799069404602051},{"id":"https://openalex.org/keywords/multi-core-processor","display_name":"Multi-core processor","score":0.5245450139045715},{"id":"https://openalex.org/keywords/spmd","display_name":"SPMD","score":0.43957608938217163},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.4281269311904907},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.3359590768814087},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.27793365716934204},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.22124141454696655}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8561913371086121},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.7741910219192505},{"id":"https://openalex.org/C138101251","wikidata":"https://www.wikidata.org/wiki/Q213092","display_name":"Thread (computing)","level":2,"score":0.6951860785484314},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.6533777117729187},{"id":"https://openalex.org/C2778869765","wikidata":"https://www.wikidata.org/wiki/Q6028363","display_name":"Inefficiency","level":2,"score":0.5799069404602051},{"id":"https://openalex.org/C78766204","wikidata":"https://www.wikidata.org/wiki/Q555032","display_name":"Multi-core processor","level":2,"score":0.5245450139045715},{"id":"https://openalex.org/C7042729","wikidata":"https://www.wikidata.org/wiki/Q2289219","display_name":"SPMD","level":2,"score":0.43957608938217163},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.4281269311904907},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.3359590768814087},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.27793365716934204},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.22124141454696655},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C175444787","wikidata":"https://www.wikidata.org/wiki/Q39072","display_name":"Microeconomics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/2304576.2304583","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2304576.2304583","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 26th ACM international conference on Supercomputing","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W108745714","https://openalex.org/W1191470825","https://openalex.org/W1502558230","https://openalex.org/W1843198456","https://openalex.org/W1992851788","https://openalex.org/W2013247896","https://openalex.org/W2055813380","https://openalex.org/W2065392434","https://openalex.org/W2080592089","https://openalex.org/W2081829536","https://openalex.org/W2083056254","https://openalex.org/W2087725506","https://openalex.org/W2089482246","https://openalex.org/W2119010809","https://openalex.org/W2124556751","https://openalex.org/W2128329055","https://openalex.org/W2129232868","https://openalex.org/W2140375692","https://openalex.org/W2145866640","https://openalex.org/W2150476673","https://openalex.org/W2156831150","https://openalex.org/W2160786443","https://openalex.org/W2169880332","https://openalex.org/W2170634604","https://openalex.org/W2507749557","https://openalex.org/W7074239008"],"related_works":["https://openalex.org/W1606512765","https://openalex.org/W2113326345","https://openalex.org/W2058965144","https://openalex.org/W183653846","https://openalex.org/W1520729804","https://openalex.org/W2164382479","https://openalex.org/W2514606205","https://openalex.org/W160207554","https://openalex.org/W2059556329","https://openalex.org/W3012895752"],"abstract_inverted_index":{"As":[0],"an":[1,95],"approach":[2],"to":[3,87],"promoting":[4],"whole-system":[5],"synergy":[6],"on":[7,31,76],"a":[8,68,81,88,102,112,137],"heterogeneous":[9],"computing":[10],"system,":[11],"compilation":[12],"of":[13,35,63,139],"fine-grained":[14,113],"SPMD-threaded":[15],"code(e.g.,":[16],"GPU":[17],"CUDA":[18],"code)":[19],"for":[20,99,107,115],"multicore":[21],"CPU":[22],"has":[23],"drawn":[24],"some":[25],"recent":[26],"attentions.":[27],"This":[28],"paper":[29],"concentrates":[30],"two":[32],"important":[33],"sources":[34],"inefficiency":[36,64],"that":[37,60,77,122],"limit":[38],"existing":[39],"translators.":[40],"The":[41],"first":[42],"is":[43,49,126],"overly":[44],"strong":[45],"synchronizations;":[46],"the":[47,71,123],"second":[48],"thread-level":[50,82,116],"partially":[51],"redundant":[52],"computations.":[53],"In":[54],"this":[55],"paper,":[56],"we":[57,79],"point":[58],"out":[59],"both":[61,130],"kinds":[62],"essentially":[65],"come":[66],"from":[67],"single":[69],"reason:":[70],"non-uniformity":[72],"among":[73],"threads.":[74],"Based":[75],"observation,":[78],"present":[80],"dependence":[83],"analysis,":[84],"which":[85],"leads":[86],"code":[89,108],"generator":[90],"with":[91],"three":[92],"novel":[93],"features:":[94],"instance-level":[96],"instruction":[97],"scheduler":[98],"synchronization":[100],"relaxation,":[101],"graph":[103],"pattern":[104],"recognition":[105],"scheme":[106],"shape":[109],"optimization,":[110],"and":[111],"analysis":[114],"partial":[117],"redundancy":[118],"removal.":[119],"Experiments":[120],"show":[121],"unified":[124],"solution":[125],"effective":[127],"in":[128],"resolving":[129],"inefficiencies,":[131],"yielding":[132],"speedup":[133],"as":[134,136],"much":[135],"factor":[138],"14.":[140]},"counts_by_year":[{"year":2016,"cited_by_count":1},{"year":2014,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
