{"id":"https://openalex.org/W3136698971","doi":"https://doi.org/10.1109/pact.2013.6618826","title":"Generating efficient data movement code for heterogeneous architectures with distributed-memory","display_name":"Generating efficient data movement code for heterogeneous architectures with distributed-memory","publication_year":2013,"publication_date":"2013-10-01","ids":{"openalex":"https://openalex.org/W3136698971","doi":"https://doi.org/10.1109/pact.2013.6618826","mag":"3136698971"},"language":"en","primary_location":{"id":"doi:10.1109/pact.2013.6618826","is_oa":false,"landing_page_url":"https://doi.org/10.1109/pact.2013.6618826","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 22nd International Conference on Parallel Architectures and Compilation Techniques","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5051375902","display_name":"Lei Fang","orcid":"https://orcid.org/0000-0002-4966-2836"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Lei Fang","raw_affiliation_strings":["Department of ISEE, Zhejiang University, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Department of ISEE, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047351206","display_name":"Peng Liu","orcid":"https://orcid.org/0000-0001-9107-6673"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Peng Liu","raw_affiliation_strings":["Department of ISEE, Zhejiang University, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Department of ISEE, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028888316","display_name":"Qi Hu","orcid":"https://orcid.org/0000-0002-7876-2705"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qi Hu","raw_affiliation_strings":["Department of ISEE, Zhejiang University, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Department of ISEE, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078079786","display_name":"Michael Huang","orcid":"https://orcid.org/0000-0001-9799-2920"},"institutions":[{"id":"https://openalex.org/I5388228","display_name":"University of Rochester","ror":"https://ror.org/022kthw22","country_code":"US","type":"education","lineage":["https://openalex.org/I5388228"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Michael C. Huang","raw_affiliation_strings":["Department of ECE, University of Rochester, Rochester, NY, USA"],"affiliations":[{"raw_affiliation_string":"Department of ECE, University of Rochester, Rochester, NY, USA","institution_ids":["https://openalex.org/I5388228"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5020058637","display_name":"Guofan Jiang","orcid":null},"institutions":[{"id":"https://openalex.org/I4210126794","display_name":"IBM Research (China)","ror":"https://ror.org/02yg1pf55","country_code":"CN","type":"company","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210114115","https://openalex.org/I4210126794"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guofan Jiang","raw_affiliation_strings":["IBM China Systems and Technology Laboratory, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"IBM China Systems and Technology Laboratory, Shanghai, China","institution_ids":["https://openalex.org/I4210126794"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5051375902"],"corresponding_institution_ids":["https://openalex.org/I76130692"],"apc_list":null,"apc_paid":null,"fwci":1.5761,"has_fulltext":false,"cited_by_count":8,"citation_normalized_percentile":{"value":0.84796,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"375","last_page":"386"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11424","display_name":"Security and Verification in Computing","score":0.9958999752998352,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.891538143157959},{"id":"https://openalex.org/keywords/directory","display_name":"Directory","score":0.7739791870117188},{"id":"https://openalex.org/keywords/cache-coherence","display_name":"Cache coherence","score":0.7618571519851685},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.7096282839775085},{"id":"https://openalex.org/keywords/cache","display_name":"Cache","score":0.5882542729377747},{"id":"https://openalex.org/keywords/mesi-protocol","display_name":"MESI protocol","score":0.5779197216033936},{"id":"https://openalex.org/keywords/metadata","display_name":"Metadata","score":0.5426284670829773},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.5366871356964111},{"id":"https://openalex.org/keywords/compiler","display_name":"Compiler","score":0.5339651703834534},{"id":"https://openalex.org/keywords/coherence","display_name":"Coherence (philosophical gambling strategy)","score":0.41988605260849},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.34401118755340576},{"id":"https://openalex.org/keywords/cpu-cache","display_name":"CPU cache","score":0.3305201530456543},{"id":"https://openalex.org/keywords/cache-algorithms","display_name":"Cache algorithms","score":0.27018433809280396}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.891538143157959},{"id":"https://openalex.org/C2777683733","wikidata":"https://www.wikidata.org/wiki/Q201456","display_name":"Directory","level":2,"score":0.7739791870117188},{"id":"https://openalex.org/C141917322","wikidata":"https://www.wikidata.org/wiki/Q1025017","display_name":"Cache coherence","level":5,"score":0.7618571519851685},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.7096282839775085},{"id":"https://openalex.org/C115537543","wikidata":"https://www.wikidata.org/wiki/Q165596","display_name":"Cache","level":2,"score":0.5882542729377747},{"id":"https://openalex.org/C120936851","wikidata":"https://www.wikidata.org/wiki/Q1408065","display_name":"MESI protocol","level":5,"score":0.5779197216033936},{"id":"https://openalex.org/C93518851","wikidata":"https://www.wikidata.org/wiki/Q180160","display_name":"Metadata","level":2,"score":0.5426284670829773},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.5366871356964111},{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.5339651703834534},{"id":"https://openalex.org/C2781181686","wikidata":"https://www.wikidata.org/wiki/Q4226068","display_name":"Coherence (philosophical gambling strategy)","level":2,"score":0.41988605260849},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.34401118755340576},{"id":"https://openalex.org/C189783530","wikidata":"https://www.wikidata.org/wiki/Q352090","display_name":"CPU cache","level":3,"score":0.3305201530456543},{"id":"https://openalex.org/C38556500","wikidata":"https://www.wikidata.org/wiki/Q13404475","display_name":"Cache algorithms","level":4,"score":0.27018433809280396},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/pact.2013.6618826","is_oa":false,"landing_page_url":"https://doi.org/10.1109/pact.2013.6618826","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 22nd International Conference on Parallel Architectures and Compilation Techniques","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":47,"referenced_works":["https://openalex.org/W1571022506","https://openalex.org/W1598250351","https://openalex.org/W1769402780","https://openalex.org/W1844399225","https://openalex.org/W1969243435","https://openalex.org/W1985386844","https://openalex.org/W1997319712","https://openalex.org/W2016521571","https://openalex.org/W2032094184","https://openalex.org/W2043340768","https://openalex.org/W2046046256","https://openalex.org/W2046996113","https://openalex.org/W2083963764","https://openalex.org/W2097169285","https://openalex.org/W2097558053","https://openalex.org/W2100621037","https://openalex.org/W2102727118","https://openalex.org/W2116751788","https://openalex.org/W2120393760","https://openalex.org/W2132988218","https://openalex.org/W2136466435","https://openalex.org/W2137196255","https://openalex.org/W2139397536","https://openalex.org/W2140847726","https://openalex.org/W2143443573","https://openalex.org/W2145021036","https://openalex.org/W2151032144","https://openalex.org/W2154720270","https://openalex.org/W2157860533","https://openalex.org/W2160048271","https://openalex.org/W2166034599","https://openalex.org/W2169875292","https://openalex.org/W2171419639","https://openalex.org/W2545500460","https://openalex.org/W3140903683","https://openalex.org/W4236302577","https://openalex.org/W4237101508","https://openalex.org/W4238549726","https://openalex.org/W4243266883","https://openalex.org/W4243577185","https://openalex.org/W6635629227","https://openalex.org/W6674660205","https://openalex.org/W6679908912","https://openalex.org/W6680569787","https://openalex.org/W6728936925","https://openalex.org/W6792941224","https://openalex.org/W6820157634"],"related_works":["https://openalex.org/W4285204597","https://openalex.org/W2290195868","https://openalex.org/W3193874149","https://openalex.org/W2139534474","https://openalex.org/W2584505417","https://openalex.org/W2013212244","https://openalex.org/W2002047509","https://openalex.org/W2352722396","https://openalex.org/W2107914397","https://openalex.org/W3026856133"],"abstract_inverted_index":{"Mainstream":[0],"chip":[1],"multiprocessors":[2,50],"already":[3],"include":[4],"a":[5,53,78,142,149,153,159,175,200,205],"significant":[6,160],"number":[7,144],"of":[8,30,69,91,107,123,138,145,162,178,227,249,264,269],"cores":[9],"that":[10,93,134,158,208,243],"make":[11],"straightforward":[12],"snooping-based":[13],"cache":[14,38,139],"coherence":[15,41,58,73,108,193],"less":[16],"appropriate.":[17],"Further":[18],"increase":[19,120],"in":[20,232],"core":[21],"count":[22],"will":[23],"almost":[24],"certainly":[25],"require":[26],"more":[27,239,260],"sophisticated":[28],"tracking":[29],"data":[31],"sharing":[32],"to":[33,71,89,119,167,219],"minimize":[34],"unnecessary":[35],"messages":[36],"and":[37,51,114,195,229],"snooping.":[39],"Directory-based":[40],"has":[42],"been":[43],"the":[44,121,135,182,191,233,247],"standard":[45],"solution":[46],"for":[47,56,82,97,127,181],"large-scale":[48],"shared-memory":[49],"is":[52,77,131],"clear":[54],"candidate":[55],"on-chip":[57],"maintenance.":[59],"A":[60],"vanilla":[61],"directory":[62,124,163,250,257],"design,":[63],"however,":[64],"suffers":[65],"from":[66],"inefficient":[67],"use":[68,174],"storage":[70,80,258],"keep":[72],"metadata.":[74],"The":[75],"result":[76],"high":[79],"overhead":[81,87],"larger":[83],"scales.":[84],"Reducing":[85],"this":[86,101],"leads":[88],"saving":[90],"resources":[92],"can":[94,172,196,255],"be":[95,197],"redeployed":[96],"other":[98],"purposes.":[99],"In":[100],"paper,":[102],"we":[103],"exploit":[104,148],"familiar":[105],"characteristics":[106,194],"metadata,":[109],"but":[110,155],"with":[111,152,266],"novel":[112],"angles":[113],"propose":[115,204],"two":[116],"practical":[117],"techniques":[118,245],"expressiveness":[122,248],"entries,":[125,251],"particularly":[126],"chip-multiprocessors.":[128],"First,":[129],"it":[130,224],"well":[132],"known":[133],"vast":[136],"majority":[137],"lines":[140],"have":[141],"small":[143],"sharers.":[146],"We":[147,171,203,241],"related":[150],"fact":[151],"subtle":[154],"important":[156],"difference:":[157],"portion":[161],"entries":[164,231],"only":[165],"need":[166],"track":[168],"one":[169],"node.":[170],"thus":[173,236],"hybrid":[176],"representation":[177],"sharers":[179],"list":[180],"whole":[183],"set.":[184],"Second,":[185],"contiguous":[186],"memory":[187],"regions":[188,238],"often":[189],"share":[190],"same":[192,234],"tracked":[198],"by":[199,259],"single":[201],"entry.":[202],"multi-granular":[206],"mechanism":[207],"does":[209],"not":[210],"rely":[211],"on":[212],"any":[213],"profiling,":[214],"compiler,":[215],"or":[216],"OS":[217],"support":[218],"identify":[220],"such":[221],"regions.":[222],"Moreover,":[223],"allows":[225],"co-existence":[226],"line":[228],"region":[230],"locations,":[235],"making":[237],"applicable.":[240],"show":[242],"both":[244],"improve":[246],"and,":[252],"when":[253],"combined,":[254],"reduce":[256],"than":[261],"an":[262],"order":[263],"magnitude":[265],"negligible":[267],"loss":[268],"precision.":[270]},"counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2018,"cited_by_count":2},{"year":2016,"cited_by_count":2},{"year":2015,"cited_by_count":1},{"year":2014,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
