{"id":"https://openalex.org/W4396943513","doi":"https://doi.org/10.1145/3659914.3659921","title":"Using Read-After-Read Dependencies to Control Task-Granularity","display_name":"Using Read-After-Read Dependencies to Control Task-Granularity","publication_year":2024,"publication_date":"2024-05-15","ids":{"openalex":"https://openalex.org/W4396943513","doi":"https://doi.org/10.1145/3659914.3659921"},"language":"en","primary_location":{"id":"doi:10.1145/3659914.3659921","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3659914.3659921","pdf_url":null,"source":null,"license":"cc-by-nc-sa","license_id":"https://openalex.org/licenses/cc-by-nc-sa","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Platform for Advanced Scientific Computing Conference","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3659914.3659921","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5036713642","display_name":"Andres Gartmann","orcid":"https://orcid.org/0009-0009-1746-2256"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Andres Gartmann","raw_affiliation_strings":["mynatix ag, Basel, Switzerland"],"raw_orcid":"https://orcid.org/0009-0009-1746-2256","affiliations":[{"raw_affiliation_string":"mynatix ag, Basel, Switzerland","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5011908306","display_name":"Mathias M\u00fcller","orcid":"https://orcid.org/0009-0008-1750-0817"},"institutions":[{"id":"https://openalex.org/I1324989862","display_name":"Federal Office of Meteorology and Climatology MeteoSwiss","ror":"https://ror.org/03wbkx358","country_code":"CH","type":"government","lineage":["https://openalex.org/I1324989862"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Mathias M\u00fcller","raw_affiliation_strings":["meteoblue ag, Basel, Switzerland"],"raw_orcid":"https://orcid.org/0009-0008-1750-0817","affiliations":[{"raw_affiliation_string":"meteoblue ag, Basel, Switzerland","institution_ids":["https://openalex.org/I1324989862"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5036713642"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0509023,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"12"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10904","display_name":"Embedded Systems Design Techniques","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9958999752998352,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.9016637802124023},{"id":"https://openalex.org/keywords/compiler","display_name":"Compiler","score":0.8578715324401855},{"id":"https://openalex.org/keywords/granularity","display_name":"Granularity","score":0.7736152410507202},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.7712696194648743},{"id":"https://openalex.org/keywords/automatic-parallelization","display_name":"Automatic parallelization","score":0.7102557420730591},{"id":"https://openalex.org/keywords/multi-core-processor","display_name":"Multi-core processor","score":0.5676976442337036},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5577766299247742},{"id":"https://openalex.org/keywords/parallelism","display_name":"Parallelism (grammar)","score":0.5381762385368347},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5014793872833252},{"id":"https://openalex.org/keywords/data-parallelism","display_name":"Data parallelism","score":0.49563753604888916},{"id":"https://openalex.org/keywords/task-parallelism","display_name":"Task parallelism","score":0.47755131125450134},{"id":"https://openalex.org/keywords/instruction-level-parallelism","display_name":"Instruction-level parallelism","score":0.47391045093536377},{"id":"https://openalex.org/keywords/optimizing-compiler","display_name":"Optimizing compiler","score":0.46475473046302795},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.4559626281261444},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.42841485142707825},{"id":"https://openalex.org/keywords/program-optimization","display_name":"Program optimization","score":0.42298731207847595},{"id":"https://openalex.org/keywords/code-generation","display_name":"Code generation","score":0.42235875129699707},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.3926345109939575},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.30611854791641235},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.13872435688972473},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.07254448533058167}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.9016637802124023},{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.8578715324401855},{"id":"https://openalex.org/C177774035","wikidata":"https://www.wikidata.org/wiki/Q1246948","display_name":"Granularity","level":2,"score":0.7736152410507202},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.7712696194648743},{"id":"https://openalex.org/C164833996","wikidata":"https://www.wikidata.org/wiki/Q2323839","display_name":"Automatic parallelization","level":3,"score":0.7102557420730591},{"id":"https://openalex.org/C78766204","wikidata":"https://www.wikidata.org/wiki/Q555032","display_name":"Multi-core processor","level":2,"score":0.5676976442337036},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5577766299247742},{"id":"https://openalex.org/C2781172179","wikidata":"https://www.wikidata.org/wiki/Q853109","display_name":"Parallelism (grammar)","level":2,"score":0.5381762385368347},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5014793872833252},{"id":"https://openalex.org/C61483411","wikidata":"https://www.wikidata.org/wiki/Q3124522","display_name":"Data parallelism","level":3,"score":0.49563753604888916},{"id":"https://openalex.org/C42992933","wikidata":"https://www.wikidata.org/wiki/Q691169","display_name":"Task parallelism","level":3,"score":0.47755131125450134},{"id":"https://openalex.org/C140763907","wikidata":"https://www.wikidata.org/wiki/Q2714055","display_name":"Instruction-level parallelism","level":3,"score":0.47391045093536377},{"id":"https://openalex.org/C190902152","wikidata":"https://www.wikidata.org/wiki/Q1325106","display_name":"Optimizing compiler","level":3,"score":0.46475473046302795},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.4559626281261444},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.42841485142707825},{"id":"https://openalex.org/C139571649","wikidata":"https://www.wikidata.org/wiki/Q1156793","display_name":"Program optimization","level":3,"score":0.42298731207847595},{"id":"https://openalex.org/C133162039","wikidata":"https://www.wikidata.org/wiki/Q1061077","display_name":"Code generation","level":3,"score":0.42235875129699707},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.3926345109939575},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.30611854791641235},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.13872435688972473},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.07254448533058167},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3659914.3659921","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3659914.3659921","pdf_url":null,"source":null,"license":"cc-by-nc-sa","license_id":"https://openalex.org/licenses/cc-by-nc-sa","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Platform for Advanced Scientific Computing Conference","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3659914.3659921","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3659914.3659921","pdf_url":null,"source":null,"license":"cc-by-nc-sa","license_id":"https://openalex.org/licenses/cc-by-nc-sa","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Platform for Advanced Scientific Computing Conference","raw_type":"proceedings-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.5199999809265137}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":20,"referenced_works":["https://openalex.org/W90084074","https://openalex.org/W1518236483","https://openalex.org/W1635779336","https://openalex.org/W1820550104","https://openalex.org/W1833044483","https://openalex.org/W2046712264","https://openalex.org/W2094969361","https://openalex.org/W2126089060","https://openalex.org/W2135736783","https://openalex.org/W2167089275","https://openalex.org/W2268502312","https://openalex.org/W2274823567","https://openalex.org/W2796604629","https://openalex.org/W2913591599","https://openalex.org/W2913813246","https://openalex.org/W3158965208","https://openalex.org/W4232333333","https://openalex.org/W4234573405","https://openalex.org/W4246166885","https://openalex.org/W4250981202"],"related_works":["https://openalex.org/W4240606930","https://openalex.org/W2526302199","https://openalex.org/W2003935582","https://openalex.org/W2950520577","https://openalex.org/W3007272028","https://openalex.org/W2040503315","https://openalex.org/W168408236","https://openalex.org/W2494130044","https://openalex.org/W2126220043","https://openalex.org/W1567267707"],"abstract_inverted_index":{"In":[0],"compiler":[1],"theory,":[2],"data":[3,42],"analysis":[4,76],"is":[5,120,131,144],"used":[6,16],"to":[7,27,50,60,90,110,133,141,153,173],"exploit":[8],"Instruction":[9],"Level":[10],"Parallelism":[11],"(ILP).":[12],"Three":[13],"dependencies":[14],"are":[15,25,171],"in":[17,57],"modern":[18],"compilers":[19],"and":[20,24,77,106,127,135,168],"hardware":[21],"schemes":[22],"efficiently":[23],"fundamental":[26],"any":[28,58],"code":[29,59,75,89,105,115],"compilation.":[30],"Read-after-read":[31],"(RAR)":[32],"has":[33],"been":[34],"left":[35],"out,":[36],"as":[37],"it":[38],"cannot":[39],"cause":[40],"a":[41,47,91,123,142,162],"hazard.":[43],"This":[44,83],"article":[45],"introduces":[46,78],"novel":[48,118],"method":[49,65],"use":[51],"the":[52,100,104,129,147,155,159],"additional":[53],"dependence":[54],"information":[55,98],"contained":[56],"enhance":[61],"automatic":[62,139],"parallelization.":[63],"The":[64,94,117,138,151],"builds":[66],"groups":[67],"of":[68,103,158],"arbitrary":[69],"sequential":[70],"instruction":[71],"chains":[72],"during":[73,113],"static":[74,114],"potential-transfers":[79],"between":[80],"these":[81],"groups.":[82],"gives":[84],"new":[85,148],"opportunities":[86,109],"when":[87],"optimizing":[88],"parallel-processing":[92],"hardware.":[93],"segmentation":[95,130,149],"enables":[96],"more":[97],"concerning":[99],"potential":[101],"parallelization":[102,140],"enhances":[107],"optimization":[108],"be":[111],"gained":[112],"analysis.":[116],"principle":[119],"introduced":[121],"using":[122,146],"very":[124],"simple":[125],"example":[126],"then":[128],"applied":[132],"task-":[134],"data-parallelism":[136],"examples.":[137],"multicore-platform":[143],"demonstrated":[145],"method.":[150],"ability":[152],"forecast":[154],"optimal":[156],"distribution":[157],"segments":[160],"for":[161],"platform":[163],"with":[164],"two":[165],"key":[166],"parameters":[167],"resulting":[169],"codes":[170],"compared":[172],"measured":[174],"speedups.":[175]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
