{"id":"https://openalex.org/W2072763916","doi":"https://doi.org/10.1016/j.procs.2013.05.416","title":"Efficient Synchronization for Stencil Computations Using Dynamic Task Graphs","display_name":"Efficient Synchronization for Stencil Computations Using Dynamic Task Graphs","publication_year":2013,"publication_date":"2013-01-01","ids":{"openalex":"https://openalex.org/W2072763916","doi":"https://doi.org/10.1016/j.procs.2013.05.416","mag":"2072763916"},"language":"en","primary_location":{"id":"doi:10.1016/j.procs.2013.05.416","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.procs.2013.05.416","pdf_url":null,"source":{"id":"https://openalex.org/S120348307","display_name":"Procedia Computer Science","issn_l":"1877-0509","issn":["1877-0509"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Procedia Computer Science","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://doi.org/10.1016/j.procs.2013.05.416","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5039595706","display_name":"Zubair Wadood Bhatti","orcid":null},"institutions":[{"id":"https://openalex.org/I99464096","display_name":"KU Leuven","ror":"https://ror.org/05f950310","country_code":"BE","type":"education","lineage":["https://openalex.org/I99464096"]},{"id":"https://openalex.org/I39327780","display_name":"iMinds","ror":"https://ror.org/03baec336","country_code":"BE","type":"nonprofit","lineage":["https://openalex.org/I39327780"]}],"countries":["BE"],"is_corresponding":true,"raw_author_name":"Zubair Wadood Bhatti","raw_affiliation_strings":["iMinds-DistriNet, KU Leuven, Celestijnenlaan 200A, B-3001 Leuven, Belgium"],"affiliations":[{"raw_affiliation_string":"iMinds-DistriNet, KU Leuven, Celestijnenlaan 200A, B-3001 Leuven, Belgium","institution_ids":["https://openalex.org/I39327780","https://openalex.org/I99464096"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069634715","display_name":"Roel Wuyts","orcid":"https://orcid.org/0000-0003-4236-995X"},"institutions":[{"id":"https://openalex.org/I39327780","display_name":"iMinds","ror":"https://ror.org/03baec336","country_code":"BE","type":"nonprofit","lineage":["https://openalex.org/I39327780"]},{"id":"https://openalex.org/I4210114974","display_name":"IMEC","ror":"https://ror.org/02kcbn207","country_code":"BE","type":"nonprofit","lineage":["https://openalex.org/I4210114974"]},{"id":"https://openalex.org/I99464096","display_name":"KU Leuven","ror":"https://ror.org/05f950310","country_code":"BE","type":"education","lineage":["https://openalex.org/I99464096"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Roel Wuyts","raw_affiliation_strings":["Intel ExaScience Lab, Kapeldreef 75, B-3001 Leuven, Belgium","iMinds-DistriNet, KU Leuven, Celestijnenlaan 200A, B-3001 Leuven, Belgium","imec, Kapeldreef 75, B-3001 Leuven, Belgium"],"affiliations":[{"raw_affiliation_string":"Intel ExaScience Lab, Kapeldreef 75, B-3001 Leuven, Belgium","institution_ids":[]},{"raw_affiliation_string":"iMinds-DistriNet, KU Leuven, Celestijnenlaan 200A, B-3001 Leuven, Belgium","institution_ids":["https://openalex.org/I39327780","https://openalex.org/I99464096"]},{"raw_affiliation_string":"imec, Kapeldreef 75, B-3001 Leuven, Belgium","institution_ids":["https://openalex.org/I4210114974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082125013","display_name":"Pascal Costanza","orcid":"https://orcid.org/0000-0001-8894-3238"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pascal Costanza","raw_affiliation_strings":["Intel ExaScience Lab, Kapeldreef 75, B-3001 Leuven, Belgium","Intel, Belgium, Veldkant 31, 2550 Kontich, Belgium"],"affiliations":[{"raw_affiliation_string":"Intel ExaScience Lab, Kapeldreef 75, B-3001 Leuven, Belgium","institution_ids":[]},{"raw_affiliation_string":"Intel, Belgium, Veldkant 31, 2550 Kontich, Belgium","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069939159","display_name":"Davy Preuveneers","orcid":"https://orcid.org/0000-0001-6279-4430"},"institutions":[{"id":"https://openalex.org/I39327780","display_name":"iMinds","ror":"https://ror.org/03baec336","country_code":"BE","type":"nonprofit","lineage":["https://openalex.org/I39327780"]},{"id":"https://openalex.org/I99464096","display_name":"KU Leuven","ror":"https://ror.org/05f950310","country_code":"BE","type":"education","lineage":["https://openalex.org/I99464096"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Davy Preuveneers","raw_affiliation_strings":["iMinds-DistriNet, KU Leuven, Celestijnenlaan 200A, B-3001 Leuven, Belgium"],"affiliations":[{"raw_affiliation_string":"iMinds-DistriNet, KU Leuven, Celestijnenlaan 200A, B-3001 Leuven, Belgium","institution_ids":["https://openalex.org/I39327780","https://openalex.org/I99464096"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5112215809","display_name":"Yolande Berbers","orcid":null},"institutions":[{"id":"https://openalex.org/I99464096","display_name":"KU Leuven","ror":"https://ror.org/05f950310","country_code":"BE","type":"education","lineage":["https://openalex.org/I99464096"]},{"id":"https://openalex.org/I39327780","display_name":"iMinds","ror":"https://ror.org/03baec336","country_code":"BE","type":"nonprofit","lineage":["https://openalex.org/I39327780"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Yolande Berbers","raw_affiliation_strings":["iMinds-DistriNet, KU Leuven, Celestijnenlaan 200A, B-3001 Leuven, Belgium"],"affiliations":[{"raw_affiliation_string":"iMinds-DistriNet, KU Leuven, Celestijnenlaan 200A, B-3001 Leuven, Belgium","institution_ids":["https://openalex.org/I39327780","https://openalex.org/I99464096"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5039595706"],"corresponding_institution_ids":["https://openalex.org/I39327780","https://openalex.org/I99464096"],"apc_list":null,"apc_paid":null,"fwci":0.3152,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.61503437,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":"18","issue":null,"first_page":"2428","last_page":"2431"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10715","display_name":"Distributed and Parallel Computing Systems","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/stencil","display_name":"Stencil","score":0.98789381980896},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8975390791893005},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.7206323146820068},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.6967933177947998},{"id":"https://openalex.org/keywords/synchronization","display_name":"Synchronization (alternating current)","score":0.6870007514953613},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.5811976790428162},{"id":"https://openalex.org/keywords/compiler","display_name":"Compiler","score":0.5604650378227234},{"id":"https://openalex.org/keywords/reduction","display_name":"Reduction (mathematics)","score":0.4820576608181},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.41148635745048523},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.3834591209888458},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.18830835819244385},{"id":"https://openalex.org/keywords/computational-science","display_name":"Computational science","score":0.18380841612815857},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.11553600430488586},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.07864966988563538}],"concepts":[{"id":"https://openalex.org/C76752949","wikidata":"https://www.wikidata.org/wiki/Q7607499","display_name":"Stencil","level":2,"score":0.98789381980896},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8975390791893005},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.7206323146820068},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.6967933177947998},{"id":"https://openalex.org/C2778562939","wikidata":"https://www.wikidata.org/wiki/Q1298791","display_name":"Synchronization (alternating current)","level":3,"score":0.6870007514953613},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.5811976790428162},{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.5604650378227234},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.4820576608181},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.41148635745048523},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.3834591209888458},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.18830835819244385},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.18380841612815857},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.11553600430488586},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.07864966988563538},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1016/j.procs.2013.05.416","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.procs.2013.05.416","pdf_url":null,"source":{"id":"https://openalex.org/S120348307","display_name":"Procedia Computer Science","issn_l":"1877-0509","issn":["1877-0509"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Procedia Computer Science","raw_type":"journal-article"},{"id":"pmh:oai:lirias2repo.kuleuven.be:123456789/411363","is_oa":false,"landing_page_url":"https://lirias.kuleuven.be/bitstream/123456789/411363/1/iccs.pdf","pdf_url":null,"source":{"id":"https://openalex.org/S4306401954","display_name":"Lirias (KU Leuven)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I99464096","host_organization_name":"KU Leuven","host_organization_lineage":["https://openalex.org/I99464096"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"International Conference on Computational Science, Barcelona, Spain, 5-7 June 2013","raw_type":"info:eu-repo/semantics/publishedVersion"}],"best_oa_location":{"id":"doi:10.1016/j.procs.2013.05.416","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.procs.2013.05.416","pdf_url":null,"source":{"id":"https://openalex.org/S120348307","display_name":"Procedia Computer Science","issn_l":"1877-0509","issn":["1877-0509"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Procedia Computer Science","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320322308","display_name":"KU Leuven","ror":"https://ror.org/05f950310"},{"id":"https://openalex.org/F4320327336","display_name":"Vlaamse regering","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":3,"referenced_works":["https://openalex.org/W1968116929","https://openalex.org/W2104512032","https://openalex.org/W2129298093"],"related_works":["https://openalex.org/W2039378765","https://openalex.org/W1569349362","https://openalex.org/W2003798513","https://openalex.org/W2890431355","https://openalex.org/W2151764765","https://openalex.org/W4376875029","https://openalex.org/W2315600872","https://openalex.org/W2097757554","https://openalex.org/W3149084271","https://openalex.org/W2150319905"],"abstract_inverted_index":{"Executing":[0],"stencil":[1,25,58,77,104],"computations":[2,59],"constitutes":[3],"a":[4,29,49,89,97],"significant":[5],"portion":[6],"of":[7,23,39,57,76],"execution":[8,82],"time":[9],"for":[10,52],"many":[11],"numerical":[12],"simulations":[13],"running":[14],"on":[15],"high":[16],"performance":[17],"computing":[18],"systems.":[19],"Most":[20],"parallel":[21],"implementations":[22],"these":[24,41],"operations":[26,78],"suffer":[27],"from":[28],"substantial":[30],"synchronization":[31,42,55,92],"overhead.":[32],"Furthermore,":[33],"with":[34],"the":[35,54,81],"rapidly":[36],"increasing":[37],"number":[38],"cores":[40],"costs":[43],"keep":[44],"rising.":[45],"This":[46],"paper":[47],"presents":[48],"novel":[50],"approach":[51],"reducing":[53],"overhead":[56,93],"by":[60,94],"leveraging":[61],"dynamic":[62],"task":[63],"graphs":[64],"to":[65,79,102],"avoid":[66],"global":[67],"barriers":[68],"and":[69,72,83,108],"minimizing":[70],"spin-waiting,":[71],"exploiting":[73],"basic":[74],"properties":[75],"optimize":[80],"memory":[84],"management.":[85],"Our":[86],"experiments":[87],"show":[88],"reduction":[90],"in":[91],"at":[95],"least":[96],"factor":[98],"four":[99],"when":[100],"compared":[101],"state-of-the-art":[103],"compilers":[105],"like":[106],"Pochoir":[107],"Patus.":[109]},"counts_by_year":[{"year":2018,"cited_by_count":1},{"year":2015,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
