{"id":"https://openalex.org/W4399771913","doi":"https://doi.org/10.1145/3615979.3656056","title":"Follow the Leader: Alternating CPU/GPU Computations in PDES","display_name":"Follow the Leader: Alternating CPU/GPU Computations in PDES","publication_year":2024,"publication_date":"2024-06-18","ids":{"openalex":"https://openalex.org/W4399771913","doi":"https://doi.org/10.1145/3615979.3656056"},"language":"en","primary_location":{"id":"doi:10.1145/3615979.3656056","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3615979.3656056","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 38th ACM SIGSIM Conference on Principles of Advanced Discrete Simulation","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5070045696","display_name":"Romolo Marotta","orcid":"https://orcid.org/0000-0001-7589-9274"},"institutions":[{"id":"https://openalex.org/I116067653","display_name":"University of Rome Tor Vergata","ror":"https://ror.org/02p77k626","country_code":"IT","type":"education","lineage":["https://openalex.org/I116067653"]}],"countries":["IT"],"is_corresponding":true,"raw_author_name":"Romolo Marotta","raw_affiliation_strings":["DICII, Tor Vergata University of Rome, Italy"],"raw_orcid":"https://orcid.org/0000-0001-7589-9274","affiliations":[{"raw_affiliation_string":"DICII, Tor Vergata University of Rome, Italy","institution_ids":["https://openalex.org/I116067653"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062882537","display_name":"Alessandro Pellegrini","orcid":"https://orcid.org/0000-0002-0179-9868"},"institutions":[{"id":"https://openalex.org/I116067653","display_name":"University of Rome Tor Vergata","ror":"https://ror.org/02p77k626","country_code":"IT","type":"education","lineage":["https://openalex.org/I116067653"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Alessandro Pellegrini","raw_affiliation_strings":["DICII, Tor Vergata University of Rome, Italy"],"raw_orcid":"https://orcid.org/0000-0002-0179-9868","affiliations":[{"raw_affiliation_string":"DICII, Tor Vergata University of Rome, Italy","institution_ids":["https://openalex.org/I116067653"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5042423448","display_name":"Philipp Andelfinger","orcid":"https://orcid.org/0000-0002-0211-7136"},"institutions":[{"id":"https://openalex.org/I4665924","display_name":"University of Rostock","ror":"https://ror.org/03zdwsf69","country_code":"DE","type":"education","lineage":["https://openalex.org/I4665924"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Philipp Andelfinger","raw_affiliation_strings":["Institute for Visual and Analytic Computing, University of Rostock, Germany"],"raw_orcid":"https://orcid.org/0000-0002-0211-7136","affiliations":[{"raw_affiliation_string":"Institute for Visual and Analytic Computing, University of Rostock, Germany","institution_ids":["https://openalex.org/I4665924"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5070045696"],"corresponding_institution_ids":["https://openalex.org/I116067653"],"apc_list":null,"apc_paid":null,"fwci":2.3051,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.88855721,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"47","last_page":"51"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10715","display_name":"Distributed and Parallel Computing Systems","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7394806146621704},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.6813297271728516},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.6172391176223755},{"id":"https://openalex.org/keywords/computational-science","display_name":"Computational science","score":0.5044358968734741},{"id":"https://openalex.org/keywords/general-purpose-computing-on-graphics-processing-units","display_name":"General-purpose computing on graphics processing units","score":0.46333280205726624},{"id":"https://openalex.org/keywords/cuda","display_name":"CUDA","score":0.4189074635505676},{"id":"https://openalex.org/keywords/computer-graphics","display_name":"Computer graphics (images)","score":0.3858048617839813},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.12858864665031433},{"id":"https://openalex.org/keywords/graphics","display_name":"Graphics","score":0.1204613447189331}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7394806146621704},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6813297271728516},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.6172391176223755},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.5044358968734741},{"id":"https://openalex.org/C50630238","wikidata":"https://www.wikidata.org/wiki/Q971505","display_name":"General-purpose computing on graphics processing units","level":3,"score":0.46333280205726624},{"id":"https://openalex.org/C2778119891","wikidata":"https://www.wikidata.org/wiki/Q477690","display_name":"CUDA","level":2,"score":0.4189074635505676},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.3858048617839813},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.12858864665031433},{"id":"https://openalex.org/C21442007","wikidata":"https://www.wikidata.org/wiki/Q1027879","display_name":"Graphics","level":2,"score":0.1204613447189331}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3615979.3656056","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3615979.3656056","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 38th ACM SIGSIM Conference on Principles of Advanced Discrete Simulation","raw_type":"proceedings-article"},{"id":"pmh:oai:art.torvergata.it:2108/381384","is_oa":false,"landing_page_url":"https://hdl.handle.net/2108/381384","pdf_url":null,"source":{"id":"https://openalex.org/S4306400993","display_name":"Cineca Institutional Research Information System (Tor Vergata University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I116067653","host_organization_name":"University of Rome Tor Vergata","host_organization_lineage":["https://openalex.org/I116067653"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/conferenceObject"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Affordable and clean energy","score":0.75,"id":"https://metadata.un.org/sdg/7"}],"awards":[{"id":"https://openalex.org/G1620070718","display_name":null,"funder_award_id":"M4C2-19","funder_id":"https://openalex.org/F4320323817","funder_display_name":"Universitas Brawijaya"},{"id":"https://openalex.org/G8040828129","display_name":null,"funder_award_id":"2022TSYYKJ","funder_id":"https://openalex.org/F4320323817","funder_display_name":"Universitas Brawijaya"}],"funders":[{"id":"https://openalex.org/F4320323817","display_name":"Universitas Brawijaya","ror":"https://ror.org/01wk3d929"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":25,"referenced_works":["https://openalex.org/W1970049774","https://openalex.org/W1984429368","https://openalex.org/W2009634341","https://openalex.org/W2017710077","https://openalex.org/W2041515442","https://openalex.org/W2047012348","https://openalex.org/W2050883661","https://openalex.org/W2085866051","https://openalex.org/W2100584922","https://openalex.org/W2102719229","https://openalex.org/W2131314877","https://openalex.org/W2134044496","https://openalex.org/W2139962185","https://openalex.org/W2147762963","https://openalex.org/W2154439184","https://openalex.org/W2615453758","https://openalex.org/W2734733109","https://openalex.org/W2810476603","https://openalex.org/W2945447941","https://openalex.org/W3033608378","https://openalex.org/W3159007080","https://openalex.org/W3160342304","https://openalex.org/W4206466197","https://openalex.org/W4233137219","https://openalex.org/W4383671702"],"related_works":["https://openalex.org/W1963859303","https://openalex.org/W2364044215","https://openalex.org/W2389600408","https://openalex.org/W240129890","https://openalex.org/W3048701459","https://openalex.org/W3213381848","https://openalex.org/W2149078538","https://openalex.org/W2080146221","https://openalex.org/W2370314112","https://openalex.org/W1912958759"],"abstract_inverted_index":{"Despite":[0],"the":[1,26,98,119,127,130,150,165,176],"successes":[2],"of":[3,29,139],"graphics":[4],"processing":[5],"units":[6],"(GPUs)":[7],"in":[8,11],"accelerating":[9],"simulations":[10],"several":[12],"research":[13],"fields,":[14],"their":[15,173],"use":[16],"is":[17,61,100],"largely":[18],"restricted":[19],"to":[20,63,80,163],"domain-specific":[21],"workloads":[22],"that":[23,78],"consistently":[24],"offer":[25],"large":[27],"degree":[28],"inherent":[30],"parallelism":[31],"and":[32,57,136,158,179,183,185],"computational":[33],"intensity":[34],"at":[35],"which":[36],"GPUs":[37],"excel.":[38],"When":[39],"targeting":[40],"generic":[41],"discrete-event":[42,71],"simulations,":[43],"whose":[44],"dynamics":[45],"can":[46],"vary":[47],"wildly":[48],"over":[49,197],"time,":[50],"a":[51,55,69,93,104,123,154,198],"static":[52,199],"choice":[53],"between":[54],"GPU-based":[56],"traditional":[58],"CPU-based":[59],"execution":[60,73,134,191],"likely":[62],"be":[64],"suboptimal.":[65],"Here,":[66],"we":[67],"explore":[68],"parallel":[70],"(PDES)":[72],"scheme":[74,125,141],"for":[75,129,148],"CPU-GPU":[76],"platforms":[77],"aims":[79],"approximate":[81],"an":[82,89,113,145],"optimal":[83],"dynamic":[84],"device":[85,96,110,152,166,200],"choice.":[86,201],"Starting":[87],"from":[88,112],"intermediate":[90,114],"model":[91,115,156],"state,":[92,157],"current":[94],"\u201cleader\u201d":[95],"running":[97],"simulation":[99],"periodically":[101],"challenged":[102],"by":[103],"brief":[105],"concurrent":[106],"run":[107],"on":[108,118,143],"another":[109],"starting":[111],"state.":[116],"Based":[117],"gathered":[120],"performance":[121,161],"measurements,":[122],"forecasting":[124,162],"determines":[126],"leader":[128],"next":[131],"period.":[132],"The":[133],"time":[135,192],"power":[137],"consumption":[138,196],"this":[140],"hinge":[142],"1)":[144],"efficient":[146],"mechanism":[147],"providing":[149],"\u201cfollower\u201d":[151],"with":[153],"consistent":[155],"2)":[159],"robust":[160],"justify":[164],"choices.":[167],"We":[168],"present":[169],"these":[170],"building":[171],"blocks,":[172],"implementation":[174],"combining":[175],"existing":[177],"CPU":[178],"GPU":[180],"simulators":[181],"ROOT-Sim":[182],"GPUTW,":[184],"measurement":[186],"results":[187],"demonstrating":[188],"substantially":[189],"reduced":[190],"without":[193],"increasing":[194],"energy":[195]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":3}],"updated_date":"2026-05-20T08:49:12.498775","created_date":"2025-10-10T00:00:00"}
