{"id":"https://openalex.org/W7117234435","doi":"https://doi.org/10.48550/arxiv.2512.19851","title":"An Adaptive Distributed Stencil Abstraction for GPUs","display_name":"An Adaptive Distributed Stencil Abstraction for GPUs","publication_year":2025,"publication_date":"2025-12-22","ids":{"openalex":"https://openalex.org/W7117234435","doi":"https://doi.org/10.48550/arxiv.2512.19851"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2512.19851","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2512.19851","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2512.19851","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5030288518","display_name":"Aditya Bhosale","orcid":"https://orcid.org/0000-0003-1876-6138"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Bhosale, Aditya","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5051465480","display_name":"Laxmikant V. Kal\u00e9","orcid":"https://orcid.org/0000-0001-9673-8445"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kale, Laxmikant","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5030288518"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9053000211715698,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9053000211715698,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10126","display_name":"Logic, programming, and type systems","score":0.018699999898672104,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10904","display_name":"Embedded Systems Design Techniques","score":0.018400000408291817,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/stencil","display_name":"Stencil","score":0.7742000222206116},{"id":"https://openalex.org/keywords/abstraction","display_name":"Abstraction","score":0.6152999997138977},{"id":"https://openalex.org/keywords/python","display_name":"Python (programming language)","score":0.6054999828338623},{"id":"https://openalex.org/keywords/porting","display_name":"Porting","score":0.44839999079704285},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.3813999891281128},{"id":"https://openalex.org/keywords/digital-subscriber-line","display_name":"Digital subscriber line","score":0.35010001063346863},{"id":"https://openalex.org/keywords/metaprogramming","display_name":"Metaprogramming","score":0.3479999899864197},{"id":"https://openalex.org/keywords/abstraction-layer","display_name":"Abstraction layer","score":0.34529998898506165}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8215000033378601},{"id":"https://openalex.org/C76752949","wikidata":"https://www.wikidata.org/wiki/Q7607499","display_name":"Stencil","level":2,"score":0.7742000222206116},{"id":"https://openalex.org/C124304363","wikidata":"https://www.wikidata.org/wiki/Q673661","display_name":"Abstraction","level":2,"score":0.6152999997138977},{"id":"https://openalex.org/C519991488","wikidata":"https://www.wikidata.org/wiki/Q28865","display_name":"Python (programming language)","level":2,"score":0.6054999828338623},{"id":"https://openalex.org/C106251023","wikidata":"https://www.wikidata.org/wiki/Q851989","display_name":"Porting","level":3,"score":0.44839999079704285},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.4399999976158142},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.4268999993801117},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.3813999891281128},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.36419999599456787},{"id":"https://openalex.org/C201374245","wikidata":"https://www.wikidata.org/wiki/Q104534","display_name":"Digital subscriber line","level":2,"score":0.35010001063346863},{"id":"https://openalex.org/C35390924","wikidata":"https://www.wikidata.org/wiki/Q661075","display_name":"Metaprogramming","level":2,"score":0.3479999899864197},{"id":"https://openalex.org/C147358964","wikidata":"https://www.wikidata.org/wiki/Q1200992","display_name":"Abstraction layer","level":3,"score":0.34529998898506165},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.3269999921321869},{"id":"https://openalex.org/C2742236","wikidata":"https://www.wikidata.org/wiki/Q924713","display_name":"Efficient energy use","level":2,"score":0.32679998874664307},{"id":"https://openalex.org/C60048249","wikidata":"https://www.wikidata.org/wiki/Q37437","display_name":"Syntax","level":2,"score":0.325300008058548},{"id":"https://openalex.org/C96324660","wikidata":"https://www.wikidata.org/wiki/Q205446","display_name":"Dataflow","level":2,"score":0.3237000107765198},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.30970001220703125},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.30379998683929443},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.29010000824928284},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.26980000734329224},{"id":"https://openalex.org/C206345919","wikidata":"https://www.wikidata.org/wiki/Q20380951","display_name":"Resource (disambiguation)","level":2,"score":0.26019999384880066},{"id":"https://openalex.org/C199519371","wikidata":"https://www.wikidata.org/wiki/Q942695","display_name":"Source lines of code","level":3,"score":0.25940001010894775},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.2524000108242035},{"id":"https://openalex.org/C2778514511","wikidata":"https://www.wikidata.org/wiki/Q1374194","display_name":"Programmer","level":2,"score":0.2508000135421753}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2512.19851","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2512.19851","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2512.19851","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2512.19851","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/7","display_name":"Affordable and clean energy","score":0.7032195329666138}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"The":[0,26],"scientific":[1],"computing":[2],"ecosystem":[3],"in":[4,18],"Python":[5],"is":[6,69],"largely":[7],"confined":[8],"to":[9,87,94],"single-node":[10],"parallelism,":[11],"creating":[12],"a":[13,42,73,83,108,112,119,138,144],"gap":[14],"between":[15],"high-level":[16],"prototyping":[17],"NumPy":[19,146],"and":[20,32,81,117,143],"high-performance":[21,140],"execution":[22],"on":[23,64,76],"modern":[24],"supercomputers.":[25],"increasing":[27],"prevalence":[28],"of":[29,102,115,122],"hardware":[30],"accelerators":[31],"the":[33,77,89,99,123],"need":[34],"for":[35,61],"energy":[36],"efficiency":[37],"have":[38],"made":[39],"resource":[40,100],"adaptivity":[41],"critical":[43],"requirement,":[44],"yet":[45],"traditional":[46],"HPC":[47],"abstractions":[48],"remain":[49],"rigid.":[50],"To":[51],"address":[52],"these":[53],"challenges,":[54],"we":[55,127],"present":[56,118],"an":[57],"adaptive,":[58],"distributed":[59],"abstraction":[60,68,104,131],"stencil":[62,141],"computations":[63],"multi-node":[65],"GPUs.":[66],"This":[67],"built":[70],"using":[71],"CharmTyles,":[72],"framework":[74],"based":[75],"adaptive":[78],"Charm++":[79],"runtime,":[80],"features":[82],"familiar":[84],"NumPy-like":[85],"syntax":[86],"minimize":[88],"porting":[90],"effort":[91],"from":[92],"prototype":[93],"production":[95],"code.":[96],"We":[97],"showcase":[98],"elasticity":[101],"our":[103,130],"by":[105],"dynamically":[106],"rescaling":[107],"running":[109],"application":[110],"across":[111],"different":[113],"number":[114],"nodes":[116],"performance":[120,134],"analysis":[121],"associated":[124],"overheads.":[125],"Furthermore,":[126],"demonstrate":[128],"that":[129],"achieves":[132],"significant":[133],"improvements":[135],"over":[136],"both":[137],"specialized,":[139],"DSL":[142],"generalized":[145],"replacement.":[147]},"counts_by_year":[],"updated_date":"2025-12-25T23:15:44.422516","created_date":"2025-12-25T00:00:00"}
