{"id":"https://openalex.org/W4396817063","doi":"https://doi.org/10.1145/3665643","title":"(De/Re)-Composition of Data-Parallel Computations via Multi-Dimensional Homomorphisms","display_name":"(De/Re)-Composition of Data-Parallel Computations via Multi-Dimensional Homomorphisms","publication_year":2024,"publication_date":"2024-05-22","ids":{"openalex":"https://openalex.org/W4396817063","doi":"https://doi.org/10.1145/3665643"},"language":"en","primary_location":{"id":"doi:10.1145/3665643","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3665643","pdf_url":null,"source":{"id":"https://openalex.org/S41449414","display_name":"ACM Transactions on Programming Languages and Systems","issn_l":"0164-0925","issn":["0164-0925","1558-4593"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Programming Languages and Systems","raw_type":"journal-article"},"type":"preprint","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2405.05118","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5017852288","display_name":"Ari Rasch","orcid":"https://orcid.org/0000-0002-0286-0755"},"institutions":[{"id":"https://openalex.org/I22465464","display_name":"University of M\u00fcnster","ror":"https://ror.org/00pd74e08","country_code":"DE","type":"education","lineage":["https://openalex.org/I22465464"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Ari Rasch","raw_affiliation_strings":["University of Muenster, Germany"],"raw_orcid":"https://orcid.org/0000-0002-0286-0755","affiliations":[{"raw_affiliation_string":"University of Muenster, Germany","institution_ids":["https://openalex.org/I22465464"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5017852288"],"corresponding_institution_ids":["https://openalex.org/I22465464"],"apc_list":null,"apc_paid":null,"fwci":3.2173,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.92885572,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":98},"biblio":{"volume":"46","issue":"3","first_page":"1","last_page":"74"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.7815999984741211,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.7815999984741211,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10715","display_name":"Distributed and Parallel Computing Systems","score":0.7760000228881836,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10829","display_name":"Interconnection Networks and Systems","score":0.7088000178337097,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/homomorphism","display_name":"Homomorphism","score":0.7828826904296875},{"id":"https://openalex.org/keywords/composition","display_name":"Composition (language)","score":0.7092142701148987},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.6677026748657227},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5481827259063721},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.49259883165359497},{"id":"https://openalex.org/keywords/computational-science","display_name":"Computational science","score":0.39048197865486145},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.28686678409576416},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.2734798491001129},{"id":"https://openalex.org/keywords/discrete-mathematics","display_name":"Discrete mathematics","score":0.21587282419204712},{"id":"https://openalex.org/keywords/art","display_name":"Art","score":0.05895400047302246}],"concepts":[{"id":"https://openalex.org/C4042151","wikidata":"https://www.wikidata.org/wiki/Q215111","display_name":"Homomorphism","level":2,"score":0.7828826904296875},{"id":"https://openalex.org/C40231798","wikidata":"https://www.wikidata.org/wiki/Q1333743","display_name":"Composition (language)","level":2,"score":0.7092142701148987},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.6677026748657227},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5481827259063721},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.49259883165359497},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.39048197865486145},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.28686678409576416},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.2734798491001129},{"id":"https://openalex.org/C118615104","wikidata":"https://www.wikidata.org/wiki/Q121416","display_name":"Discrete mathematics","level":1,"score":0.21587282419204712},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.05895400047302246},{"id":"https://openalex.org/C124952713","wikidata":"https://www.wikidata.org/wiki/Q8242","display_name":"Literature","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3665643","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3665643","pdf_url":null,"source":{"id":"https://openalex.org/S41449414","display_name":"ACM Transactions on Programming Languages and Systems","issn_l":"0164-0925","issn":["0164-0925","1558-4593"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Programming Languages and Systems","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:2405.05118","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2405.05118","pdf_url":"https://arxiv.org/pdf/2405.05118","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2405.05118","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2405.05118","pdf_url":"https://arxiv.org/pdf/2405.05118","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G940864400","display_name":null,"funder_award_id":"470527619","funder_id":"https://openalex.org/F4320320879","funder_display_name":"Deutsche Forschungsgemeinschaft"}],"funders":[{"id":"https://openalex.org/F4320320879","display_name":"Deutsche Forschungsgemeinschaft","ror":"https://ror.org/018mejw64"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":104,"referenced_works":["https://openalex.org/W92174080","https://openalex.org/W1191262899","https://openalex.org/W1559314111","https://openalex.org/W1565278861","https://openalex.org/W1964962870","https://openalex.org/W1970141743","https://openalex.org/W1975001341","https://openalex.org/W1983051972","https://openalex.org/W1997978901","https://openalex.org/W2000882268","https://openalex.org/W2017627169","https://openalex.org/W2023415862","https://openalex.org/W2024880014","https://openalex.org/W2047656763","https://openalex.org/W2049890071","https://openalex.org/W2055312318","https://openalex.org/W2071110673","https://openalex.org/W2073061372","https://openalex.org/W2077143534","https://openalex.org/W2090504951","https://openalex.org/W2093843662","https://openalex.org/W2095875205","https://openalex.org/W2096070062","https://openalex.org/W2098220211","https://openalex.org/W2100218206","https://openalex.org/W2101807486","https://openalex.org/W2102976251","https://openalex.org/W2103838950","https://openalex.org/W2104958979","https://openalex.org/W2107096626","https://openalex.org/W2108315152","https://openalex.org/W2128249697","https://openalex.org/W2136952590","https://openalex.org/W2151788546","https://openalex.org/W2152506070","https://openalex.org/W2162265576","https://openalex.org/W2166696935","https://openalex.org/W2258220747","https://openalex.org/W2291192259","https://openalex.org/W2336894004","https://openalex.org/W2471164860","https://openalex.org/W2495029002","https://openalex.org/W2515471963","https://openalex.org/W2521727659","https://openalex.org/W2582080653","https://openalex.org/W2590246587","https://openalex.org/W2644985445","https://openalex.org/W2743401659","https://openalex.org/W2772612468","https://openalex.org/W2791673912","https://openalex.org/W2898099374","https://openalex.org/W2898442528","https://openalex.org/W2912012512","https://openalex.org/W2913154098","https://openalex.org/W2914500262","https://openalex.org/W2917361956","https://openalex.org/W2932894012","https://openalex.org/W2943813107","https://openalex.org/W2944745903","https://openalex.org/W2949967139","https://openalex.org/W2954698171","https://openalex.org/W2954733970","https://openalex.org/W2962835968","https://openalex.org/W2964301839","https://openalex.org/W2979365412","https://openalex.org/W2987684178","https://openalex.org/W2987973366","https://openalex.org/W2999868588","https://openalex.org/W3012249773","https://openalex.org/W3047091820","https://openalex.org/W3086093316","https://openalex.org/W3090487264","https://openalex.org/W3115446638","https://openalex.org/W3118873362","https://openalex.org/W3122286897","https://openalex.org/W3122888791","https://openalex.org/W3123054690","https://openalex.org/W3132222959","https://openalex.org/W3136479147","https://openalex.org/W3139323122","https://openalex.org/W3158477547","https://openalex.org/W3195241200","https://openalex.org/W3196818429","https://openalex.org/W4205614912","https://openalex.org/W4206384897","https://openalex.org/W4220690649","https://openalex.org/W4220818654","https://openalex.org/W4221031300","https://openalex.org/W4225158182","https://openalex.org/W4237609491","https://openalex.org/W4240382083","https://openalex.org/W4245208434","https://openalex.org/W4246166885","https://openalex.org/W4248445937","https://openalex.org/W4281768830","https://openalex.org/W4281932226","https://openalex.org/W4318541538","https://openalex.org/W4321184872","https://openalex.org/W4321496341","https://openalex.org/W4327930469","https://openalex.org/W4392266023","https://openalex.org/W4396817063","https://openalex.org/W6600662749","https://openalex.org/W6601630192"],"related_works":["https://openalex.org/W4308159138","https://openalex.org/W4327811209","https://openalex.org/W1979798674","https://openalex.org/W3169947911","https://openalex.org/W3037616202","https://openalex.org/W2963079901","https://openalex.org/W390508480","https://openalex.org/W2294450783","https://openalex.org/W2375240985","https://openalex.org/W1429949169"],"abstract_inverted_index":{"Data-parallel":[0],"computations,":[1,9,114,295,304],"such":[2,30],"as":[3,144,280],"linear":[4,90,297],"algebra":[5,91,298],"routines":[6,92],"and":[7,35,41,67,86,118,157,170,173,191,220,245,250,256,283,289,301,308],"stencil":[8,98,300],"constitute":[10],"one":[11],"of":[12,38,83,113,136,154,161,176,211,214,226,247,293],"the":[13,33,43,49,101,122,133,168,205,208,224,241,248],"most":[14],"relevant":[15],"classes":[16,213],"in":[17,204],"parallel":[18,163],"computing,":[19],"e.g.,":[20,65],"due":[21,315],"to":[22,48,57,72,79,147,150,202,316],"their":[23,254,317],"importance":[24],"for":[25,32,54,61,109,121,158,185,240,290,319],"deep":[26,169,320],"learning.":[27,321],"Efficiently":[28],"de-composing":[29],"computations":[31,63,85,156,309],"memory":[34,172,257],"core":[36,174],"hierarchies":[37,175],"modern":[39],"architectures":[40,87],"re-composing":[42],"computed":[44],"intermediate":[45],"results":[46],"back":[47],"final":[50],"result\u2014we":[51],"say":[52],"(de/re)-composition":[53,112,129,183,209],"short\u2014is":[55],"key":[56],"achieve":[58,267],"high":[59,313],"performance":[60,269],"these":[62],"on,":[64],"GPU":[66,95],"CPU.":[68],"Current":[69],"high-level":[70],"approaches":[71,102,216],"generating":[73,231],"data-parallel":[74,84,155,294],"code":[75,232],"are":[76],"often":[77],"restricted":[78],"a":[80,105,110,127,151,186,291],"particular":[81,242],"subclass":[82],"(e.g.,":[88,253],"only":[89,94,97],"on":[93,104,132,286],"or":[96],"computations),":[99],"and/or":[100],"rely":[103],"user-guided":[106],"optimization":[107],"process":[108],"well-performing":[111],"which":[115],"is":[116,142,199],"complex":[117,171],"error":[119],"prone":[120],"user.":[123],"We":[124,194],"formally":[125],"introduce":[126],"systematic":[128],"approach,":[130],"based":[131],"algebraic":[134],"formalism":[135],"Multi-Dimensional":[137],"Homomorphisms":[138],"(MDHs).":[139],"Our":[140],"approach":[141,184,198],"designed":[143],"general":[145],"enough":[146,201],"be":[148,235],"applicable":[149],"wide":[152],"range":[153],"various":[159],"kinds":[160],"target":[162,167,243],"architectures.":[164],"To":[165],"efficiently":[166],"contemporary":[177],"architectures,":[178],"we":[179,221,266],"exploit":[180],"our":[181,197,227,260],"introduced":[182],"correct-by-construction,":[187],"parametrized":[188],"cache":[189],"blocking,":[190],"parallelization":[192],"strategy.":[193],"show":[195],"that":[196,223,233,263,310],"powerful":[200],"express,":[203],"same":[206],"formalism,":[207],"strategies":[210,228],"different":[212],"state-of-the-art":[215,271],"(scheduling-based,":[217],"polyhedral,":[218],"etc.),":[219],"demonstrate":[222],"parameters":[225],"enable":[229],"systematically":[230],"can":[234],"fully":[236],"automatically":[237],"optimized":[238],"(auto-tuned)":[239],"architecture":[244],"characteristics":[246],"input":[249],"output":[251],"data":[252,305],"sizes":[255],"layouts).":[258],"Particularly,":[259],"experiments":[261],"confirm":[262],"via":[264],"auto-tuning,":[265],"higher":[268],"than":[270],"approaches,":[272],"including":[273,296],"hand-optimized":[274],"solutions":[275],"provided":[276],"by":[277],"vendors":[278],"(such":[279],"NVIDIA":[281],"cuBLAS/cuDNN":[282],"Intel":[284],"oneMKL/oneDNN),":[285],"real-world":[287],"datasets":[288],"variety":[292],"routines,":[299],"quantum":[302],"chemistry":[303],"mining":[306],"algorithms,":[307],"recently":[311],"gained":[312],"attention":[314],"relevance":[318]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":2}],"updated_date":"2026-05-21T09:19:25.381259","created_date":"2025-10-10T00:00:00"}
