{"id":"https://openalex.org/W4221141809","doi":"https://doi.org/10.1145/3563553","title":"Automatic Creation of High-bandwidth Memory Architectures from Domain-specific Languages: The Case of Computational Fluid Dynamics","display_name":"Automatic Creation of High-bandwidth Memory Architectures from Domain-specific Languages: The Case of Computational Fluid Dynamics","publication_year":2022,"publication_date":"2022-09-15","ids":{"openalex":"https://openalex.org/W4221141809","doi":"https://doi.org/10.1145/3563553"},"language":"en","primary_location":{"id":"doi:10.1145/3563553","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3563553","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3563553","source":{"id":"https://openalex.org/S112809824","display_name":"ACM Transactions on Reconfigurable Technology and Systems","issn_l":"1936-7406","issn":["1936-7406","1936-7414"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Reconfigurable Technology and Systems","raw_type":"journal-article"},"type":"preprint","indexed_in":["crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3563553","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5034465540","display_name":"Stephanie Soldavini","orcid":"https://orcid.org/0000-0001-7379-8007"},"institutions":[{"id":"https://openalex.org/I93860229","display_name":"Politecnico di Milano","ror":"https://ror.org/01nffqt88","country_code":"IT","type":"education","lineage":["https://openalex.org/I93860229"]}],"countries":["IT"],"is_corresponding":true,"raw_author_name":"Stephanie Soldavini","raw_affiliation_strings":["Politecnico di Milano, Milano, Italy"],"affiliations":[{"raw_affiliation_string":"Politecnico di Milano, Milano, Italy","institution_ids":["https://openalex.org/I93860229"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067091126","display_name":"Karl F. A. Friebel","orcid":"https://orcid.org/0000-0001-9534-3978"},"institutions":[{"id":"https://openalex.org/I78650965","display_name":"Technische Universit\u00e4t Dresden","ror":"https://ror.org/042aqky30","country_code":"DE","type":"education","lineage":["https://openalex.org/I78650965"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Karl Friebel","raw_affiliation_strings":["Technische Universit\u00e4t Dresden, Dresden, Germany"],"affiliations":[{"raw_affiliation_string":"Technische Universit\u00e4t Dresden, Dresden, Germany","institution_ids":["https://openalex.org/I78650965"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027068516","display_name":"Mattia Tibaldi","orcid":"https://orcid.org/0000-0003-1113-3987"},"institutions":[{"id":"https://openalex.org/I93860229","display_name":"Politecnico di Milano","ror":"https://ror.org/01nffqt88","country_code":"IT","type":"education","lineage":["https://openalex.org/I93860229"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Mattia Tibaldi","raw_affiliation_strings":["Politecnico di Milano, Milano, Italy"],"affiliations":[{"raw_affiliation_string":"Politecnico di Milano, Milano, Italy","institution_ids":["https://openalex.org/I93860229"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046466505","display_name":"Gerald Hempel","orcid":"https://orcid.org/0000-0002-4737-8612"},"institutions":[{"id":"https://openalex.org/I78650965","display_name":"Technische Universit\u00e4t Dresden","ror":"https://ror.org/042aqky30","country_code":"DE","type":"education","lineage":["https://openalex.org/I78650965"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Gerald Hempel","raw_affiliation_strings":["Technische Universit\u00e4t Dresden, Dresden, Germany"],"affiliations":[{"raw_affiliation_string":"Technische Universit\u00e4t Dresden, Dresden, Germany","institution_ids":["https://openalex.org/I78650965"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030115692","display_name":"Jer\u00f3nimo Castrill\u00f3n","orcid":"https://orcid.org/0000-0002-5007-445X"},"institutions":[{"id":"https://openalex.org/I78650965","display_name":"Technische Universit\u00e4t Dresden","ror":"https://ror.org/042aqky30","country_code":"DE","type":"education","lineage":["https://openalex.org/I78650965"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Jeronimo Castrillon","raw_affiliation_strings":["Technische Universit\u00e4t Dresden, Dresden, Germany"],"affiliations":[{"raw_affiliation_string":"Technische Universit\u00e4t Dresden, Dresden, Germany","institution_ids":["https://openalex.org/I78650965"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5072400487","display_name":"Christian Pilato","orcid":"https://orcid.org/0000-0001-9315-1788"},"institutions":[{"id":"https://openalex.org/I93860229","display_name":"Politecnico di Milano","ror":"https://ror.org/01nffqt88","country_code":"IT","type":"education","lineage":["https://openalex.org/I93860229"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Christian Pilato","raw_affiliation_strings":["Politecnico di Milano, Milano, Italy"],"affiliations":[{"raw_affiliation_string":"Politecnico di Milano, Milano, Italy","institution_ids":["https://openalex.org/I93860229"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5034465540"],"corresponding_institution_ids":["https://openalex.org/I93860229"],"apc_list":null,"apc_paid":null,"fwci":0.2318,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.46624434,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":"16","issue":"2","first_page":"1","last_page":"34"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9890999794006348,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13650","display_name":"Computational Physics and Python Applications","score":0.9707000255584717,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8633390069007874},{"id":"https://openalex.org/keywords/massively-parallel","display_name":"Massively parallel","score":0.7006754279136658},{"id":"https://openalex.org/keywords/field-programmable-gate-array","display_name":"Field-programmable gate array","score":0.6980941295623779},{"id":"https://openalex.org/keywords/compiler","display_name":"Compiler","score":0.6539207100868225},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.6083632111549377},{"id":"https://openalex.org/keywords/memory-bandwidth","display_name":"Memory bandwidth","score":0.5226204991340637},{"id":"https://openalex.org/keywords/domain-specific-language","display_name":"Domain-specific language","score":0.48964983224868774},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.4894055426120758},{"id":"https://openalex.org/keywords/design-flow","display_name":"Design flow","score":0.46477630734443665},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.35415881872177124}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8633390069007874},{"id":"https://openalex.org/C190475519","wikidata":"https://www.wikidata.org/wiki/Q544384","display_name":"Massively parallel","level":2,"score":0.7006754279136658},{"id":"https://openalex.org/C42935608","wikidata":"https://www.wikidata.org/wiki/Q190411","display_name":"Field-programmable gate array","level":2,"score":0.6980941295623779},{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.6539207100868225},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6083632111549377},{"id":"https://openalex.org/C188045654","wikidata":"https://www.wikidata.org/wiki/Q17148339","display_name":"Memory bandwidth","level":2,"score":0.5226204991340637},{"id":"https://openalex.org/C135257023","wikidata":"https://www.wikidata.org/wiki/Q691358","display_name":"Domain-specific language","level":2,"score":0.48964983224868774},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.4894055426120758},{"id":"https://openalex.org/C37135326","wikidata":"https://www.wikidata.org/wiki/Q931942","display_name":"Design flow","level":2,"score":0.46477630734443665},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.35415881872177124},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1145/3563553","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3563553","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3563553","source":{"id":"https://openalex.org/S112809824","display_name":"ACM Transactions on Reconfigurable Technology and Systems","issn_l":"1936-7406","issn":["1936-7406","1936-7414"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Reconfigurable Technology and Systems","raw_type":"journal-article"},{"id":"pmh:oai:re.public.polimi.it:11311/1220543","is_oa":true,"landing_page_url":"https://hdl.handle.net/11311/1220543","pdf_url":"https://re.public.polimi.it/bitstream/11311/1220543/1/_TRETS_final__CFD4FPGA%20%281%29.pdf","source":{"id":"https://openalex.org/S4306400312","display_name":"Virtual Community of Pathological Anatomy (University of Castilla La Mancha)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I79189158","host_organization_name":"University of Castilla-La Mancha","host_organization_lineage":["https://openalex.org/I79189158"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/article"},{"id":"doi:10.48550/arxiv.2203.10850","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2203.10850","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article-journal"}],"best_oa_location":{"id":"doi:10.1145/3563553","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3563553","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3563553","source":{"id":"https://openalex.org/S112809824","display_name":"ACM Transactions on Reconfigurable Technology and Systems","issn_l":"1936-7406","issn":["1936-7406","1936-7414"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Reconfigurable Technology and Systems","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.7900000214576721,"display_name":"Affordable and clean energy","id":"https://metadata.un.org/sdg/7"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4221141809.pdf","grobid_xml":"https://content.openalex.org/works/W4221141809.grobid-xml"},"referenced_works_count":54,"referenced_works":["https://openalex.org/W347636100","https://openalex.org/W1558370006","https://openalex.org/W1621885647","https://openalex.org/W2020071510","https://openalex.org/W2055312318","https://openalex.org/W2086364561","https://openalex.org/W2107076945","https://openalex.org/W2169719116","https://openalex.org/W2267881438","https://openalex.org/W2343695530","https://openalex.org/W2481351383","https://openalex.org/W2492686975","https://openalex.org/W2522116871","https://openalex.org/W2594169960","https://openalex.org/W2622148586","https://openalex.org/W2626616508","https://openalex.org/W2786320458","https://openalex.org/W2798482398","https://openalex.org/W2898373684","https://openalex.org/W2920536219","https://openalex.org/W2955391308","https://openalex.org/W2963610942","https://openalex.org/W2967088612","https://openalex.org/W3036715599","https://openalex.org/W3090815597","https://openalex.org/W3093557412","https://openalex.org/W3093757369","https://openalex.org/W3094071641","https://openalex.org/W3111765144","https://openalex.org/W3112412839","https://openalex.org/W3121665290","https://openalex.org/W3122998669","https://openalex.org/W3133215150","https://openalex.org/W3133347161","https://openalex.org/W3158338328","https://openalex.org/W3162360055","https://openalex.org/W3167833281","https://openalex.org/W3170921841","https://openalex.org/W3173856255","https://openalex.org/W3186292924","https://openalex.org/W3196320218","https://openalex.org/W3200826900","https://openalex.org/W3206299349","https://openalex.org/W3206387782","https://openalex.org/W3207198460","https://openalex.org/W3207488955","https://openalex.org/W3212867926","https://openalex.org/W4226443139","https://openalex.org/W4234889424","https://openalex.org/W4246166885","https://openalex.org/W4288072573","https://openalex.org/W6774508117","https://openalex.org/W6793059938","https://openalex.org/W6884967357"],"related_works":["https://openalex.org/W320786","https://openalex.org/W1078554","https://openalex.org/W386281","https://openalex.org/W5144792","https://openalex.org/W4102181","https://openalex.org/W20079516","https://openalex.org/W5349046","https://openalex.org/W16319575","https://openalex.org/W10163365","https://openalex.org/W6022940"],"abstract_inverted_index":{"Numerical":[0],"simulations":[1],"can":[2,28,91],"help":[3],"solve":[4],"complex":[5],"problems.":[6],"Most":[7],"of":[8,121,165],"these":[9],"algorithms":[10],"are":[11,36,61],"massively":[12,84],"parallel":[13,85,141],"and":[14,43,50,97,124,143,176],"thus":[15],"good":[16],"candidates":[17],"for":[18,46,79],"FPGA":[19,26,186],"acceleration":[20],"thanks":[21],"to":[22,82,95,137,169,190],"spatial":[23],"parallelism.":[24],"Modern":[25],"devices":[27],"leverage":[29],"high-bandwidth":[30],"memory":[31,44,146],"technologies,":[32],"but":[33],"when":[34,179],"applications":[35,162],"memory-bound":[37],"designers":[38],"must":[39],"craft":[40],"advanced":[41],"communication":[42],"architectures":[45],"efficient":[47,194],"data":[48,150],"movement":[49],"on-chip":[51],"storage.":[52],"This":[53],"development":[54],"process":[55],"requires":[56],"hardware":[57,102,134],"design":[58],"skills":[59],"that":[60,148],"uncommon":[62],"in":[63],"domain-specific":[64,77],"experts.":[65],"In":[66],"this":[67,93],"article,":[68],"we":[69],"propose":[70],"an":[71,132],"automated":[72],"tool":[73],"flow":[74,94,115,136],"from":[75,117],"a":[76,111,126,144,181],"language":[78],"tensor":[80,122],"expressions":[81],"generate":[83,138],"accelerators":[86,142],"on":[87],"high-bandwidth-memory-equipped":[88],"FPGAs.":[89],"Designers":[90],"use":[92,105],"integrate":[96],"evaluate":[98],"various":[99],"compiler":[100,130],"or":[101],"optimizations.":[103],"We":[104,160],"computational":[106],"fluid":[107],"dynamics":[108],"(CFD)":[109],"as":[110],"paradigmatic":[112],"example.":[113],"Our":[114,185],"starts":[116],"the":[118,156],"high-level":[119],"specification":[120],"operations":[123],"combines":[125],"multi-level":[127],"intermediate":[128],"representation\u2013based":[129],"with":[131,140,163,172],"in-house":[133],"generation":[135],"systems":[139],"specialized":[145],"architecture":[147],"moves":[149],"efficiently,":[151],"aiming":[152],"at":[153],"fully":[154],"exploiting":[155],"available":[157],"CPU-FPGA":[158],"bandwidth.":[159],"simulated":[161],"millions":[164],"elements,":[166],"achieving":[167],"up":[168,189],"103":[170],"GFLOPS":[171],"one":[173],"compute":[174],"unit":[175],"custom":[177],"precision":[178],"targeting":[180],"Xilinx":[182],"Alveo":[183],"U280.":[184],"implementation":[187],"is":[188],"25\u00d7":[191],"more":[192],"energy":[193],"than":[195],"expert-crafted":[196],"Intel":[197],"CPU":[198],"implementations.":[199]},"counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2022-04-03T00:00:00"}
