{"id":"https://openalex.org/W2792647449","doi":"https://doi.org/10.1145/3174243.3174251","title":"Graph-Theoretically Optimal Memory Banking for Stencil-Based Computing Kernels","display_name":"Graph-Theoretically Optimal Memory Banking for Stencil-Based Computing Kernels","publication_year":2018,"publication_date":"2018-02-15","ids":{"openalex":"https://openalex.org/W2792647449","doi":"https://doi.org/10.1145/3174243.3174251","mag":"2792647449"},"language":"en","primary_location":{"id":"doi:10.1145/3174243.3174251","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3174243.3174251","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2018 ACM/SIGDA International Symposium on Field-Programmable Gate Arrays","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://stars.library.ucf.edu/scopus2015/9483","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5013235794","display_name":"J. P. Escobedo","orcid":"https://orcid.org/0000-0003-2413-7119"},"institutions":[{"id":"https://openalex.org/I106165777","display_name":"University of Central Florida","ror":"https://ror.org/036nfer12","country_code":"US","type":"education","lineage":["https://openalex.org/I106165777"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Juan Escobedo","raw_affiliation_strings":["University of Central Florida, Oviedo, FL, USA"],"affiliations":[{"raw_affiliation_string":"University of Central Florida, Oviedo, FL, USA","institution_ids":["https://openalex.org/I106165777"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5060908808","display_name":"Mingjie Lin","orcid":"https://orcid.org/0000-0002-3225-4406"},"institutions":[{"id":"https://openalex.org/I106165777","display_name":"University of Central Florida","ror":"https://ror.org/036nfer12","country_code":"US","type":"education","lineage":["https://openalex.org/I106165777"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mingjie Lin","raw_affiliation_strings":["University of Central Florida, Oviedo, FL, USA"],"affiliations":[{"raw_affiliation_string":"University of Central Florida, Oviedo, FL, USA","institution_ids":["https://openalex.org/I106165777"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5013235794"],"corresponding_institution_ids":["https://openalex.org/I106165777"],"apc_list":null,"apc_paid":null,"fwci":3.421,"has_fulltext":false,"cited_by_count":21,"citation_normalized_percentile":{"value":0.92806508,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"199","last_page":"208"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10829","display_name":"Interconnection Networks and Systems","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10904","display_name":"Embedded Systems Design Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/stencil","display_name":"Stencil","score":0.8486738801002502},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8185083866119385},{"id":"https://openalex.org/keywords/rewriting","display_name":"Rewriting","score":0.613906741142273},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.596264660358429},{"id":"https://openalex.org/keywords/kernel","display_name":"Kernel (algebra)","score":0.5057311058044434},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.41755998134613037},{"id":"https://openalex.org/keywords/scheme","display_name":"Scheme (mathematics)","score":0.41105917096138},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.3503206670284271},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.101003497838974},{"id":"https://openalex.org/keywords/computational-science","display_name":"Computational science","score":0.10019570589065552},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.09292802214622498}],"concepts":[{"id":"https://openalex.org/C76752949","wikidata":"https://www.wikidata.org/wiki/Q7607499","display_name":"Stencil","level":2,"score":0.8486738801002502},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8185083866119385},{"id":"https://openalex.org/C154690210","wikidata":"https://www.wikidata.org/wiki/Q1668499","display_name":"Rewriting","level":2,"score":0.613906741142273},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.596264660358429},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.5057311058044434},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.41755998134613037},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.41105917096138},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3503206670284271},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.101003497838974},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.10019570589065552},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.09292802214622498},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3174243.3174251","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3174243.3174251","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2018 ACM/SIGDA International Symposium on Field-Programmable Gate Arrays","raw_type":"proceedings-article"},{"id":"pmh:oai:stars.library.ucf.edu:scopus2015-10482","is_oa":true,"landing_page_url":"https://stars.library.ucf.edu/scopus2015/9483","pdf_url":null,"source":{"id":"https://openalex.org/S4210172555","display_name":"Journal of International Crisis and Risk Communication Research","issn_l":"2576-0017","issn":["2576-0017","2576-0025"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Scopus Export 2015-2019","raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:stars.library.ucf.edu:scopus2015-10482","is_oa":true,"landing_page_url":"https://stars.library.ucf.edu/scopus2015/9483","pdf_url":null,"source":{"id":"https://openalex.org/S4210172555","display_name":"Journal of International Crisis and Risk Communication Research","issn_l":"2576-0017","issn":["2576-0017","2576-0025"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Scopus Export 2015-2019","raw_type":"text"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/9","score":0.47999998927116394,"display_name":"Industry, innovation and infrastructure"}],"awards":[{"id":"https://openalex.org/G3740958974","display_name":null,"funder_award_id":"1553056","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G5164495282","display_name":null,"funder_award_id":"1319884","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":13,"referenced_works":["https://openalex.org/W1982506822","https://openalex.org/W1989763262","https://openalex.org/W2000031176","https://openalex.org/W2019259761","https://openalex.org/W2039974221","https://openalex.org/W2049151402","https://openalex.org/W2058625399","https://openalex.org/W2098925700","https://openalex.org/W2116015397","https://openalex.org/W2154755153","https://openalex.org/W2165689945","https://openalex.org/W2584219348","https://openalex.org/W2588368824"],"related_works":["https://openalex.org/W2039378765","https://openalex.org/W2003798513","https://openalex.org/W2315600872","https://openalex.org/W2151764765","https://openalex.org/W2890431355","https://openalex.org/W4376875029","https://openalex.org/W3149084271","https://openalex.org/W4247008888","https://openalex.org/W2150319905","https://openalex.org/W2962978274"],"abstract_inverted_index":{"High-Level":[0],"Synthesis":[1],"(HLS)":[2],"has":[3,43,58],"advanced":[4],"significantly":[5,175],"in":[6,27,144],"compiling":[7],"high-level":[8],"\"soft\u00bb\u00bb":[9],"programs":[10],"into":[11],"efficient":[12],"register-transfer":[13],"level":[14],"(RTL)":[15],"\"hard\u00bb\u00bb":[16],"specifications.":[17],"However,":[18,67],"manually":[19],"rewriting":[20],"C-like":[21],"code":[22],"is":[23],"still":[24],"often":[25],"required":[26,94],"order":[28],"to":[29,72,130],"effectively":[30],"optimize":[31],"the":[32,89,121,153,165],"access":[33,64,171],"performance":[34,65],"of":[35,91,167],"synthesized":[36],"memory":[37,51,56,84,92,103,133,155,170],"subsystems.":[38],"As":[39],"such,":[40],"extensive":[41],"research":[42],"been":[44,59],"performed":[45],"on":[46],"developing":[47],"and":[48],"implementing":[49],"automated":[50],"optimization":[52],"techniques,":[53],"among":[54],"which":[55,174],"banking":[57,85,104,123,134],"a":[60,76],"key":[61,69],"technique":[62],"for":[63,95,136,158],"improvement.":[66],"several":[68],"questions":[70],"remain":[71],"be":[73],"answered:":[74],"given":[75,160],"stencil-based":[77,118,138],"computing":[78,139],"kernel,":[79],"what":[80],"constitutes":[81],"an":[82,101,109],"optimal":[83,102,122],"scheme":[86,105],"that":[87],"minimizes":[88],"number":[90],"banks":[93],"conflict-free":[96],"accesses?":[97],"Furthermore,":[98],"if":[99],"such":[100],"exists,":[106],"how":[107],"can":[108],"FPGA":[110],"designer":[111],"automatically":[112],"determine":[113],"it?":[114],"Finally,":[115],"does":[116],"any":[117,159],"kernel":[119],"have":[120],"scheme?":[124],"In":[125],"this":[126],"paper":[127],"we":[128],"attempt":[129],"optimally":[131],"solve":[132],"problem":[135],"synthesizing":[137],"kernels":[140],"with":[141],"well-known":[142],"theorems":[143],"graph":[145],"theory.":[146],"Our":[147],"graph-based":[148],"methodology":[149],"not":[150],"only":[151],"computes":[152],"minimum":[154],"partition":[156],"factor":[157],"stencil,":[161],"but":[162],"also":[163],"exploits":[164],"repeatability":[166],"coloring":[168],"entire":[169],"conflict":[172],"graph,":[173],"improves":[176],"hardware":[177],"efficiency.":[178]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":4},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":6},{"year":2018,"cited_by_count":1}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
