{"id":"https://openalex.org/W2018348175","doi":"https://doi.org/10.1145/2086696.2086711","title":"Improving performance of nested loops on reconfigurable array processors","display_name":"Improving performance of nested loops on reconfigurable array processors","publication_year":2012,"publication_date":"2012-01-01","ids":{"openalex":"https://openalex.org/W2018348175","doi":"https://doi.org/10.1145/2086696.2086711","mag":"2018348175"},"language":"en","primary_location":{"id":"doi:10.1145/2086696.2086711","is_oa":true,"landing_page_url":"https://doi.org/10.1145/2086696.2086711","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/2086696.2086711","source":{"id":"https://openalex.org/S26056741","display_name":"ACM Transactions on Architecture and Code Optimization","issn_l":"1544-3566","issn":["1544-3566","1544-3973"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Architecture and Code Optimization","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://dl.acm.org/doi/pdf/10.1145/2086696.2086711","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101845743","display_name":"Yong\u2013Joo Kim","orcid":"https://orcid.org/0000-0002-1212-9018"},"institutions":[{"id":"https://openalex.org/I139264467","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542","country_code":"KR","type":"education","lineage":["https://openalex.org/I139264467"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Yongjoo Kim","raw_affiliation_strings":["Seoul National University, Korea","Seoul National University (Korea)"],"affiliations":[{"raw_affiliation_string":"Seoul National University, Korea","institution_ids":["https://openalex.org/I139264467"]},{"raw_affiliation_string":"Seoul National University (Korea)","institution_ids":["https://openalex.org/I139264467"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100780257","display_name":"Jongeun Lee","orcid":"https://orcid.org/0000-0003-1523-2974"},"institutions":[{"id":"https://openalex.org/I48566637","display_name":"Ulsan National Institute of Science and Technology","ror":"https://ror.org/017cjz748","country_code":"KR","type":"education","lineage":["https://openalex.org/I48566637"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Jongeun Lee","raw_affiliation_strings":["UNIST, South Korea","UNIST (South Korea)"],"affiliations":[{"raw_affiliation_string":"UNIST, South Korea","institution_ids":["https://openalex.org/I48566637"]},{"raw_affiliation_string":"UNIST (South Korea)","institution_ids":["https://openalex.org/I48566637"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Toan X. Mai","orcid":null},"institutions":[{"id":"https://openalex.org/I48566637","display_name":"Ulsan National Institute of Science and Technology","ror":"https://ror.org/017cjz748","country_code":"KR","type":"education","lineage":["https://openalex.org/I48566637"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Toan X. Mai","raw_affiliation_strings":["UNIST, South Korea","UNIST (South Korea)"],"affiliations":[{"raw_affiliation_string":"UNIST, South Korea","institution_ids":["https://openalex.org/I48566637"]},{"raw_affiliation_string":"UNIST (South Korea)","institution_ids":["https://openalex.org/I48566637"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5082524666","display_name":"Yunheung Paek","orcid":"https://orcid.org/0000-0002-6412-2926"},"institutions":[{"id":"https://openalex.org/I139264467","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542","country_code":"KR","type":"education","lineage":["https://openalex.org/I139264467"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Yunheung Paek","raw_affiliation_strings":["Seoul National University, Korea","Seoul National University (Korea)"],"affiliations":[{"raw_affiliation_string":"Seoul National University, Korea","institution_ids":["https://openalex.org/I139264467"]},{"raw_affiliation_string":"Seoul National University (Korea)","institution_ids":["https://openalex.org/I139264467"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5101845743"],"corresponding_institution_ids":["https://openalex.org/I139264467"],"apc_list":null,"apc_paid":null,"fwci":5.5626,"has_fulltext":true,"cited_by_count":32,"citation_normalized_percentile":{"value":0.96092619,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":"8","issue":"4","first_page":"1","last_page":"23"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10904","display_name":"Embedded Systems Design Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10904","display_name":"Embedded Systems Design Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10829","display_name":"Interconnection Networks and Systems","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8866515159606934},{"id":"https://openalex.org/keywords/nested-loop-join","display_name":"Nested loop join","score":0.8365973234176636},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.7482367753982544},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.7414429783821106},{"id":"https://openalex.org/keywords/kernel","display_name":"Kernel (algebra)","score":0.6308357119560242},{"id":"https://openalex.org/keywords/coprocessor","display_name":"Coprocessor","score":0.5782053470611572},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.5634081959724426},{"id":"https://openalex.org/keywords/software-pipelining","display_name":"Software pipelining","score":0.5620245933532715},{"id":"https://openalex.org/keywords/loop-optimization","display_name":"Loop optimization","score":0.546122670173645},{"id":"https://openalex.org/keywords/compiler","display_name":"Compiler","score":0.516344428062439},{"id":"https://openalex.org/keywords/loop-fission","display_name":"Loop fission","score":0.5079749226570129},{"id":"https://openalex.org/keywords/loop","display_name":"Loop (graph theory)","score":0.42888712882995605},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.3294353485107422},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.32640498876571655},{"id":"https://openalex.org/keywords/optimizing-compiler","display_name":"Optimizing compiler","score":0.31533083319664},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.09686863422393799}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8866515159606934},{"id":"https://openalex.org/C1306188","wikidata":"https://www.wikidata.org/wiki/Q4060687","display_name":"Nested loop join","level":2,"score":0.8365973234176636},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.7482367753982544},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.7414429783821106},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.6308357119560242},{"id":"https://openalex.org/C86111242","wikidata":"https://www.wikidata.org/wiki/Q859595","display_name":"Coprocessor","level":2,"score":0.5782053470611572},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.5634081959724426},{"id":"https://openalex.org/C188854837","wikidata":"https://www.wikidata.org/wiki/Q268469","display_name":"Software pipelining","level":3,"score":0.5620245933532715},{"id":"https://openalex.org/C29331672","wikidata":"https://www.wikidata.org/wiki/Q3354468","display_name":"Loop optimization","level":4,"score":0.546122670173645},{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.516344428062439},{"id":"https://openalex.org/C134718785","wikidata":"https://www.wikidata.org/wiki/Q6675821","display_name":"Loop fission","level":3,"score":0.5079749226570129},{"id":"https://openalex.org/C184670325","wikidata":"https://www.wikidata.org/wiki/Q512604","display_name":"Loop (graph theory)","level":2,"score":0.42888712882995605},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.3294353485107422},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.32640498876571655},{"id":"https://openalex.org/C190902152","wikidata":"https://www.wikidata.org/wiki/Q1325106","display_name":"Optimizing compiler","level":3,"score":0.31533083319664},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.09686863422393799},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/2086696.2086711","is_oa":true,"landing_page_url":"https://doi.org/10.1145/2086696.2086711","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/2086696.2086711","source":{"id":"https://openalex.org/S26056741","display_name":"ACM Transactions on Architecture and Code Optimization","issn_l":"1544-3566","issn":["1544-3566","1544-3973"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Architecture and Code Optimization","raw_type":"journal-article"},{"id":"pmh:oai:scholarworks.unist.ac.kr:201301/3814","is_oa":false,"landing_page_url":"http://www.scopus.com/inward/record.url?partnerID=HzOxMe3b&scp=84863291580","pdf_url":null,"source":{"id":"https://openalex.org/S4306401118","display_name":"Scholarworks@UNIST (Ulsan National Institute of Science and Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I48566637","host_organization_name":"Ulsan National Institute of Science and Technology","host_organization_lineage":["https://openalex.org/I48566637"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"ARTICLE"}],"best_oa_location":{"id":"doi:10.1145/2086696.2086711","is_oa":true,"landing_page_url":"https://doi.org/10.1145/2086696.2086711","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/2086696.2086711","source":{"id":"https://openalex.org/S26056741","display_name":"ACM Transactions on Architecture and Code Optimization","issn_l":"1544-3566","issn":["1544-3566","1544-3973"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Architecture and Code Optimization","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Affordable and clean energy","id":"https://metadata.un.org/sdg/7","score":0.5099999904632568}],"awards":[{"id":"https://openalex.org/G1094368579","display_name":null,"funder_award_id":"2011-0018609","funder_id":"https://openalex.org/F4320322349","funder_display_name":"Ministry of Education, Science and Technology"},{"id":"https://openalex.org/G3034753964","display_name":null,"funder_award_id":"grant","funder_id":"https://openalex.org/F4320320671","funder_display_name":"National Research Foundation"},{"id":"https://openalex.org/G342704958","display_name":null,"funder_award_id":"funded","funder_id":"https://openalex.org/F4320322120","funder_display_name":"National Research Foundation of Korea"},{"id":"https://openalex.org/G3827516242","display_name":null,"funder_award_id":"2011-001","funder_id":"https://openalex.org/F4320322120","funder_display_name":"National Research Foundation of Korea"},{"id":"https://openalex.org/G4468227657","display_name":null,"funder_award_id":"2011-0000975","funder_id":"https://openalex.org/F4320322349","funder_display_name":"Ministry of Education, Science and Technology"},{"id":"https://openalex.org/G5069992840","display_name":null,"funder_award_id":"2010-0011534","funder_id":"https://openalex.org/F4320322349","funder_display_name":"Ministry of Education, Science and Technology"},{"id":"https://openalex.org/G626505518","display_name":null,"funder_award_id":"No. 201","funder_id":"https://openalex.org/F4320322120","funder_display_name":"National Research Foundation of Korea"}],"funders":[{"id":"https://openalex.org/F4320320671","display_name":"National Research Foundation","ror":"https://ror.org/05s0g1g46"},{"id":"https://openalex.org/F4320322120","display_name":"National Research Foundation of Korea","ror":"https://ror.org/013aysd81"},{"id":"https://openalex.org/F4320322202","display_name":"IC Design Education Center","ror":"https://ror.org/005v57z85"},{"id":"https://openalex.org/F4320322348","display_name":"Korea Science and Engineering Foundation","ror":"https://ror.org/013aysd81"},{"id":"https://openalex.org/F4320322349","display_name":"Ministry of Education, Science and Technology","ror":"https://ror.org/01p262204"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2018348175.pdf","grobid_xml":"https://content.openalex.org/works/W2018348175.grobid-xml"},"referenced_works_count":25,"referenced_works":["https://openalex.org/W136905915","https://openalex.org/W286049110","https://openalex.org/W1485882819","https://openalex.org/W1502361557","https://openalex.org/W1511601046","https://openalex.org/W1564397886","https://openalex.org/W2008165887","https://openalex.org/W2013505463","https://openalex.org/W2020831346","https://openalex.org/W2025787141","https://openalex.org/W2042766074","https://openalex.org/W2095950905","https://openalex.org/W2102073017","https://openalex.org/W2102416334","https://openalex.org/W2108682772","https://openalex.org/W2112495948","https://openalex.org/W2114067856","https://openalex.org/W2116304229","https://openalex.org/W2122171990","https://openalex.org/W2123412205","https://openalex.org/W2134950466","https://openalex.org/W2135050419","https://openalex.org/W2159108969","https://openalex.org/W2160401437","https://openalex.org/W2215244614"],"related_works":["https://openalex.org/W2110618453","https://openalex.org/W4241609064","https://openalex.org/W1993227264","https://openalex.org/W2150334230","https://openalex.org/W217231416","https://openalex.org/W2080027614","https://openalex.org/W1511601046","https://openalex.org/W2135234700","https://openalex.org/W1564397886","https://openalex.org/W2135288949"],"abstract_inverted_index":{"Pipelining":[0],"algorithms":[1],"are":[2],"typically":[3],"concerned":[4],"with":[5],"improving":[6],"only":[7,20,150,162],"the":[8,12,29,54,58,82,104,109,133,145,151,155],"steady-state":[9],"performance,":[10],"or":[11],"kernel":[13,30],"time.":[14,31],"The":[15],"pipeline":[16,46],"setup":[17,47],"time":[18],"happens":[19],"once":[21],"and":[22,61,95,122],"therefore":[23],"can":[24,48,62,130,169],"be":[25],"negligible":[26],"compared":[27,143],"to":[28,42,53,102,140,144],"However,":[32],"for":[33,93],"Coarse-Grained":[34],"Reconfigurable":[35],"Architectures":[36],"(CGRAs)":[37],"used":[38],"as":[39],"a":[40,43,74,97,163],"coprocessor":[41],"main":[44],"processor,":[45],"take":[49],"much":[50],"longer":[51],"due":[52],"communication":[55],"delay":[56],"between":[57],"two":[59],"processors,":[60],"become":[63],"significant":[64],"if":[65],"it":[66],"is":[67],"repeated":[68],"in":[69,171],"an":[70],"outer":[71],"loop":[72,75],"of":[73,84,111,135,148,166],"nest.":[76],"In":[77],"this":[78],"paper":[79],"we":[80],"evaluate":[81],"overhead":[83],"such":[85],"non-kernel":[86],"execution":[87],"times":[88,142],"when":[89],"mapping":[90],"nested":[91,136],"loops":[92,119,137],"CGRAs,":[94],"propose":[96],"novel":[98],"architecture-compiler":[99],"cooperative":[100],"scheme":[101],"reduce":[103],"overhead,":[105],"while":[106],"also":[107],"minimizing":[108],"number":[110,165],"extra":[112],"configurations":[113,167],"required.":[114],"Our":[115],"experimental":[116],"results":[117],"using":[118],"from":[120],"multimedia":[121],"scientific":[123],"domains":[124],"demonstrate":[125],"that":[126,168],"our":[127,159],"proposed":[128],"techniques":[129,160],"greatly":[131],"increase":[132],"performance":[134],"by":[138,158],"up":[139],"2.87":[141],"conventional":[146],"approach":[147],"accelerating":[149],"innermost":[152],"loops.":[153],"Moreover,":[154],"mappings":[156],"generated":[157],"require":[161],"modest":[164],"fit":[170],"recent":[172],"reconfigurable":[173],"architectures.":[174]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":2},{"year":2016,"cited_by_count":5},{"year":2015,"cited_by_count":6},{"year":2014,"cited_by_count":4},{"year":2013,"cited_by_count":7},{"year":2012,"cited_by_count":2}],"updated_date":"2026-04-16T08:26:57.006410","created_date":"2025-10-10T00:00:00"}
