{"id":"https://openalex.org/W2006295906","doi":"https://doi.org/10.1109/estimedia.2014.6962353","title":"Optimized memory access support for data layout conversion on heterogeneous multi-core systems","display_name":"Optimized memory access support for data layout conversion on heterogeneous multi-core systems","publication_year":2014,"publication_date":"2014-10-01","ids":{"openalex":"https://openalex.org/W2006295906","doi":"https://doi.org/10.1109/estimedia.2014.6962353","mag":"2006295906"},"language":"en","primary_location":{"id":"doi:10.1109/estimedia.2014.6962353","is_oa":false,"landing_page_url":"https://doi.org/10.1109/estimedia.2014.6962353","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2014 IEEE 12th Symposium on Embedded Systems for Real-time Multimedia (ESTIMedia)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101046409","display_name":"Chia-Chen Hsu","orcid":null},"institutions":[{"id":"https://openalex.org/I25846049","display_name":"National Tsing Hua University","ror":"https://ror.org/00zdnkx70","country_code":"TW","type":"education","lineage":["https://openalex.org/I25846049"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Chia-Chen Hsu","raw_affiliation_strings":["Department of Computer Science, National Tsing Hua University, Taiwan","Department of Computer Science, National Tsing Hua University, , Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science, National Tsing Hua University, Taiwan","institution_ids":["https://openalex.org/I25846049"]},{"raw_affiliation_string":"Department of Computer Science, National Tsing Hua University, , Taiwan","institution_ids":["https://openalex.org/I25846049"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041275339","display_name":"Cheng-Yen Lin","orcid":null},"institutions":[{"id":"https://openalex.org/I25846049","display_name":"National Tsing Hua University","ror":"https://ror.org/00zdnkx70","country_code":"TW","type":"education","lineage":["https://openalex.org/I25846049"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Cheng-Yen Lin","raw_affiliation_strings":["Department of Computer Science, National Tsing Hua University, Taiwan","Department of Computer Science, National Tsing Hua University, , Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science, National Tsing Hua University, Taiwan","institution_ids":["https://openalex.org/I25846049"]},{"raw_affiliation_string":"Department of Computer Science, National Tsing Hua University, , Taiwan","institution_ids":["https://openalex.org/I25846049"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021283402","display_name":"Shin Kai Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I148366613","display_name":"National Yang Ming Chiao Tung University","ror":"https://ror.org/00se2k293","country_code":"TW","type":"education","lineage":["https://openalex.org/I148366613"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Shin Kai Chen","raw_affiliation_strings":["Department of Electronics Engineering, National Chiao Tung University, Taiwan","Dept. of Electronics Engineering, National Chiao\u2010Tung University, Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Electronics Engineering, National Chiao Tung University, Taiwan","institution_ids":["https://openalex.org/I148366613"]},{"raw_affiliation_string":"Dept. of Electronics Engineering, National Chiao\u2010Tung University, Taiwan","institution_ids":["https://openalex.org/I148366613"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100642145","display_name":"Chih\u2010Wei Liu","orcid":"https://orcid.org/0000-0002-3006-9856"},"institutions":[{"id":"https://openalex.org/I148366613","display_name":"National Yang Ming Chiao Tung University","ror":"https://ror.org/00se2k293","country_code":"TW","type":"education","lineage":["https://openalex.org/I148366613"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Chih-Wei Liu","raw_affiliation_strings":["Department of Electronics Engineering, National Chiao Tung University, Taiwan","Dept. of Electronics Engineering, National Chiao\u2010Tung University, Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Electronics Engineering, National Chiao Tung University, Taiwan","institution_ids":["https://openalex.org/I148366613"]},{"raw_affiliation_string":"Dept. of Electronics Engineering, National Chiao\u2010Tung University, Taiwan","institution_ids":["https://openalex.org/I148366613"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5038803698","display_name":"Jenq\u2010Kuen Lee","orcid":"https://orcid.org/0000-0001-9919-6258"},"institutions":[{"id":"https://openalex.org/I25846049","display_name":"National Tsing Hua University","ror":"https://ror.org/00zdnkx70","country_code":"TW","type":"education","lineage":["https://openalex.org/I25846049"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Jenq-Kuen Lee","raw_affiliation_strings":["Department of Computer Science, National Tsing Hua University, Taiwan","Department of Computer Science, National Tsing Hua University, , Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science, National Tsing Hua University, Taiwan","institution_ids":["https://openalex.org/I25846049"]},{"raw_affiliation_string":"Department of Computer Science, National Tsing Hua University, , Taiwan","institution_ids":["https://openalex.org/I25846049"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.6302,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.68604552,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":"10","issue":null,"first_page":"128","last_page":"137"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8633551597595215},{"id":"https://openalex.org/keywords/cuda","display_name":"CUDA","score":0.5892122983932495},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.5360617637634277},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.5027635097503662},{"id":"https://openalex.org/keywords/multi-core-processor","display_name":"Multi-core processor","score":0.44122952222824097},{"id":"https://openalex.org/keywords/general-purpose-computing-on-graphics-processing-units","display_name":"General-purpose computing on graphics processing units","score":0.4214567244052887},{"id":"https://openalex.org/keywords/sparse-matrix","display_name":"Sparse matrix","score":0.41948607563972473},{"id":"https://openalex.org/keywords/data-access","display_name":"Data access","score":0.41250520944595337},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.38101038336753845},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.3385053873062134},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.3293871283531189},{"id":"https://openalex.org/keywords/graphics","display_name":"Graphics","score":0.13053244352340698},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.12433061003684998}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8633551597595215},{"id":"https://openalex.org/C2778119891","wikidata":"https://www.wikidata.org/wiki/Q477690","display_name":"CUDA","level":2,"score":0.5892122983932495},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.5360617637634277},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.5027635097503662},{"id":"https://openalex.org/C78766204","wikidata":"https://www.wikidata.org/wiki/Q555032","display_name":"Multi-core processor","level":2,"score":0.44122952222824097},{"id":"https://openalex.org/C50630238","wikidata":"https://www.wikidata.org/wiki/Q971505","display_name":"General-purpose computing on graphics processing units","level":3,"score":0.4214567244052887},{"id":"https://openalex.org/C56372850","wikidata":"https://www.wikidata.org/wiki/Q1050404","display_name":"Sparse matrix","level":3,"score":0.41948607563972473},{"id":"https://openalex.org/C47487241","wikidata":"https://www.wikidata.org/wiki/Q5227230","display_name":"Data access","level":2,"score":0.41250520944595337},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.38101038336753845},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.3385053873062134},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.3293871283531189},{"id":"https://openalex.org/C21442007","wikidata":"https://www.wikidata.org/wiki/Q1027879","display_name":"Graphics","level":2,"score":0.13053244352340698},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.12433061003684998},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/estimedia.2014.6962353","is_oa":false,"landing_page_url":"https://doi.org/10.1109/estimedia.2014.6962353","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2014 IEEE 12th Symposium on Embedded Systems for Real-time Multimedia (ESTIMedia)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":24,"referenced_works":["https://openalex.org/W182691100","https://openalex.org/W1588915715","https://openalex.org/W1986453598","https://openalex.org/W2016352575","https://openalex.org/W2020322423","https://openalex.org/W2044203422","https://openalex.org/W2061341864","https://openalex.org/W2080592089","https://openalex.org/W2083056254","https://openalex.org/W2099680095","https://openalex.org/W2105937753","https://openalex.org/W2128539477","https://openalex.org/W2128853364","https://openalex.org/W2147193503","https://openalex.org/W2153667821","https://openalex.org/W2153882937","https://openalex.org/W2167334577","https://openalex.org/W2518567779","https://openalex.org/W3097096317","https://openalex.org/W3143589697","https://openalex.org/W4205317033","https://openalex.org/W4248754567","https://openalex.org/W6674995244","https://openalex.org/W7065096706"],"related_works":["https://openalex.org/W1963859303","https://openalex.org/W2364044215","https://openalex.org/W2389600408","https://openalex.org/W240129890","https://openalex.org/W3048701459","https://openalex.org/W2149078538","https://openalex.org/W2080146221","https://openalex.org/W2370314112","https://openalex.org/W1912958759","https://openalex.org/W2792081825"],"abstract_inverted_index":{"Heterogeneous":[0],"multi-core":[1,140],"systems":[2,141],"that":[3],"contain":[4],"multiple":[5],"CPUs":[6],"and":[7,41,52,108,146,166,170,190,195],"GPUs":[8],"are":[9,14,174],"gaining":[10],"momentum,":[11],"as":[12,50,99],"they":[13],"providing":[15],"different":[16,84],"computation":[17,36],"power":[18,37],"to":[19,32,66,71,93,112,161,176,204,210],"meet":[20],"the":[21,35,45,56,63,67,72,90,95,133,185],"performance":[22],"demand":[23],"of":[24,74,135,187],"modern":[25],"applications.":[26],"On":[27],"such":[28,49,78,98,119],"systems,":[29],"developers":[30,59],"try":[31],"fully":[33],"utilize":[34],"both":[38],"for":[39,102,106,115,138],"CPU":[40,194],"GPU":[42],"by":[43],"using":[44],"emerging":[46],"programming":[47],"models":[48],"CUDA":[51],"OpenCL.":[53],"To":[54],"achieve":[55],"maximal":[57],"performance,":[58],"must":[60],"carefully":[61],"offload":[62],"appropriate":[64],"workload":[65],"compute":[68],"devices":[69],"according":[70],"characteristics":[73],"target":[75,96],"architecture.":[76],"Under":[77],"scenario,":[79],"seamlessly":[80],"data":[81,91,136,188,215],"motion":[82],"between":[83],"processors":[85],"become":[86],"crucial.":[87],"Additionally,":[88],"re-organizing":[89],"layout":[92,191],"fit":[94],"architectures,":[97],"array-of-structure":[100],"(AOS)":[101],"CPU,":[103],"structure-of-array":[104],"(SOA)":[105],"GPU,":[107],"coordinate":[109],"(COO)":[110],"format":[111,148,180],"ELLPACK":[113],"(ELL)":[114],"sparse":[116,147,171,178],"computation,":[117],"address":[118,144,172],"concern.":[120],"In":[121,197],"this":[122],"paper,":[123],"we":[124],"propose":[125],"a":[126,167],"hardware":[127],"memory":[128],"manager,":[129],"which":[130],"efficiently":[131],"optimizes":[132],"conversion":[134,149],"layouts":[137],"heterogeneous":[139],"on-the-fly.":[142],"We":[143],"coalescing":[145],"issue":[150],"in":[151],"our":[152,198,200],"design.":[153],"A":[154],"novel":[155],"ping-pong":[156],"transpose":[157],"architecture":[158],"is":[159],"devised":[160],"reorganize":[162],"non-coalescing":[163],"access":[164],"pattern,":[165],"histogram":[168],"unit":[169],"generator":[173],"presented":[175],"process":[177],"storage":[179],"transformation.":[181],"Our":[182],"design":[183,201],"reduces":[184],"overhead":[186],"transfer":[189],"transformation":[192],"among":[193],"GPU.":[196],"experiment,":[199],"achieves":[202],"68.5":[203],"2.19":[205],"times":[206],"speed":[207],"up":[208],"comparing":[209],"software-based":[211],"library":[212],"depending":[213],"on":[214],"size.":[216]},"counts_by_year":[{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
