{"id":"https://openalex.org/W7141670745","doi":"https://doi.org/10.1109/icce67443.2026.11449825","title":"Enabling On-Chip Data Sharing on GPU for On-Device Training","display_name":"Enabling On-Chip Data Sharing on GPU for On-Device Training","publication_year":2026,"publication_date":"2026-02-03","ids":{"openalex":"https://openalex.org/W7141670745","doi":"https://doi.org/10.1109/icce67443.2026.11449825"},"language":null,"primary_location":{"id":"doi:10.1109/icce67443.2026.11449825","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icce67443.2026.11449825","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2026 IEEE International Conference on Consumer Electronics (ICCE)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5044670967","display_name":"Jiho Yoo","orcid":"https://orcid.org/0000-0003-4873-9157"},"institutions":[{"id":"https://openalex.org/I2250650973","display_name":"Samsung (South Korea)","ror":"https://ror.org/04w3jy968","country_code":"KR","type":"company","lineage":["https://openalex.org/I2250650973"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Jeongjoon Yoo","raw_affiliation_strings":["Samsung Electronics,Hwasung,Republic of Korea"],"affiliations":[{"raw_affiliation_string":"Samsung Electronics,Hwasung,Republic of Korea","institution_ids":["https://openalex.org/I2250650973"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5130780454","display_name":"Isaac Hong","orcid":null},"institutions":[{"id":"https://openalex.org/I2250650973","display_name":"Samsung (South Korea)","ror":"https://ror.org/04w3jy968","country_code":"KR","type":"company","lineage":["https://openalex.org/I2250650973"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Isaac Hong","raw_affiliation_strings":["Samsung Electronics,Hwasung,Republic of Korea"],"affiliations":[{"raw_affiliation_string":"Samsung Electronics,Hwasung,Republic of Korea","institution_ids":["https://openalex.org/I2250650973"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5044670967"],"corresponding_institution_ids":["https://openalex.org/I2250650973"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.91414268,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"2"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11283","display_name":"Experimental Learning in Engineering","score":0.05979999899864197,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11283","display_name":"Experimental Learning in Engineering","score":0.05979999899864197,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13937","display_name":"Genetics, Bioinformatics, and Biomedical Research","score":0.05420000106096268,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T14067","display_name":"Cloud Computing and Remote Desktop Technologies","score":0.037300001829862595,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/training","display_name":"Training (meteorology)","score":0.5315999984741211},{"id":"https://openalex.org/keywords/data-sharing","display_name":"Data sharing","score":0.32519999146461487},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.28999999165534973},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.24940000474452972},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.24500000476837158}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6870999932289124},{"id":"https://openalex.org/C2777211547","wikidata":"https://www.wikidata.org/wiki/Q17141490","display_name":"Training (meteorology)","level":2,"score":0.5315999984741211},{"id":"https://openalex.org/C2779965156","wikidata":"https://www.wikidata.org/wiki/Q5227350","display_name":"Data sharing","level":3,"score":0.32519999146461487},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.28999999165534973},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2856999933719635},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.2605000138282776},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.24940000474452972},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.24500000476837158},{"id":"https://openalex.org/C133462117","wikidata":"https://www.wikidata.org/wiki/Q4929239","display_name":"Data collection","level":2,"score":0.24040000140666962},{"id":"https://openalex.org/C163985040","wikidata":"https://www.wikidata.org/wiki/Q1172399","display_name":"Data acquisition","level":2,"score":0.2337000072002411}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icce67443.2026.11449825","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icce67443.2026.11449825","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2026 IEEE International Conference on Consumer Electronics (ICCE)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":2,"referenced_works":["https://openalex.org/W4229055905","https://openalex.org/W4408861043"],"related_works":[],"abstract_inverted_index":{"In":[0],"this":[1],"paper,":[2],"we":[3,35],"propose":[4],"a":[5,41,85],"GPU":[6],"architecture":[7],"specifically":[8],"optimized":[9],"for":[10],"on-device":[11,82],"training,":[12],"addressing":[13],"the":[14,65,87,95],"performance":[15,77],"degradation":[16],"and":[17,52,73,78],"excessive":[18],"power":[19,96],"consumption":[20,97],"of":[21],"conventional":[22],"mobile":[23],"GPUs":[24],"caused":[25],"by":[26,92,100],"frequent":[27],"global":[28,57],"memory":[29,44,70],"accesses.":[30],"To":[31],"mitigate":[32],"these":[33],"issues,":[34],"introduce":[36],"Kernel":[37],"Shared":[38],"Memory":[39],"(KSM),":[40],"novel":[42],"on-chip":[43],"that":[45],"enables":[46],"direct":[47],"data":[48,62],"exchange":[49],"between":[50],"producer":[51],"consumer":[53],"kernels":[54],"without":[55],"accessing":[56],"memory.":[58],"By":[59],"allowing":[60],"inter-kernel":[61],"sharing":[63],"within":[64],"GPU,":[66],"KSM":[67],"effectively":[68],"reduces":[69],"access":[71],"latency":[72],"significantly":[74],"improves":[75],"both":[76],"energy":[79],"efficiency":[80],"during":[81],"training.":[83],"As":[84],"result,":[86],"execution":[88],"time":[89],"is":[90,98],"improved":[91],"2.9x,":[93],"while":[94],"reduced":[99],"more":[101],"than":[102],"50%.":[103]},"counts_by_year":[],"updated_date":"2026-03-29T06:01:01.467347","created_date":"2026-03-28T00:00:00"}
