{"id":"https://openalex.org/W4233748228","doi":"https://doi.org/10.1109/aspdac.2018.8297377","title":"Accelerator-centric deep learning systems for enhanced scalability, energy-efficiency, and programmability","display_name":"Accelerator-centric deep learning systems for enhanced scalability, energy-efficiency, and programmability","publication_year":2018,"publication_date":"2018-01-01","ids":{"openalex":"https://openalex.org/W4233748228","doi":"https://doi.org/10.1109/aspdac.2018.8297377"},"language":"en","primary_location":{"id":"doi:10.1109/aspdac.2018.8297377","is_oa":false,"landing_page_url":"https://doi.org/10.1109/aspdac.2018.8297377","pdf_url":null,"source":{"id":"https://openalex.org/S4363608266","display_name":"2018 23rd Asia and South Pacific Design Automation Conference (ASP-DAC)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 23rd Asia and South Pacific Design Automation Conference (ASP-DAC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5091648103","display_name":"Minsoo Rhu","orcid":"https://orcid.org/0000-0003-3303-8681"},"institutions":[{"id":"https://openalex.org/I123900574","display_name":"Pohang University of Science and Technology","ror":"https://ror.org/04xysgw12","country_code":"KR","type":"education","lineage":["https://openalex.org/I123900574"]},{"id":"https://openalex.org/I2799891827","display_name":"Korea Post","ror":"https://ror.org/00p45d091","country_code":"KR","type":"government","lineage":["https://openalex.org/I2799891827","https://openalex.org/I2801339556","https://openalex.org/I4387152098"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Minsoo Rhu","raw_affiliation_strings":["POSTECH"],"affiliations":[{"raw_affiliation_string":"POSTECH","institution_ids":["https://openalex.org/I2799891827","https://openalex.org/I123900574"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5091648103"],"corresponding_institution_ids":["https://openalex.org/I123900574","https://openalex.org/I2799891827"],"apc_list":null,"apc_paid":null,"fwci":0.1204,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.54010695,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"527","last_page":"533"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8236823081970215},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.7867144346237183},{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.6081734895706177},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.5951513648033142},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.5584537386894226},{"id":"https://openalex.org/keywords/application-specific-integrated-circuit","display_name":"Application-specific integrated circuit","score":0.525917649269104},{"id":"https://openalex.org/keywords/virtualization","display_name":"Virtualization","score":0.49667125940322876},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.48013779520988464},{"id":"https://openalex.org/keywords/efficient-energy-use","display_name":"Efficient energy use","score":0.4691326320171356},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.44334906339645386},{"id":"https://openalex.org/keywords/memory-management","display_name":"Memory management","score":0.42844825983047485},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.32871776819229126},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.24515420198440552},{"id":"https://openalex.org/keywords/cloud-computing","display_name":"Cloud computing","score":0.09916827082633972},{"id":"https://openalex.org/keywords/semiconductor-memory","display_name":"Semiconductor memory","score":0.08502727746963501},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.08280321955680847}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8236823081970215},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.7867144346237183},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.6081734895706177},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5951513648033142},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.5584537386894226},{"id":"https://openalex.org/C77390884","wikidata":"https://www.wikidata.org/wiki/Q217302","display_name":"Application-specific integrated circuit","level":2,"score":0.525917649269104},{"id":"https://openalex.org/C513985346","wikidata":"https://www.wikidata.org/wiki/Q270471","display_name":"Virtualization","level":3,"score":0.49667125940322876},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.48013779520988464},{"id":"https://openalex.org/C2742236","wikidata":"https://www.wikidata.org/wiki/Q924713","display_name":"Efficient energy use","level":2,"score":0.4691326320171356},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.44334906339645386},{"id":"https://openalex.org/C176649486","wikidata":"https://www.wikidata.org/wiki/Q2308807","display_name":"Memory management","level":3,"score":0.42844825983047485},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.32871776819229126},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.24515420198440552},{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.09916827082633972},{"id":"https://openalex.org/C98986596","wikidata":"https://www.wikidata.org/wiki/Q1143031","display_name":"Semiconductor memory","level":2,"score":0.08502727746963501},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.08280321955680847},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/aspdac.2018.8297377","is_oa":false,"landing_page_url":"https://doi.org/10.1109/aspdac.2018.8297377","pdf_url":null,"source":{"id":"https://openalex.org/S4363608266","display_name":"2018 23rd Asia and South Pacific Design Automation Conference (ASP-DAC)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 23rd Asia and South Pacific Design Automation Conference (ASP-DAC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Affordable and clean energy","score":0.8700000047683716,"id":"https://metadata.un.org/sdg/7"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":38,"referenced_works":["https://openalex.org/W1442374986","https://openalex.org/W1686810756","https://openalex.org/W1789336918","https://openalex.org/W1981220134","https://openalex.org/W2079735306","https://openalex.org/W2097117768","https://openalex.org/W2162390675","https://openalex.org/W2163605009","https://openalex.org/W2168231600","https://openalex.org/W2172654076","https://openalex.org/W2186615578","https://openalex.org/W2194775991","https://openalex.org/W2235673048","https://openalex.org/W2285660444","https://openalex.org/W2300242332","https://openalex.org/W2330672121","https://openalex.org/W2489529491","https://openalex.org/W2516141709","https://openalex.org/W2535374105","https://openalex.org/W2606722458","https://openalex.org/W2625457103","https://openalex.org/W2753665345","https://openalex.org/W2763421725","https://openalex.org/W2952230511","https://openalex.org/W2962736495","https://openalex.org/W2962758826","https://openalex.org/W2962821792","https://openalex.org/W2962911728","https://openalex.org/W2963526839","https://openalex.org/W4240168186","https://openalex.org/W4293318097","https://openalex.org/W6628377381","https://openalex.org/W6683722107","https://openalex.org/W6684191040","https://openalex.org/W6684859321","https://openalex.org/W6686509673","https://openalex.org/W6697071109","https://openalex.org/W6698200048"],"related_works":["https://openalex.org/W2595172197","https://openalex.org/W2084856301","https://openalex.org/W2127970246","https://openalex.org/W4382618745","https://openalex.org/W2885125400","https://openalex.org/W1001352512","https://openalex.org/W1989889224","https://openalex.org/W2748922771","https://openalex.org/W1987128138","https://openalex.org/W2743976221"],"abstract_inverted_index":{"Deep":[0],"learning":[1,192],"(DL)":[2],"has":[3],"been":[4],"successfully":[5],"deployed":[6],"in":[7,41],"various":[8],"application":[9],"domains":[10],"ranging":[11],"from":[12],"computer":[13],"vision,":[14],"speech":[15],"recognition,":[16],"to":[17,29],"natural":[18],"language":[19],"processing.":[20],"As":[21],"the":[22,26,57,66,71,77,96,106,132,139,153,184],"network":[23],"models":[24,32],"and":[25,45,105,137,173,189],"datasets":[27],"used":[28],"train":[30],"these":[31],"scale,":[33],"system":[34,50,177,193],"architects":[35],"are":[36,63],"faced":[37],"with":[38],"new":[39],"challenges":[40,166],"designing":[42,120],"a":[43,84,146,179,187],"scalable":[44,121,188],"energy-efficient":[46,190],"high-performance":[47],"computing":[48],"(HPC)":[49],"for":[51,124,183],"training":[52],"DL":[53,61,79,176],"algorithms.":[54],"One":[55],"of":[56,76,156,186],"key":[58],"obstacles":[59],"that":[60,98,150],"researchers":[62],"facing":[64],"is":[65],"memory":[67,74,133,147,154,168],"capacity":[68,134],"bottleneck,":[69],"where":[70],"limited":[72],"physical":[73],"size":[75],"PCIe-attached":[78],"accelerator":[80,89],"(whether":[81],"it":[82],"be":[83,100],"discrete":[85],"GPU":[86],"or":[87],"ASIC":[88],"like":[90],"Google's":[91],"Tensor":[92],"Processing":[93],"Unit)":[94],"constrains":[95],"algorithm":[97],"can":[99],"studied.":[101],"In":[102,126],"this":[103,127],"paper,":[104],"associated":[107],"invited":[108],"special":[109],"session":[110],"talk,":[111],"we":[112,129],"first":[113],"discuss":[114,131],"recent":[115],"research":[116,181],"literature":[117],"geared":[118],"towards":[119],"HPC":[122],"systems":[123],"DL.":[125],"context,":[128],"then":[130],"wall":[135],"problem":[136],"introduce":[138],"work":[140],"on":[141,164],"virtualized":[142],"deep":[143,191],"neural":[144],"networks,":[145],"virtualization":[148,169],"solution":[149],"systematically":[151],"reduces":[152],"consumption":[155],"DNN":[157,167],"training.":[158],"We":[159],"conclude":[160],"by":[161],"providing":[162],"projections":[163],"future":[165],"will":[170],"encounter":[171],"upon":[172],"suggest":[174],"accelerator-centric":[175],"as":[178],"promising":[180],"direction":[182],"development":[185],"architecture.":[194]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2018,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
