{"id":"https://openalex.org/W4360831992","doi":"https://doi.org/10.1109/hpca56546.2023.10071080","title":"ISOSceles: Accelerating Sparse CNNs through Inter-Layer Pipelining","display_name":"ISOSceles: Accelerating Sparse CNNs through Inter-Layer Pipelining","publication_year":2023,"publication_date":"2023-02-01","ids":{"openalex":"https://openalex.org/W4360831992","doi":"https://doi.org/10.1109/hpca56546.2023.10071080"},"language":"en","primary_location":{"id":"doi:10.1109/hpca56546.2023.10071080","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hpca56546.2023.10071080","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE International Symposium on High-Performance Computer Architecture (HPCA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100743976","display_name":"Yifan Yang","orcid":"https://orcid.org/0000-0002-8986-191X"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Yifan Yang","raw_affiliation_strings":["MIT CSAIL"],"affiliations":[{"raw_affiliation_string":"MIT CSAIL","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024384625","display_name":"Joel Emer","orcid":null},"institutions":[{"id":"https://openalex.org/I1304085615","display_name":"Nvidia (United Kingdom)","ror":"https://ror.org/02kr42612","country_code":"GB","type":"company","lineage":["https://openalex.org/I1304085615","https://openalex.org/I4210127875"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Joel S. Emer","raw_affiliation_strings":["MIT CSAIL / NVIDIA"],"affiliations":[{"raw_affiliation_string":"MIT CSAIL / NVIDIA","institution_ids":["https://openalex.org/I1304085615"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5051586110","display_name":"Daniel S\u00e1nchez","orcid":"https://orcid.org/0000-0002-6048-3994"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Daniel Sanchez","raw_affiliation_strings":["MIT CSAIL"],"affiliations":[{"raw_affiliation_string":"MIT CSAIL","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5100743976"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.9038,"has_fulltext":false,"cited_by_count":24,"citation_normalized_percentile":{"value":0.92622136,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"598","last_page":"610"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9955999851226807,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8100579977035522},{"id":"https://openalex.org/keywords/isosceles-triangle","display_name":"Isosceles triangle","score":0.8006647825241089},{"id":"https://openalex.org/keywords/dataflow","display_name":"Dataflow","score":0.7269300222396851},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.644317090511322},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.587149441242218},{"id":"https://openalex.org/keywords/scheduling","display_name":"Scheduling (production processes)","score":0.4615175426006317},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4454715847969055},{"id":"https://openalex.org/keywords/layer","display_name":"Layer (electronics)","score":0.4107286036014557},{"id":"https://openalex.org/keywords/materials-science","display_name":"Materials science","score":0.09400933980941772},{"id":"https://openalex.org/keywords/nanotechnology","display_name":"Nanotechnology","score":0.08104446530342102}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8100579977035522},{"id":"https://openalex.org/C98653994","wikidata":"https://www.wikidata.org/wiki/Q875937","display_name":"Isosceles triangle","level":2,"score":0.8006647825241089},{"id":"https://openalex.org/C96324660","wikidata":"https://www.wikidata.org/wiki/Q205446","display_name":"Dataflow","level":2,"score":0.7269300222396851},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.644317090511322},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.587149441242218},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.4615175426006317},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4454715847969055},{"id":"https://openalex.org/C2779227376","wikidata":"https://www.wikidata.org/wiki/Q6505497","display_name":"Layer (electronics)","level":2,"score":0.4107286036014557},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.09400933980941772},{"id":"https://openalex.org/C171250308","wikidata":"https://www.wikidata.org/wiki/Q11468","display_name":"Nanotechnology","level":1,"score":0.08104446530342102},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/hpca56546.2023.10071080","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hpca56546.2023.10071080","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE International Symposium on High-Performance Computer Architecture (HPCA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/7","score":0.4699999988079071,"display_name":"Affordable and clean energy"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320306087","display_name":"Semiconductor Research Corporation","ror":"https://ror.org/047z4n946"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":44,"referenced_works":["https://openalex.org/W2048266589","https://openalex.org/W2097117768","https://openalex.org/W2108598243","https://openalex.org/W2150348132","https://openalex.org/W2194775991","https://openalex.org/W2245094585","https://openalex.org/W2442974303","https://openalex.org/W2516141709","https://openalex.org/W2541839172","https://openalex.org/W2590246587","https://openalex.org/W2777372517","https://openalex.org/W2794952988","https://openalex.org/W2898123186","https://openalex.org/W2935331687","https://openalex.org/W2940862705","https://openalex.org/W2945146780","https://openalex.org/W2953212265","https://openalex.org/W2963363373","https://openalex.org/W2963367920","https://openalex.org/W2979310060","https://openalex.org/W2979439447","https://openalex.org/W3015783148","https://openalex.org/W3016832937","https://openalex.org/W3103168911","https://openalex.org/W3121402054","https://openalex.org/W3155922894","https://openalex.org/W3187481008","https://openalex.org/W3187908937","https://openalex.org/W3188321821","https://openalex.org/W3206290655","https://openalex.org/W3207265322","https://openalex.org/W4212788319","https://openalex.org/W4236868170","https://openalex.org/W4240168186","https://openalex.org/W4247470470","https://openalex.org/W4249932213","https://openalex.org/W4254260720","https://openalex.org/W4297775537","https://openalex.org/W4300171661","https://openalex.org/W6637242042","https://openalex.org/W6637373629","https://openalex.org/W6677580257","https://openalex.org/W6737664043","https://openalex.org/W6773667195"],"related_works":["https://openalex.org/W2795405095","https://openalex.org/W2263342410","https://openalex.org/W2991387667","https://openalex.org/W2795954609","https://openalex.org/W4287901079","https://openalex.org/W134513340","https://openalex.org/W3002130224","https://openalex.org/W4381295707","https://openalex.org/W2293118914","https://openalex.org/W2150836909"],"abstract_inverted_index":{"Sparse":[0],"CNNs":[1,15],"dramatically":[2,50],"reduce":[3],"computation":[4],"and":[5,111,129,132,165],"storage":[6],"costs":[7],"over":[8,122],"dense":[9,97],"ones.":[10],"But":[11],"sparsity":[12,146],"also":[13],"makes":[14],"more":[16],"data-intensive,":[17],"as":[18],"each":[19],"value":[20],"is":[21,86],"reused":[22],"fewer":[23],"times.":[24],"Thus,":[25],"current":[26],"sparse":[27,46,152],"CNN":[28,47],"accelerators,":[29],"which":[30,93],"process":[31],"one":[32],"layer":[33,75],"at":[34],"a":[35,44,65,102,148,156],"time,":[36],"are":[37,69,94],"bottlenecked":[38],"by":[39,72,159,168],"memory":[40],"traffic.We":[41],"present":[42],"ISOSceles,":[43],"new":[45],"accelerator":[48,158],"that":[49,64,108,145],"reduces":[51,166],"data":[52],"movement":[53],"through":[54],"inter-layer":[55],"pipelining:":[56],"overlapping":[57],"the":[58,73,115,140],"execution":[59],"of":[60,151],"consecutive":[61],"layers":[62,138],"so":[63],"layer\u2019s":[66],"output":[67],"activations":[68],"quickly":[70],"consumed":[71],"next":[74],"without":[76],"spilling":[77],"them":[78],"off-chip.":[79],"Pipelining":[80],"greatly":[81,118],"increases":[82],"reuse,":[83],"but":[84],"it":[85],"challenging":[87],"to":[88,96,135,163,171],"implement":[89],"with":[90],"existing":[91,123],"approaches,":[92],"limited":[95],"CNNs.":[98],"ISOSceles":[99,125,154],"relies":[100],"on":[101],"novel":[103],"input-stationary":[104],"output-stationary":[105],"(IS-OS)":[106],"dataflow":[107],"consumes":[109],"inputs":[110],"produces":[112],"outputs":[113],"in":[114,143],"same":[116],"order,":[117],"reducing":[119],"intermediate":[120],"sizes":[121],"dataflows.":[124],"implements":[126],"IS-OS":[127],"efficiently":[128],"leverages":[130],"time-multiplexing":[131],"dynamic":[133],"scheduling":[134],"pipeline":[136],"multiple":[137],"despite":[139],"large":[141],"variations":[142],"work":[144],"induces.On":[147],"wide":[149],"range":[150],"CNNs,":[153],"outperforms":[155],"state-of-the-art":[157],"gmean":[160],"4.3\u00d7":[161],"(up":[162,170],"6.7\u00d7),":[164],"traffic":[167],"4.7\u00d7":[169],"8.5\u00d7)":[172],"while":[173],"using":[174],"less":[175],"area.":[176]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":9},{"year":2024,"cited_by_count":9},{"year":2023,"cited_by_count":4}],"updated_date":"2026-03-25T14:56:36.534964","created_date":"2025-10-10T00:00:00"}
