{"id":"https://openalex.org/W2944280939","doi":"https://doi.org/10.1145/3310273.3321563","title":"Iterative machine learning (IterML) for effective parameter pruning and tuning in accelerators","display_name":"Iterative machine learning (IterML) for effective parameter pruning and tuning in accelerators","publication_year":2019,"publication_date":"2019-04-30","ids":{"openalex":"https://openalex.org/W2944280939","doi":"https://doi.org/10.1145/3310273.3321563","mag":"2944280939"},"language":"en","primary_location":{"id":"doi:10.1145/3310273.3321563","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3310273.3321563","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3310273.3321563","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 16th ACM International Conference on Computing Frontiers","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3310273.3321563","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5024705915","display_name":"Xuewen Cui","orcid":"https://orcid.org/0000-0002-0173-5215"},"institutions":[{"id":"https://openalex.org/I859038795","display_name":"Virginia Tech","ror":"https://ror.org/02smfhw86","country_code":"US","type":"education","lineage":["https://openalex.org/I859038795"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Xuewen Cui","raw_affiliation_strings":["Virginia Tech"],"affiliations":[{"raw_affiliation_string":"Virginia Tech","institution_ids":["https://openalex.org/I859038795"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5058539554","display_name":"Wu-chun Feng","orcid":"https://orcid.org/0000-0002-6015-0727"},"institutions":[{"id":"https://openalex.org/I859038795","display_name":"Virginia Tech","ror":"https://ror.org/02smfhw86","country_code":"US","type":"education","lineage":["https://openalex.org/I859038795"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Wu-chun Feng","raw_affiliation_strings":["Virginia Tech"],"affiliations":[{"raw_affiliation_string":"Virginia Tech","institution_ids":["https://openalex.org/I859038795"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5024705915"],"corresponding_institution_ids":["https://openalex.org/I859038795"],"apc_list":null,"apc_paid":null,"fwci":0.9631,"has_fulltext":true,"cited_by_count":5,"citation_normalized_percentile":{"value":0.72384555,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"16","last_page":"23"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10904","display_name":"Embedded Systems Design Techniques","score":0.9861000180244446,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9796000123023987,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8238139152526855},{"id":"https://openalex.org/keywords/hyperparameter","display_name":"Hyperparameter","score":0.7549700736999512},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.667697012424469},{"id":"https://openalex.org/keywords/compiler","display_name":"Compiler","score":0.5799863934516907},{"id":"https://openalex.org/keywords/pruning","display_name":"Pruning","score":0.5392301082611084},{"id":"https://openalex.org/keywords/heuristics","display_name":"Heuristics","score":0.5007269382476807},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.4829522967338562},{"id":"https://openalex.org/keywords/thread","display_name":"Thread (computing)","score":0.44941601157188416},{"id":"https://openalex.org/keywords/optimizing-compiler","display_name":"Optimizing compiler","score":0.440559059381485},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.43801695108413696},{"id":"https://openalex.org/keywords/computer-engineering","display_name":"Computer engineering","score":0.41927406191825867},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.2883966565132141},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.1150347888469696}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8238139152526855},{"id":"https://openalex.org/C8642999","wikidata":"https://www.wikidata.org/wiki/Q4171168","display_name":"Hyperparameter","level":2,"score":0.7549700736999512},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.667697012424469},{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.5799863934516907},{"id":"https://openalex.org/C108010975","wikidata":"https://www.wikidata.org/wiki/Q500094","display_name":"Pruning","level":2,"score":0.5392301082611084},{"id":"https://openalex.org/C127705205","wikidata":"https://www.wikidata.org/wiki/Q5748245","display_name":"Heuristics","level":2,"score":0.5007269382476807},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.4829522967338562},{"id":"https://openalex.org/C138101251","wikidata":"https://www.wikidata.org/wiki/Q213092","display_name":"Thread (computing)","level":2,"score":0.44941601157188416},{"id":"https://openalex.org/C190902152","wikidata":"https://www.wikidata.org/wiki/Q1325106","display_name":"Optimizing compiler","level":3,"score":0.440559059381485},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.43801695108413696},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.41927406191825867},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2883966565132141},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.1150347888469696},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C6557445","wikidata":"https://www.wikidata.org/wiki/Q173113","display_name":"Agronomy","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3310273.3321563","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3310273.3321563","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3310273.3321563","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 16th ACM International Conference on Computing Frontiers","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3310273.3321563","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3310273.3321563","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3310273.3321563","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 16th ACM International Conference on Computing Frontiers","raw_type":"proceedings-article"},"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","score":0.44999998807907104,"id":"https://metadata.un.org/sdg/9"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2944280939.pdf","grobid_xml":"https://content.openalex.org/works/W2944280939.grobid-xml"},"referenced_works_count":20,"referenced_works":["https://openalex.org/W57243869","https://openalex.org/W1541729506","https://openalex.org/W1863336885","https://openalex.org/W2050127041","https://openalex.org/W2070544163","https://openalex.org/W2096858484","https://openalex.org/W2101234009","https://openalex.org/W2128539477","https://openalex.org/W2153492376","https://openalex.org/W2167334577","https://openalex.org/W2623016866","https://openalex.org/W2725757310","https://openalex.org/W2732023272","https://openalex.org/W2733653163","https://openalex.org/W2767897789","https://openalex.org/W2808350202","https://openalex.org/W2885840893","https://openalex.org/W2997701623","https://openalex.org/W4243261006","https://openalex.org/W6675354045"],"related_works":["https://openalex.org/W2479014312","https://openalex.org/W1583465708","https://openalex.org/W2082035004","https://openalex.org/W4236710543","https://openalex.org/W1547259518","https://openalex.org/W4230029438","https://openalex.org/W4240445122","https://openalex.org/W4232891356","https://openalex.org/W3033052750","https://openalex.org/W1582485370"],"abstract_inverted_index":{"With":[0],"the":[1,13,40,48,54,61,95,113,121],"rise":[2],"of":[3,42,83,115,124],"accelerators":[4],"(e.g.,":[5,106],"GPUs,":[6],"FPGAs,":[7],"and":[8,20,50,73,80,110],"APUs)":[9],"in":[10,86],"computing":[11,15,84],"systems,":[12],"parallel":[14],"community":[16],"needs":[17],"better":[18],"tools":[19],"mechanisms":[21],"with":[22],"which":[23],"to":[24,33,37,53,76,88,118,133],"productively":[25],"extract":[26],"performance.":[27,91],"While":[28],"modern":[29],"compilers":[30],"provide":[31],"flags":[32],"activate":[34],"different":[35],"optimizations":[36,125],"improve":[38,89],"performance,":[39],"effectiveness":[41],"such":[43],"automated":[44],"optimization":[45,137],"depends":[46],"on":[47,67,97,100],"algorithm":[49,66,99],"its":[51],"mapping":[52],"underlying":[55],"accelerator":[56,69,102],"architecture.":[57],"Currently,":[58],"however,":[59],"extracting":[60],"best":[62],"performance":[63,96],"from":[64],"an":[65,68,98,101],"requires":[70,103],"significant":[71],"expertise":[72],"manual":[74],"effort":[75],"exploit":[77],"both":[78],"spatial":[79],"temporal":[81],"sharing":[82],"resources":[85],"order":[87],"overall":[90],"In":[92],"particular,":[93],"maximizing":[94],"extensive":[104],"hyperparameter":[105,116],"thread-block":[107],"size)":[108],"selection":[109],"tuning.":[111],"Given":[112],"myriad":[114],"dimensions":[117],"optimize":[119],"across,":[120],"search":[122],"space":[123],"is":[126],"generally":[127],"extremely":[128],"large,":[129],"making":[130],"it":[131],"infeasible":[132],"exhaustively":[134],"evaluate":[135],"each":[136],"configuration.":[138]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2022,"cited_by_count":2},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
