{"id":"https://openalex.org/W4414199176","doi":"https://doi.org/10.1109/dac63849.2025.11133184","title":"Precon: A Precision-Convertible Architecture for Accelerating Quantized Deep Learning Models across Various Domains Including LLMs","display_name":"Precon: A Precision-Convertible Architecture for Accelerating Quantized Deep Learning Models across Various Domains Including LLMs","publication_year":2025,"publication_date":"2025-06-22","ids":{"openalex":"https://openalex.org/W4414199176","doi":"https://doi.org/10.1109/dac63849.2025.11133184"},"language":"en","primary_location":{"id":"doi:10.1109/dac63849.2025.11133184","is_oa":false,"landing_page_url":"https://doi.org/10.1109/dac63849.2025.11133184","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 62nd ACM/IEEE Design Automation Conference (DAC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101938959","display_name":"Jongwoo Park","orcid":"https://orcid.org/0009-0006-7558-3804"},"institutions":[{"id":"https://openalex.org/I35928602","display_name":"Kyung Hee University","ror":"https://ror.org/01zqcg218","country_code":"KR","type":"education","lineage":["https://openalex.org/I35928602"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Jongwoo Park","raw_affiliation_strings":["Kyung Hee University,Republic of Korea"],"affiliations":[{"raw_affiliation_string":"Kyung Hee University,Republic of Korea","institution_ids":["https://openalex.org/I35928602"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103126454","display_name":"Hyeonseong Kim","orcid":"https://orcid.org/0000-0002-9160-8876"},"institutions":[{"id":"https://openalex.org/I35928602","display_name":"Kyung Hee University","ror":"https://ror.org/01zqcg218","country_code":"KR","type":"education","lineage":["https://openalex.org/I35928602"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Hyeonseong Kim","raw_affiliation_strings":["Kyung Hee University,Republic of Korea"],"affiliations":[{"raw_affiliation_string":"Kyung Hee University,Republic of Korea","institution_ids":["https://openalex.org/I35928602"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112534520","display_name":"Jiyun Han","orcid":null},"institutions":[{"id":"https://openalex.org/I35928602","display_name":"Kyung Hee University","ror":"https://ror.org/01zqcg218","country_code":"KR","type":"education","lineage":["https://openalex.org/I35928602"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Jiyun Han","raw_affiliation_strings":["Kyung Hee University,Republic of Korea"],"affiliations":[{"raw_affiliation_string":"Kyung Hee University,Republic of Korea","institution_ids":["https://openalex.org/I35928602"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5034558336","display_name":"Seungkyu Choi","orcid":"https://orcid.org/0000-0002-3125-9707"},"institutions":[{"id":"https://openalex.org/I35928602","display_name":"Kyung Hee University","ror":"https://ror.org/01zqcg218","country_code":"KR","type":"education","lineage":["https://openalex.org/I35928602"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Seungkyu Choi","raw_affiliation_strings":["Kyung Hee University,Republic of Korea"],"affiliations":[{"raw_affiliation_string":"Kyung Hee University,Republic of Korea","institution_ids":["https://openalex.org/I35928602"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5101938959"],"corresponding_institution_ids":["https://openalex.org/I35928602"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.23975248,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"7"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.8259999752044678,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.8259999752044678,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.78329998254776,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10862","display_name":"AI in cancer detection","score":0.7360000014305115,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[],"concepts":[],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/dac63849.2025.11133184","is_oa":false,"landing_page_url":"https://doi.org/10.1109/dac63849.2025.11133184","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 62nd ACM/IEEE Design Automation Conference (DAC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":11,"referenced_works":["https://openalex.org/W2563860341","https://openalex.org/W2963163009","https://openalex.org/W2963367920","https://openalex.org/W3160017297","https://openalex.org/W3190062760","https://openalex.org/W3201271601","https://openalex.org/W4238341497","https://openalex.org/W4313069943","https://openalex.org/W4360831844","https://openalex.org/W4393407021","https://openalex.org/W4404738510"],"related_works":[],"abstract_inverted_index":{"The":[0],"sensitivity":[1],"of":[2,10,103,109],"LLMs":[3],"to":[4,42,83,94],"quantization":[5,21],"has":[6],"driven":[7],"the":[8,68,95,101],"development":[9],"hardware":[11,30],"accelerators":[12],"tailored":[13],"for":[14],"specific":[15],"low-precision":[16],"configurations":[17],"such":[18],"as":[19],"weight-only":[20],"and":[22,64,74,87,106],"mixed-precision,":[23],"which":[24],"can":[25],"introduce":[26],"inefficiencies":[27],"in":[28,90],"dedicated":[29],"architecture.":[31],"In":[32],"this":[33],"work,":[34],"we":[35],"propose":[36],"Precon,":[37],"a":[38,52],"precision-convertible":[39],"architecture":[40],"designed":[41],"accelerate":[43],"various":[44,98],"quantized":[45,110],"deep":[46],"learning":[47],"models,":[48],"particularly":[49],"LLMs,":[50],"through":[51],"unified":[53],"processing":[54],"unit.":[55],"By":[56],"enabling":[57],"on-the-fly":[58],"switching":[59],"between":[60],"half-float":[61],"(FP16)":[62],"decoding":[63],"integer":[65],"(INT)":[66],"decomposition,":[67],"design":[69],"effectively":[70],"supports":[71],"INT4-FP16,":[72],"INT4-INT4,":[73],"INT4INT8":[75],"arithmetic":[76],"within":[77],"shared":[78],"logic.":[79],"Precon":[80],"achieves":[81],"up":[82],"$4.1":[84],"\\times$":[85],"speedup":[86],"81.4%":[88],"reduction":[89],"energy":[91],"consumption":[92],"compared":[93],"baseline":[96],"across":[97],"domains,":[99],"including":[100],"support":[102],"both":[104],"accurate":[105],"efficient":[107],"acceleration":[108],"LLMs.":[111]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
