{"id":"https://openalex.org/W2897070804","doi":"https://doi.org/10.1145/3243176.3243180","title":"A portable, automatic data qantizer for deep neural networks","display_name":"A portable, automatic data qantizer for deep neural networks","publication_year":2018,"publication_date":"2018-10-10","ids":{"openalex":"https://openalex.org/W2897070804","doi":"https://doi.org/10.1145/3243176.3243180","mag":"2897070804"},"language":"en","primary_location":{"id":"doi:10.1145/3243176.3243180","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3243176.3243180","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 27th International Conference on Parallel Architectures and Compilation Techniques","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101979936","display_name":"Young H. Oh","orcid":"https://orcid.org/0000-0001-5971-9093"},"institutions":[{"id":"https://openalex.org/I848706","display_name":"Sungkyunkwan University","ror":"https://ror.org/04q78tk20","country_code":"KR","type":"education","lineage":["https://openalex.org/I848706"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Young H. Oh","raw_affiliation_strings":["Sungkyunkwan University, Suwon, Korea"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Sungkyunkwan University, Suwon, Korea","institution_ids":["https://openalex.org/I848706"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058029021","display_name":"Quan Quan","orcid":"https://orcid.org/0000-0001-8216-8998"},"institutions":[{"id":"https://openalex.org/I139264467","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542","country_code":"KR","type":"education","lineage":["https://openalex.org/I139264467"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Quan Quan","raw_affiliation_strings":["Seoul National University, Seoul, Korea"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Seoul National University, Seoul, Korea","institution_ids":["https://openalex.org/I139264467"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100644919","display_name":"Dae-Yeon Kim","orcid":"https://orcid.org/0000-0001-9396-480X"},"institutions":[{"id":"https://openalex.org/I139264467","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542","country_code":"KR","type":"education","lineage":["https://openalex.org/I139264467"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Daeyeon Kim","raw_affiliation_strings":["Seoul National University, Seoul, Korea"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Seoul National University, Seoul, Korea","institution_ids":["https://openalex.org/I139264467"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043497695","display_name":"Seonghak Kim","orcid":"https://orcid.org/0000-0002-0772-7558"},"institutions":[{"id":"https://openalex.org/I139264467","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542","country_code":"KR","type":"education","lineage":["https://openalex.org/I139264467"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Seonghak Kim","raw_affiliation_strings":["Seoul National University, Seoul, Korea"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Seoul National University, Seoul, Korea","institution_ids":["https://openalex.org/I139264467"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101780114","display_name":"Jun Heo","orcid":"https://orcid.org/0009-0007-7452-3030"},"institutions":[{"id":"https://openalex.org/I139264467","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542","country_code":"KR","type":"education","lineage":["https://openalex.org/I139264467"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Jun Heo","raw_affiliation_strings":["Seoul National University, Seoul, Korea"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Seoul National University, Seoul, Korea","institution_ids":["https://openalex.org/I139264467"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040276456","display_name":"Sung\u2010jun Jung","orcid":"https://orcid.org/0000-0002-9050-0433"},"institutions":[{"id":"https://openalex.org/I139264467","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542","country_code":"KR","type":"education","lineage":["https://openalex.org/I139264467"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Sungjun Jung","raw_affiliation_strings":["Seoul National University, Seoul, Korea"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Seoul National University, Seoul, Korea","institution_ids":["https://openalex.org/I139264467"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041407656","display_name":"Jae-Young Jang","orcid":"https://orcid.org/0000-0002-3922-8542"},"institutions":[{"id":"https://openalex.org/I848706","display_name":"Sungkyunkwan University","ror":"https://ror.org/04q78tk20","country_code":"KR","type":"education","lineage":["https://openalex.org/I848706"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Jaeyoung Jang","raw_affiliation_strings":["Sungkyunkwan University, Suwon, Korea"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Sungkyunkwan University, Suwon, Korea","institution_ids":["https://openalex.org/I848706"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100415738","display_name":"Jae Wook Lee","orcid":"https://orcid.org/0000-0002-8756-0195"},"institutions":[{"id":"https://openalex.org/I139264467","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542","country_code":"KR","type":"education","lineage":["https://openalex.org/I139264467"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Jae W. Lee","raw_affiliation_strings":["Seoul National University, Seoul, Korea"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Seoul National University, Seoul, Korea","institution_ids":["https://openalex.org/I139264467"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.6961,"has_fulltext":false,"cited_by_count":25,"citation_normalized_percentile":{"value":0.88797576,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"14"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9962000250816345,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7755780816078186},{"id":"https://openalex.org/keywords/quantization","display_name":"Quantization (signal processing)","score":0.7066516280174255},{"id":"https://openalex.org/keywords/floating-point","display_name":"Floating point","score":0.5862950086593628},{"id":"https://openalex.org/keywords/memory-footprint","display_name":"Memory footprint","score":0.5654133558273315},{"id":"https://openalex.org/keywords/computer-engineering","display_name":"Computer engineering","score":0.5077568292617798},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.4798933267593384},{"id":"https://openalex.org/keywords/high-memory","display_name":"High memory","score":0.4369751214981079},{"id":"https://openalex.org/keywords/reduction","display_name":"Reduction (mathematics)","score":0.425004780292511},{"id":"https://openalex.org/keywords/deep-neural-networks","display_name":"Deep neural networks","score":0.411424458026886},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.3647320568561554},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.3549235463142395},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3419821858406067},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.22995898127555847},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.10276764631271362}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7755780816078186},{"id":"https://openalex.org/C28855332","wikidata":"https://www.wikidata.org/wiki/Q198099","display_name":"Quantization (signal processing)","level":2,"score":0.7066516280174255},{"id":"https://openalex.org/C84211073","wikidata":"https://www.wikidata.org/wiki/Q117879","display_name":"Floating point","level":2,"score":0.5862950086593628},{"id":"https://openalex.org/C74912251","wikidata":"https://www.wikidata.org/wiki/Q6815727","display_name":"Memory footprint","level":2,"score":0.5654133558273315},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.5077568292617798},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.4798933267593384},{"id":"https://openalex.org/C2781357197","wikidata":"https://www.wikidata.org/wiki/Q5757597","display_name":"High memory","level":2,"score":0.4369751214981079},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.425004780292511},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.411424458026886},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.3647320568561554},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.3549235463142395},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3419821858406067},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.22995898127555847},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.10276764631271362},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3243176.3243180","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3243176.3243180","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 27th International Conference on Parallel Architectures and Compilation Techniques","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":68,"referenced_works":["https://openalex.org/W1575833922","https://openalex.org/W1686810756","https://openalex.org/W1799366690","https://openalex.org/W1825672851","https://openalex.org/W1975799560","https://openalex.org/W1976251241","https://openalex.org/W2031489346","https://openalex.org/W2034761517","https://openalex.org/W2048266589","https://openalex.org/W2055312318","https://openalex.org/W2064675550","https://openalex.org/W2070897293","https://openalex.org/W2094756095","https://openalex.org/W2096733369","https://openalex.org/W2097117768","https://openalex.org/W2100218206","https://openalex.org/W2108598243","https://openalex.org/W2119144962","https://openalex.org/W2145339207","https://openalex.org/W2155893237","https://openalex.org/W2156547346","https://openalex.org/W2160815625","https://openalex.org/W2171928131","https://openalex.org/W2177847924","https://openalex.org/W2194775991","https://openalex.org/W2198190323","https://openalex.org/W2246760854","https://openalex.org/W2276486856","https://openalex.org/W2286365479","https://openalex.org/W2291160084","https://openalex.org/W2300242332","https://openalex.org/W2319920447","https://openalex.org/W2330958039","https://openalex.org/W2337344472","https://openalex.org/W2541839172","https://openalex.org/W2560017826","https://openalex.org/W2563587242","https://openalex.org/W2570343428","https://openalex.org/W2585560244","https://openalex.org/W2593245696","https://openalex.org/W2606722458","https://openalex.org/W2607579284","https://openalex.org/W2608702473","https://openalex.org/W2612864759","https://openalex.org/W2618530766","https://openalex.org/W2618564128","https://openalex.org/W2763421725","https://openalex.org/W2793950911","https://openalex.org/W2798956872","https://openalex.org/W2883929540","https://openalex.org/W2951008357","https://openalex.org/W2953212265","https://openalex.org/W2962988160","https://openalex.org/W2964200805","https://openalex.org/W2964228333","https://openalex.org/W3099206234","https://openalex.org/W3118608800","https://openalex.org/W4206821167","https://openalex.org/W4233962317","https://openalex.org/W4251828973","https://openalex.org/W4285719527","https://openalex.org/W4285789112","https://openalex.org/W4294371482","https://openalex.org/W4299545679","https://openalex.org/W4302345030","https://openalex.org/W6600336938","https://openalex.org/W6628107832","https://openalex.org/W6666761814"],"related_works":["https://openalex.org/W4289729660","https://openalex.org/W2887023857","https://openalex.org/W2950000202","https://openalex.org/W4321472478","https://openalex.org/W2034940213","https://openalex.org/W2798332276","https://openalex.org/W4200309432","https://openalex.org/W4387677131","https://openalex.org/W4286229642","https://openalex.org/W2929170389"],"abstract_inverted_index":{"With":[0],"the":[1,141,148,151,165,169,175,182,216,240,261],"proliferation":[2],"of":[3,15,34,48,144,153,184,193,227,236,252,258],"AI-based":[4],"applications":[5],"and":[6,36,62,162],"services,":[7],"there":[8],"are":[9,21],"strong":[10],"demands":[11],"for":[12,77,130,164],"efficient":[13],"processing":[14],"deep":[16],"neural":[17],"networks":[18],"(DNNs).":[19],"DNNs":[20,49],"known":[22],"to":[23,45,71,81,223,239,248],"be":[24],"both":[25,59],"compute-and":[26],"memory-intensive":[27],"as":[28],"they":[29],"require":[30],"a":[31,42,52,68,78,82,106,125,145,156,233,255],"tremendous":[32],"amount":[33],"computation":[35],"large":[37],"memory":[38,63],"space.":[39],"Quantization":[40],"is":[41,67,94,230],"popular":[43],"technique":[44],"boost":[46],"efficiency":[47],"by":[50,97],"representing":[51],"number":[53,75,87,146,166,194],"with":[54,89,232,254],"fewer":[55],"bits,":[56],"hence":[57],"reducing":[58],"computational":[60],"strength":[61],"footprint.":[64],"However,":[65],"it":[66],"difficult":[69],"task":[70],"find":[72],"an":[73,186,207,249],"optimal":[74],"representation":[76,143,158],"DNN":[79,108,188,200,204],"due":[80],"combinatorial":[83],"explosion":[84],"in":[85,215],"feasible":[86],"representations":[88],"varying":[90],"bit":[91,160],"widths,":[92],"which":[93],"only":[95,265],"exacerbated":[96],"layer-wise":[98],"optimization.":[99],"Besides,":[100],"existing":[101],"quantization":[102,128],"techniques":[103],"often":[104],"target":[105],"specific":[107],"framework":[109,129],"and/or":[110],"hardware":[111],"platform,":[112],"lacking":[113],"portability":[114],"across":[115],"various":[116],"execution":[117],"environments.":[118],"To":[119],"address":[120],"this,":[121],"we":[122],"propose":[123],"libnumber,":[124],"portable,":[126],"automatic":[127],"DNNs.":[131],"By":[132],"introducing":[133],"Number":[134],"abstract":[135],"data":[136],"type":[137],"(ADT),":[138],"libnumber":[139,154,179],"encapsulates":[140],"internal":[142],"from":[147,190],"user.":[149],"Then":[150],"auto-tuner":[152],"finds":[155],"compact":[157],"(type,":[159],"width,":[161],"bias)":[163],"that":[167],"minimizes":[168],"user-supplied":[170],"objective":[171],"function,":[172],"while":[173,263],"satisfying":[174],"accuracy":[176,229],"constraint.":[177],"Thus,":[178],"effectively":[180],"separates":[181],"concern":[183],"developing":[185],"effective":[187],"model":[189],"low-level":[191],"optimization":[192],"representation.":[195],"Our":[196],"evaluation":[197],"using":[198,242],"eleven":[199],"models":[201],"on":[202,219],"two":[203],"frameworks":[205],"targeting":[206],"FPGA":[208],"platform":[209],"demonstrates":[210],"over":[211,260],"8\u00d7":[212],"(7\u00d7)":[213],"reduction":[214,235],"parameter":[217],"size":[218],"average":[220],"when":[221],"up":[222],"7%":[224],"(1%)":[225],"loss":[226],"relative":[228],"tolerable,":[231],"maximum":[234,256],"16\u00d7,":[237],"compared":[238],"baseline":[241],"32-bit":[243],"floating-point":[244],"numbers.":[245],"This":[246],"leads":[247],"geomean":[250],"speedup":[251,257],"3.79\u00d7":[253],"12.77\u00d7":[259],"baseline,":[262],"requiring":[264],"minimal":[266],"programmer":[267],"effort.":[268]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":5},{"year":2021,"cited_by_count":6},{"year":2020,"cited_by_count":5},{"year":2019,"cited_by_count":4},{"year":2018,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
