{"id":"https://openalex.org/W4210486199","doi":"https://doi.org/10.1145/3508390","title":"TAB: Unified and Optimized Ternary, Binary, and Mixed-precision Neural Network Inference on the Edge","display_name":"TAB: Unified and Optimized Ternary, Binary, and Mixed-precision Neural Network Inference on the Edge","publication_year":2022,"publication_date":"2022-01-26","ids":{"openalex":"https://openalex.org/W4210486199","doi":"https://doi.org/10.1145/3508390"},"language":"en","primary_location":{"id":"doi:10.1145/3508390","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3508390","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3508390","source":{"id":"https://openalex.org/S136160450","display_name":"ACM Transactions on Embedded Computing Systems","issn_l":"1539-9087","issn":["1539-9087","1558-3465"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Embedded Computing Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3508390","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5087479741","display_name":"Shien Zhu","orcid":"https://orcid.org/0000-0002-2094-7643"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":true,"raw_author_name":"Shien Zhu","raw_affiliation_strings":["Nanyang Technological University, Singapore"],"raw_orcid":"https://orcid.org/0000-0002-2094-7643","affiliations":[{"raw_affiliation_string":"Nanyang Technological University, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016725699","display_name":"Luan H. K. Duong","orcid":"https://orcid.org/0000-0003-4731-1896"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Luan H. K. Duong","raw_affiliation_strings":["Nanyang Technological University, Singapore"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Nanyang Technological University, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5038598144","display_name":"Weichen Liu","orcid":"https://orcid.org/0000-0001-9348-4662"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Weichen Liu","raw_affiliation_strings":["Nanyang Technological University, Singapore"],"raw_orcid":"https://orcid.org/0000-0001-9348-4662","affiliations":[{"raw_affiliation_string":"Nanyang Technological University, Singapore","institution_ids":["https://openalex.org/I172675005"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5087479741"],"corresponding_institution_ids":["https://openalex.org/I172675005"],"apc_list":null,"apc_paid":null,"fwci":0.8122,"has_fulltext":true,"cited_by_count":9,"citation_normalized_percentile":{"value":0.71791597,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":"21","issue":"5","first_page":"1","last_page":"26"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12702","display_name":"Brain Tumor Detection and Classification","score":0.9947999715805054,"subfield":{"id":"https://openalex.org/subfields/2808","display_name":"Neurology"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12676","display_name":"Machine Learning and ELM","score":0.9939000010490417,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/ternary-operation","display_name":"Ternary operation","score":0.6656290292739868},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6249402165412903},{"id":"https://openalex.org/keywords/binary-number","display_name":"Binary number","score":0.5249521732330322},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.5117371082305908},{"id":"https://openalex.org/keywords/bitwise-operation","display_name":"Bitwise operation","score":0.47639837861061096},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4425647556781769},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.409854531288147},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.23432418704032898},{"id":"https://openalex.org/keywords/arithmetic","display_name":"Arithmetic","score":0.23410093784332275},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.14350458979606628}],"concepts":[{"id":"https://openalex.org/C64452783","wikidata":"https://www.wikidata.org/wiki/Q1524945","display_name":"Ternary operation","level":2,"score":0.6656290292739868},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6249402165412903},{"id":"https://openalex.org/C48372109","wikidata":"https://www.wikidata.org/wiki/Q3913","display_name":"Binary number","level":2,"score":0.5249521732330322},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.5117371082305908},{"id":"https://openalex.org/C134765980","wikidata":"https://www.wikidata.org/wiki/Q879126","display_name":"Bitwise operation","level":2,"score":0.47639837861061096},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4425647556781769},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.409854531288147},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.23432418704032898},{"id":"https://openalex.org/C94375191","wikidata":"https://www.wikidata.org/wiki/Q11205","display_name":"Arithmetic","level":1,"score":0.23410093784332275},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.14350458979606628},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3508390","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3508390","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3508390","source":{"id":"https://openalex.org/S136160450","display_name":"ACM Transactions on Embedded Computing Systems","issn_l":"1539-9087","issn":["1539-9087","1558-3465"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Embedded Computing Systems","raw_type":"journal-article"},{"id":"pmh:oai:dr.ntu.edu.sg:10356/155648","is_oa":false,"landing_page_url":"https://hdl.handle.net/10356/155648","pdf_url":null,"source":{"id":"https://openalex.org/S4306402609","display_name":"DR-NTU (Nanyang Technological University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I172675005","host_organization_name":"Nanyang Technological University","host_organization_lineage":["https://openalex.org/I172675005"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Journal Article"}],"best_oa_location":{"id":"doi:10.1145/3508390","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3508390","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3508390","source":{"id":"https://openalex.org/S136160450","display_name":"ACM Transactions on Embedded Computing Systems","issn_l":"1539-9087","issn":["1539-9087","1558-3465"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Embedded Computing Systems","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1482925484","display_name":null,"funder_award_id":"Tier 1","funder_id":"https://openalex.org/F4320320751","funder_display_name":"Ministry of Education - Singapore"},{"id":"https://openalex.org/G3048563442","display_name":null,"funder_award_id":"Tier 1","funder_id":"https://openalex.org/F4320320766","funder_display_name":"Nanyang Technological University"},{"id":"https://openalex.org/G5678059841","display_name":null,"funder_award_id":"NAP (M4082282), and SUG (M4082087)","funder_id":"https://openalex.org/F4320320766","funder_display_name":"Nanyang Technological University"},{"id":"https://openalex.org/G6854926366","display_name":null,"funder_award_id":"Tier 2","funder_id":"https://openalex.org/F4320320751","funder_display_name":"Ministry of Education - Singapore"},{"id":"https://openalex.org/G739051916","display_name":null,"funder_award_id":"M4082282","funder_id":"https://openalex.org/F4320320766","funder_display_name":"Nanyang Technological University"},{"id":"https://openalex.org/G7761738211","display_name":null,"funder_award_id":"MOE2019-T2-1-071, and MOE2019-T1-001-072","funder_id":"https://openalex.org/F4320320751","funder_display_name":"Ministry of Education - Singapore"},{"id":"https://openalex.org/G8867963434","display_name":null,"funder_award_id":"M4082087","funder_id":"https://openalex.org/F4320320766","funder_display_name":"Nanyang Technological University"}],"funders":[{"id":"https://openalex.org/F4320320751","display_name":"Ministry of Education - Singapore","ror":"https://ror.org/01kcva023"},{"id":"https://openalex.org/F4320320766","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302"},{"id":"https://openalex.org/F4320322724","display_name":"Ministry of Education, India","ror":"https://ror.org/048xjjh50"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4210486199.pdf","grobid_xml":"https://content.openalex.org/works/W4210486199.grobid-xml"},"referenced_works_count":44,"referenced_works":["https://openalex.org/W1863336885","https://openalex.org/W2079658918","https://openalex.org/W2300242332","https://openalex.org/W2469490737","https://openalex.org/W2499931820","https://openalex.org/W2618939455","https://openalex.org/W2786771851","https://openalex.org/W2884150179","https://openalex.org/W2886014761","https://openalex.org/W2887447938","https://openalex.org/W2896457183","https://openalex.org/W2896934366","https://openalex.org/W2903462692","https://openalex.org/W2954048742","https://openalex.org/W2962939807","https://openalex.org/W2963480671","https://openalex.org/W2963526839","https://openalex.org/W2982165597","https://openalex.org/W2995492582","https://openalex.org/W2997394738","https://openalex.org/W3008591352","https://openalex.org/W3017746288","https://openalex.org/W3026337110","https://openalex.org/W3034297393","https://openalex.org/W3034933748","https://openalex.org/W3034971973","https://openalex.org/W3035232708","https://openalex.org/W3036601975","https://openalex.org/W3128120039","https://openalex.org/W3135547017","https://openalex.org/W3137147200","https://openalex.org/W3151873305","https://openalex.org/W3173877717","https://openalex.org/W3174071941","https://openalex.org/W3184606595","https://openalex.org/W3211127556","https://openalex.org/W4214539264","https://openalex.org/W4233358539","https://openalex.org/W4287254789","https://openalex.org/W4288346545","https://openalex.org/W4295262505","https://openalex.org/W6693397755","https://openalex.org/W6763653508","https://openalex.org/W6782332983"],"related_works":["https://openalex.org/W1594590521","https://openalex.org/W2161073421","https://openalex.org/W2059661740","https://openalex.org/W4287750387","https://openalex.org/W3039944263","https://openalex.org/W2044964419","https://openalex.org/W2023587177","https://openalex.org/W2732529307","https://openalex.org/W2993803155","https://openalex.org/W4321521078"],"abstract_inverted_index":{"Ternary":[0,6],"Neural":[1,17],"Networks":[2,8,18],"(TNNs)":[3],"and":[4,24,35,43,55,60,92,98,112,119,132,151,164,182,225,237,250,264,273,285],"mixed-precision":[5,94,120],"Binary":[7,16],"(TBNs)":[9],"have":[10,29],"demonstrated":[11],"higher":[12],"accuracy":[13,32],"compared":[14,255],"to":[15,87,172,193,247,270,282],"(BNNs)":[19],"while":[20,293],"providing":[21],"fast,":[22],"low-power,":[23],"memory-efficient":[25],"inference.":[26],"Related":[27],"works":[28,64],"improved":[30],"the":[31,53,66,162,168,174,180,213,295],"of":[33,167],"TNNs":[34,59],"TBNs,":[36],"but":[37],"overlooked":[38],"their":[39],"optimizations":[40],"on":[41,138,189,235,291],"CPU":[42,236],"GPU":[44,238],"platforms.":[45,140],"First,":[46],"there":[47],"is":[48,101,209,280,299],"no":[49],"unified":[50,111,125],"encoding":[51],"for":[52,83,116,145,307],"binary":[54,99,150,183],"ternary":[56,84,97,152,169,181,215],"values":[57,85,100,170],"in":[58,71,75,266],"TBNs.":[61],"Second,":[62],"existing":[63,311],"store":[65],"2-bit":[67,81],"quantized":[68],"data":[69,129,158],"sequentially":[70],"32/64-bit":[72],"integers,":[73],"resulting":[74],"bit-extraction":[76],"overhead.":[77,177],"Last,":[78],"adopting":[79],"standard":[80],"multiplications":[82],"leads":[86],"a":[88,110,156,303],"complex":[89],"computation":[90],"pipeline,":[91],"efficient":[93,128],"multiplication":[95],"between":[96],"unavailable.":[102],"In":[103],"this":[104],"article,":[105],"we":[106],"propose":[107],"TAB":[108,123,267,298],"as":[109,212,220,228,275,277,302],"optimized":[113],"inference":[114],"method":[115,216],"ternary,":[117],"binary,":[118],"neural":[121],"networks.":[122],"includes":[124],"value":[126,147],"representation,":[127],"storage":[130,252],"scheme":[131],"novel":[133],"bitwise":[134,184],"dot":[135,185],"product":[136,186],"pipelines":[137,187],"CPU/GPU":[139],"We":[141,154,178],"adopt":[142],"signed":[143],"integers":[144],"consistent":[146],"representation":[148],"across":[149],"values.":[153],"introduce":[155],"bitwidth-last":[157],"format":[159],"that":[160,205,241],"stores":[161],"first":[163],"second":[165],"bits":[166],"separately":[171],"remove":[173],"bit":[175],"extraction":[176],"design":[179],"based":[188],"Gated-XOR":[190],"using":[191],"up":[192,246,269,281],"40%":[194],"fewer":[195],"operations":[196],"than":[197,289],"State-Of-The-Art":[198],"(SOTA)":[199],"methods.":[200],"Theoretical":[201],"speedup":[202,249],"analysis":[203],"shows":[204],"our":[206,242],"proposed":[207],"TAB-TNN":[208,243,279],"2.3\u00d7":[210],"fast":[211,219,227,276],"SOTA":[214],"RTN,":[217],"9.8\u00d7":[218],"8-bit":[221],"integer":[222],"quantization":[223],"(INT8),":[224],"39.4\u00d7":[226],"32-bit":[229],"full-precision":[230],"convolution":[231],"(FP32).":[232],"Experiment":[233],"results":[234],"platforms":[239],"show":[240],"has":[244],"achieved":[245],"34.6\u00d7":[248],"16\u00d7":[251],"size":[253],"reduction":[254],"with":[256,310],"FP32":[257],"layers.":[258],"TBN,":[259],"Binary-activation":[260],"Ternary-weight":[261],"Network":[262],"(BTN),":[263],"BNN":[265],"are":[268],"40.7\u00d7,":[271],"56.2\u00d7,":[272],"72.2\u00d7":[274],"FP32.":[278],"70.1%":[283],"faster":[284],"12.8%":[286],"more":[287],"power-efficient":[288],"RTN":[290],"Darknet-19":[292],"keeping":[294],"same":[296],"accuracy.":[297],"open":[300],"source":[301],"PyTorch":[304],"Extension":[305],"1":[306],"easy":[308],"integration":[309],"CNN":[312],"models.":[313]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":1}],"updated_date":"2026-05-19T08:33:51.333923","created_date":"2025-10-10T00:00:00"}
