{"id":"https://openalex.org/W4410553153","doi":"https://doi.org/10.23919/date64628.2025.10993280","title":"Segment-Wise Accumulation: Low-Error Logarithmic Domain Computing for Efficient Large Language Model Inference","display_name":"Segment-Wise Accumulation: Low-Error Logarithmic Domain Computing for Efficient Large Language Model Inference","publication_year":2025,"publication_date":"2025-03-31","ids":{"openalex":"https://openalex.org/W4410553153","doi":"https://doi.org/10.23919/date64628.2025.10993280"},"language":"en","primary_location":{"id":"doi:10.23919/date64628.2025.10993280","is_oa":false,"landing_page_url":"https://doi.org/10.23919/date64628.2025.10993280","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 Design, Automation &amp;amp; Test in Europe Conference (DATE)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5059647894","display_name":"Xinkuang Geng","orcid":"https://orcid.org/0000-0003-3673-237X"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xinkuang Geng","raw_affiliation_strings":["Shanghai Jiao Tong University,Department of Micro-Nano Electronics,Shanghai,China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University,Department of Micro-Nano Electronics,Shanghai,China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101497811","display_name":"Yunjie Lu","orcid":"https://orcid.org/0000-0003-3143-3581"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yunjie Lu","raw_affiliation_strings":["Shanghai Jiao Tong University,Department of Micro-Nano Electronics,Shanghai,China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University,Department of Micro-Nano Electronics,Shanghai,China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100460715","display_name":"Hui Wang","orcid":"https://orcid.org/0000-0001-9618-0955"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hui Wang","raw_affiliation_strings":["Shanghai Jiao Tong University,Department of Micro-Nano Electronics,Shanghai,China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University,Department of Micro-Nano Electronics,Shanghai,China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5019717600","display_name":"Honglan Jiang","orcid":"https://orcid.org/0000-0003-3705-4240"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Honglan Jiang","raw_affiliation_strings":["Shanghai Jiao Tong University,Department of Micro-Nano Electronics,Shanghai,China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University,Department of Micro-Nano Electronics,Shanghai,China","institution_ids":["https://openalex.org/I183067930"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5059647894"],"corresponding_institution_ids":["https://openalex.org/I183067930"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.05633698,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"7"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9876999855041504,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9876999855041504,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9527000188827515,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7545769214630127},{"id":"https://openalex.org/keywords/logarithm","display_name":"Logarithm","score":0.7334437966346741},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.6739257574081421},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.48146072030067444},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.4610174894332886},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.42225009202957153},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.39538607001304626},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.27747589349746704},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.15244603157043457}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7545769214630127},{"id":"https://openalex.org/C39927690","wikidata":"https://www.wikidata.org/wiki/Q11197","display_name":"Logarithm","level":2,"score":0.7334437966346741},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.6739257574081421},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.48146072030067444},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4610174894332886},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.42225009202957153},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.39538607001304626},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.27747589349746704},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.15244603157043457},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.23919/date64628.2025.10993280","is_oa":false,"landing_page_url":"https://doi.org/10.23919/date64628.2025.10993280","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 Design, Automation &amp;amp; Test in Europe Conference (DATE)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G8355552838","display_name":null,"funder_award_id":"62374108","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":17,"referenced_works":["https://openalex.org/W2045146697","https://openalex.org/W2052942864","https://openalex.org/W2053987390","https://openalex.org/W2111013824","https://openalex.org/W2165689099","https://openalex.org/W2442974303","https://openalex.org/W2694935213","https://openalex.org/W2899818272","https://openalex.org/W3081943686","https://openalex.org/W4285264221","https://openalex.org/W4385245566","https://openalex.org/W4399487307","https://openalex.org/W6756007670","https://openalex.org/W6796815506","https://openalex.org/W6811340617","https://openalex.org/W6847478871","https://openalex.org/W6854866820"],"related_works":["https://openalex.org/W2055243143","https://openalex.org/W2046736294","https://openalex.org/W4401442391","https://openalex.org/W2980815195","https://openalex.org/W48199998","https://openalex.org/W1519526186","https://openalex.org/W2260200182","https://openalex.org/W4293584968","https://openalex.org/W2384758770","https://openalex.org/W2032964960"],"abstract_inverted_index":{"Logarithmic":[0],"domain":[1,166],"computing":[2],"(LDC)":[3],"has":[4],"great":[5],"potential":[6],"for":[7,89],"reducing":[8],"quantization":[9],"errors":[10,53],"and":[11,184],"computational":[12],"complexity":[13],"in":[14,32,55,78,104,123,153,160,182,186],"Large":[15],"Language":[16],"Models":[17],"(LLMs).":[18],"While":[19],"logarithmic":[20,41,169],"multiplication":[21],"can":[22],"be":[23],"efficiently":[24],"implemented":[25],"using":[26],"fixed-point":[27],"addition,":[28,68],"the":[29,38,52,79,85,93,97,132,175],"primary":[30],"challenge":[31],"multiply-accumulate":[33],"(MAC)":[34],"operations":[35],"is":[36,73],"balancing":[37],"precision":[39,133],"of":[40,51,134,180],"adders":[42],"with":[43,84],"their":[44],"hardware":[45,106,127,143],"overhead.":[46,107],"Through":[47],"a":[48,69,141,168],"detailed":[49],"analysis":[50],"inherent":[54],"LDC-based":[56],"LLMs,":[57,124],"we":[58],"propose":[59],"segment-wise":[60],"accumulation":[61,86],"(SWA)":[62],"to":[63,75,119,164],"mitigate":[64],"these":[65],"errors.":[66],"In":[67],"processing":[70,170],"element":[71,171],"(PE)":[72],"introduced":[74],"enable":[76],"SWA":[77,95,113,177],"systolic":[80],"array":[81,172],"architecture.":[82],"Compared":[83],"scheme":[87],"devised":[88],"enhancing":[90],"floating-point":[91],"computing,":[92,167],"proposed":[94,176],"facilitates":[96],"integration":[98],"into":[99],"existing":[100],"accelerator":[101],"architectures,":[102],"resulting":[103],"lower":[105,142],"The":[108],"experimental":[109],"results":[110],"show":[111],"that":[112],"allows":[114],"LDC":[115],"under":[116],"low-precision":[117],"configurations":[118],"achieve":[120],"remarkable":[121],"accuracy":[122,155],"demonstrating":[125],"higher":[126,190],"efficiency":[128],"than":[129,145,150],"merely":[130],"increasing":[131],"individual":[135],"computations.":[136],"Our":[137],"method,":[138],"while":[139,188],"maintaining":[140],"overhead":[144],"traditional":[146],"LDC,":[147],"achieves":[148],"more":[149],"13.9%":[151],"improvement":[152],"average":[154],"across":[156],"multiple":[157],"zero-shot":[158],"benchmarks":[159],"LLAMA-2-7B.":[161],"Furthermore,":[162],"compared":[163],"integer":[165],"based":[173],"on":[174],"yields":[178],"reductions":[179],"24.6%":[181],"area":[183],"42.3%":[185],"power,":[187],"achieving":[189],"accuracy.":[191]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
