{"id":"https://openalex.org/W7160888903","doi":"https://doi.org/10.48550/arxiv.2605.10886","title":"LoKA: Low-precision Kernel Applications for Recommendation Models At Scale","display_name":"LoKA: Low-precision Kernel Applications for Recommendation Models At Scale","publication_year":2026,"publication_date":"2026-05-11","ids":{"openalex":"https://openalex.org/W7160888903","doi":"https://doi.org/10.48550/arxiv.2605.10886"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.10886","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.10886","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.10886","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5135935499","display_name":"Liang Luo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Luo, Liang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078483147","display_name":"Yinbin Ma","orcid":"https://orcid.org/0000-0002-9511-6596"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ma, Yinbin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114402062","display_name":"Quanyu Zhu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhu, Quanyu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135978184","display_name":"Vasiliy Kuznetsov","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kuznetsov, Vasiliy","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135980075","display_name":"Yuxin Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Yuxin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135984158","display_name":"Jian Jiao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jiao, Jian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008163714","display_name":"Jiecao Yu","orcid":"https://orcid.org/0000-0003-2085-0312"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yu, Jiecao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047533043","display_name":"Buyun Zhang","orcid":"https://orcid.org/0009-0007-9053-4661"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Buyun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5073055431","display_name":"Tongyi Tang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tang, Tongyi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101806339","display_name":"Xiaohan Wei","orcid":"https://orcid.org/0000-0001-9997-0469"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wei, Xiaohan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135958259","display_name":"Yanli Zhao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Yanli","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135958296","display_name":"Zeliang Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Zeliang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135977557","display_name":"Yuchen Hao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hao, Yuchen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135928294","display_name":"Venkatesh Ranganathan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ranganathan, Venkatesh","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135914779","display_name":"Sandeep Parab","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Parab, Sandeep","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135992860","display_name":"Yantao Yao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yao, Yantao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066701229","display_name":"M. Yu. Naumov","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Naumov, Maxim","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135917154","display_name":"Chunzhi Yang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Chunzhi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135986692","display_name":"Shen Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Shen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007535563","display_name":"Ellie Wen","orcid":"https://orcid.org/0000-0001-8229-2294"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wen, Ellie","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135999623","display_name":"Wenlin Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Wenlin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050340255","display_name":"Santanu Kolay","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kolay, Santanu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5070094618","display_name":"Chunqiang Tang","orcid":"https://orcid.org/0009-0004-0133-4800"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tang, Chunqiang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":23,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.2003999948501587,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.2003999948501587,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.09669999778270721,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14347","display_name":"Big Data and Digital Economy","score":0.0625,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.8046000003814697},{"id":"https://openalex.org/keywords/kernel","display_name":"Kernel (algebra)","score":0.7577999830245972},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.6434000134468079},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5544999837875366},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.5331000089645386},{"id":"https://openalex.org/keywords/stability","display_name":"Stability (learning theory)","score":0.4562999904155731},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.4375999867916107}],"concepts":[{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.8046000003814697},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.7577999830245972},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6636999845504761},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.6434000134468079},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5544999837875366},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.5331000089645386},{"id":"https://openalex.org/C112972136","wikidata":"https://www.wikidata.org/wiki/Q7595718","display_name":"Stability (learning theory)","level":2,"score":0.4562999904155731},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.4375999867916107},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4278999865055084},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4052000045776367},{"id":"https://openalex.org/C122280245","wikidata":"https://www.wikidata.org/wiki/Q620622","display_name":"Kernel method","level":3,"score":0.3646000027656555},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.35120001435279846},{"id":"https://openalex.org/C2989134064","wikidata":"https://www.wikidata.org/wiki/Q288510","display_name":"Execution time","level":2,"score":0.34700000286102295},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.33640000224113464},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3215999901294708},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.2874000072479248},{"id":"https://openalex.org/C2780009758","wikidata":"https://www.wikidata.org/wiki/Q6804172","display_name":"Measure (data warehouse)","level":2,"score":0.2802000045776367},{"id":"https://openalex.org/C71134354","wikidata":"https://www.wikidata.org/wiki/Q458825","display_name":"Kernel density estimation","level":3,"score":0.26980000734329224},{"id":"https://openalex.org/C106487976","wikidata":"https://www.wikidata.org/wiki/Q685816","display_name":"Matrix (chemical analysis)","level":2,"score":0.2637999951839447}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.10886","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.10886","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.10886","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.10886","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Recent":[0],"GPU":[1],"generations":[2],"deliver":[3],"significantly":[4],"higher":[5],"FLOPs":[6],"using":[7],"lower-precision":[8],"arithmetic,":[9],"such":[10],"as":[11],"FP8.":[12,92,192],"While":[13],"successfully":[14,90],"applied":[15],"to":[16,55,69,89,114,126,137,206],"large":[17,24],"language":[18],"models":[19,26],"(LLMs),":[20],"its":[21],"adoption":[22],"in":[23,49],"recommendation":[25],"(LRMs)":[27],"has":[28],"been":[29],"limited.":[30],"This":[31,161],"is":[32,87,119,130,144,176,195],"because":[33],"LRMs":[34,56,106],"are":[35,67],"numerically":[36],"sensitive,":[37],"dominated":[38],"by":[39,45,77],"small":[40],"matrix":[41],"multiplications":[42],"(GEMMs)":[43],"followed":[44],"normalization,":[46],"and":[47,61,72,132,154,157,165,168,188],"trained":[48],"communication-intensive":[50],"environments.":[51],"Applying":[52],"FP8":[53,80,103,172,210],"directly":[54],"often":[57],"degrades":[58],"model":[59,122,181],"quality":[60],"prolongs":[62],"training":[63],"time.":[64],"These":[65],"challenges":[66],"inherent":[68],"LRM":[70],"workloads":[71],"cannot":[73],"be":[74],"resolved":[75],"merely":[76],"introducing":[78],"better":[79],"kernels.":[81],"Instead,":[82],"a":[83,99,145,177,196],"system-model":[84],"co-design":[85,121],"approach":[86],"needed":[88],"integrate":[91],"We":[93],"present":[94],"LoKA":[95,142,174,193,204],"(Low-precision":[96],"Kernel":[97],"Applications),":[98],"framework":[100],"that":[101,151,183,198,212],"makes":[102],"practical":[104],"for":[105,171],"through":[107],"three":[108],"principles:":[109],"profile":[110],"under":[111],"realistic":[112],"distributions":[113],"know":[115],"where":[116,128],"low":[117],"precision":[118],"safe,":[120,131],"components":[123],"with":[124,191],"hardware":[125],"expand":[127],"it":[129],"orchestrate":[133],"across":[134],"kernel":[135,211],"libraries":[136],"maximize":[138],"the":[139,200,208,214],"gains.":[140],"Concretely,":[141],"Probe":[143,205],"statistically":[146],"grounded,":[147],"online":[148],"benchmarking":[149],"method":[150],"learns":[152],"activation":[153],"weight":[155],"statistics,":[156],"quantifies":[158],"per-layer":[159],"errors.":[160],"process":[162],"pinpoints":[163],"safe":[164],"unsafe,":[166],"fast":[167],"slow":[169],"sites":[170],"adoption.":[173],"Mods":[175],"set":[178],"of":[179],"reusable":[180],"adaptations":[182],"improve":[184],"both":[185],"numerical":[186],"stability":[187],"execution":[189],"efficiency":[190],"Dispatch":[194],"runtime":[197],"leverages":[199],"statistical":[201],"insights":[202],"from":[203],"select":[207],"fastest":[209],"satisfies":[213],"accuracy":[215],"requirements.":[216]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-13T00:00:00"}
