{"id":"https://openalex.org/W4220884018","doi":"https://doi.org/10.1145/3492321.3519554","title":"Fleche","display_name":"Fleche","publication_year":2022,"publication_date":"2022-03-28","ids":{"openalex":"https://openalex.org/W4220884018","doi":"https://doi.org/10.1145/3492321.3519554"},"language":"en","primary_location":{"id":"doi:10.1145/3492321.3519554","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3492321.3519554","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3492321.3519554","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Seventeenth European Conference on Computer Systems","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3492321.3519554","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101139637","display_name":"Minhui Xie","orcid":"https://orcid.org/0000-0001-6684-8336"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Minhui Xie","raw_affiliation_strings":["Tsinghua University"],"affiliations":[{"raw_affiliation_string":"Tsinghua University","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052095173","display_name":"Youyou Lu","orcid":"https://orcid.org/0000-0002-6214-5390"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Youyou Lu","raw_affiliation_strings":["Tsinghua University"],"affiliations":[{"raw_affiliation_string":"Tsinghua University","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090269605","display_name":"Jiazhen Lin","orcid":"https://orcid.org/0009-0004-9377-2460"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiazhen Lin","raw_affiliation_strings":["Tsinghua University"],"affiliations":[{"raw_affiliation_string":"Tsinghua University","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100434855","display_name":"Qing Wang","orcid":"https://orcid.org/0000-0002-7102-243X"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qing Wang","raw_affiliation_strings":["Tsinghua University"],"affiliations":[{"raw_affiliation_string":"Tsinghua University","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035259866","display_name":"Jian Gao","orcid":"https://orcid.org/0000-0002-0994-3430"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jian Gao","raw_affiliation_strings":["Tsinghua University"],"affiliations":[{"raw_affiliation_string":"Tsinghua University","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046958624","display_name":"Kai Ren","orcid":"https://orcid.org/0000-0002-9312-9705"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kai Ren","raw_affiliation_strings":["Kuaishou"],"affiliations":[{"raw_affiliation_string":"Kuaishou","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101740783","display_name":"Jiwu Shu","orcid":"https://orcid.org/0000-0002-7362-2789"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jiwu Shu","raw_affiliation_strings":["Kuaishou"],"affiliations":[{"raw_affiliation_string":"Kuaishou","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5101139637"],"corresponding_institution_ids":["https://openalex.org/I99065089"],"apc_list":null,"apc_paid":null,"fwci":2.6398,"has_fulltext":true,"cited_by_count":20,"citation_normalized_percentile":{"value":0.9100459,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"402","last_page":"416"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11478","display_name":"Caching and Content Delivery","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8304311633110046},{"id":"https://openalex.org/keywords/cache","display_name":"Cache","score":0.8196672201156616},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.6413699388504028},{"id":"https://openalex.org/keywords/kernel","display_name":"Kernel (algebra)","score":0.6194460988044739},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.5466658473014832},{"id":"https://openalex.org/keywords/cache-algorithms","display_name":"Cache algorithms","score":0.5000894069671631},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.4921959936618805},{"id":"https://openalex.org/keywords/cache-invalidation","display_name":"Cache invalidation","score":0.4430113434791565},{"id":"https://openalex.org/keywords/cache-coloring","display_name":"Cache coloring","score":0.43684232234954834},{"id":"https://openalex.org/keywords/cache-oblivious-algorithm","display_name":"Cache-oblivious algorithm","score":0.4327140748500824},{"id":"https://openalex.org/keywords/throughput","display_name":"Throughput","score":0.4307194948196411},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.4301775097846985},{"id":"https://openalex.org/keywords/cpu-cache","display_name":"CPU cache","score":0.38934019207954407},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.21840029954910278},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.14050811529159546}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8304311633110046},{"id":"https://openalex.org/C115537543","wikidata":"https://www.wikidata.org/wiki/Q165596","display_name":"Cache","level":2,"score":0.8196672201156616},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6413699388504028},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.6194460988044739},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.5466658473014832},{"id":"https://openalex.org/C38556500","wikidata":"https://www.wikidata.org/wiki/Q13404475","display_name":"Cache algorithms","level":4,"score":0.5000894069671631},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.4921959936618805},{"id":"https://openalex.org/C25536678","wikidata":"https://www.wikidata.org/wiki/Q5015977","display_name":"Cache invalidation","level":5,"score":0.4430113434791565},{"id":"https://openalex.org/C201148951","wikidata":"https://www.wikidata.org/wiki/Q5015976","display_name":"Cache coloring","level":4,"score":0.43684232234954834},{"id":"https://openalex.org/C59687516","wikidata":"https://www.wikidata.org/wiki/Q5015938","display_name":"Cache-oblivious algorithm","level":5,"score":0.4327140748500824},{"id":"https://openalex.org/C157764524","wikidata":"https://www.wikidata.org/wiki/Q1383412","display_name":"Throughput","level":3,"score":0.4307194948196411},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.4301775097846985},{"id":"https://openalex.org/C189783530","wikidata":"https://www.wikidata.org/wiki/Q352090","display_name":"CPU cache","level":3,"score":0.38934019207954407},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.21840029954910278},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.14050811529159546},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C555944384","wikidata":"https://www.wikidata.org/wiki/Q249","display_name":"Wireless","level":2,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3492321.3519554","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3492321.3519554","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3492321.3519554","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Seventeenth European Conference on Computer Systems","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3492321.3519554","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3492321.3519554","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3492321.3519554","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Seventeenth European Conference on Computer Systems","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1124125120","display_name":null,"funder_award_id":"62022051","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2087396116","display_name":null,"funder_award_id":"China","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3085993365","display_name":null,"funder_award_id":"(Grant No.","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G323530312","display_name":null,"funder_award_id":"6183201","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3317480652","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3472539505","display_name":null,"funder_award_id":"202205","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G391238517","display_name":null,"funder_award_id":", and","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5249178904","display_name":null,"funder_award_id":"Grant No. 6","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5805579215","display_name":null,"funder_award_id":"61832011","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5994120800","display_name":null,"funder_award_id":"Natural","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7726157001","display_name":null,"funder_award_id":"Grant No.","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8281162173","display_name":null,"funder_award_id":"62022051, 61832011","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4220884018.pdf","grobid_xml":"https://content.openalex.org/works/W4220884018.grobid-xml"},"referenced_works_count":22,"referenced_works":["https://openalex.org/W1493774699","https://openalex.org/W1966831051","https://openalex.org/W2054141820","https://openalex.org/W2060758175","https://openalex.org/W2074694452","https://openalex.org/W2147657366","https://openalex.org/W2157825442","https://openalex.org/W2263483768","https://openalex.org/W2475334473","https://openalex.org/W2548570154","https://openalex.org/W2605350416","https://openalex.org/W2723293840","https://openalex.org/W2793768763","https://openalex.org/W2898085636","https://openalex.org/W2962745591","https://openalex.org/W2964064024","https://openalex.org/W2964182926","https://openalex.org/W2984020950","https://openalex.org/W3101704389","https://openalex.org/W3104030692","https://openalex.org/W3153887672","https://openalex.org/W3166863226"],"related_works":["https://openalex.org/W2098406302","https://openalex.org/W2538519144","https://openalex.org/W2121191383","https://openalex.org/W2076114130","https://openalex.org/W1584415117","https://openalex.org/W2046128376","https://openalex.org/W1863436361","https://openalex.org/W1860107648","https://openalex.org/W57688818","https://openalex.org/W1965891727"],"abstract_inverted_index":{"Deep":[0],"learning":[1],"based":[2],"models":[3],"have":[4],"dominated":[5],"current":[6],"production":[7],"recommendation":[8],"systems.":[9],"However,":[10],"the":[11,39,43,83,99,113,128,134],"gap":[12],"between":[13],"CPU-side":[14],"DRAM":[15],"data":[16],"accessing":[17],"and":[18,87,107,143],"GPU":[19,51],"processing":[20],"still":[21],"impedes":[22],"their":[23],"inference":[24,151],"performance.":[25],"GPU-resident":[26,68],"cache":[27,42,61,75,85,114],"can":[28],"bridge":[29],"this":[30,54],"gap,":[31],"but":[32],"we":[33,56,110],"find":[34],"that":[35,125],"existing":[36],"systems":[37],"leave":[38],"benefits":[40],"to":[41,81,97,146],"embedding":[44,69,79,137],"table,":[45],"a":[46,59],"huge":[47],"sparse":[48],"structure,":[49],"on":[50],"unexploited.":[52],"In":[53],"paper,":[55],"present":[57],"Fleche,":[58],"holistic":[60],"scheme":[62],"with":[63,121,127],"detailed":[64],"designs":[65],"for":[66,77,117],"efficient":[67],"caching.":[70],"Fleche":[71,131],"(1)":[72],"uses":[73],"one":[74,94],"backend":[76],"all":[78],"tables":[80],"improve":[82],"total":[84],"utilization,":[86],"(2)":[88],"merges":[89],"small":[90],"kernel":[91,102,105],"calls":[92],"into":[93],"unitary":[95],"call":[96],"reduce":[98],"overhead":[100],"of":[101,136,149],"maintenance":[103],"(e.g.,":[104],"launching":[106],"synchronizing).":[108],"Furthermore,":[109],"carefully":[111],"design":[112],"query":[115],"workflow":[116],"finer-grain":[118],"parallelism.":[119],"Evaluations":[120],"real-world":[122],"datasets":[123],"show":[124],"compared":[126],"prior":[129],"art,":[130],"significantly":[132],"improves":[133],"throughput":[135],"layer":[138],"by":[139],"2.0":[140],"--":[141],"5.4\u00d7,":[142],"gets":[144],"up":[145],"2.4\u00d7":[147],"speedup":[148],"end-to-end":[150],"throughput.":[152]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":7},{"year":2024,"cited_by_count":6},{"year":2023,"cited_by_count":6}],"updated_date":"2026-04-02T15:55:50.835912","created_date":"2022-04-03T00:00:00"}
