{"id":"https://openalex.org/W4379933301","doi":"https://doi.org/10.1145/3580305.3599897","title":"Revisiting Neural Retrieval on Accelerators","display_name":"Revisiting Neural Retrieval on Accelerators","publication_year":2023,"publication_date":"2023-08-04","ids":{"openalex":"https://openalex.org/W4379933301","doi":"https://doi.org/10.1145/3580305.3599897"},"language":"en","primary_location":{"id":"doi:10.1145/3580305.3599897","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3580305.3599897","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3580305.3599897","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 29th ACM SIGKDD Conference on Knowledge Discovery and Data Mining","raw_type":"proceedings-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3580305.3599897","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100349821","display_name":"Jiaqi Zhai","orcid":"https://orcid.org/0009-0004-7279-3318"},"institutions":[{"id":"https://openalex.org/I4210114444","display_name":"Meta (United States)","ror":"https://ror.org/01zbnvs85","country_code":"US","type":"company","lineage":["https://openalex.org/I4210114444"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Jiaqi Zhai","raw_affiliation_strings":["Meta Platforms, Inc., Menlo Park, CA, USA"],"affiliations":[{"raw_affiliation_string":"Meta Platforms, Inc., Menlo Park, CA, USA","institution_ids":["https://openalex.org/I4210114444"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004289205","display_name":"Z. Gong","orcid":"https://orcid.org/0009-0004-1761-7530"},"institutions":[{"id":"https://openalex.org/I4210114444","display_name":"Meta (United States)","ror":"https://ror.org/01zbnvs85","country_code":"US","type":"company","lineage":["https://openalex.org/I4210114444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zhaojie Gong","raw_affiliation_strings":["Meta Platforms, Inc., Menlo Park, CA, USA"],"affiliations":[{"raw_affiliation_string":"Meta Platforms, Inc., Menlo Park, CA, USA","institution_ids":["https://openalex.org/I4210114444"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100741371","display_name":"Yueming Wang","orcid":"https://orcid.org/0009-0003-3581-8910"},"institutions":[{"id":"https://openalex.org/I4210114444","display_name":"Meta (United States)","ror":"https://ror.org/01zbnvs85","country_code":"US","type":"company","lineage":["https://openalex.org/I4210114444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yueming Wang","raw_affiliation_strings":["Meta Platforms, Inc., Menlo Park, CA, USA"],"affiliations":[{"raw_affiliation_string":"Meta Platforms, Inc., Menlo Park, CA, USA","institution_ids":["https://openalex.org/I4210114444"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101886784","display_name":"Xiao Sun","orcid":"https://orcid.org/0000-0002-8385-7020"},"institutions":[{"id":"https://openalex.org/I4210114444","display_name":"Meta (United States)","ror":"https://ror.org/01zbnvs85","country_code":"US","type":"company","lineage":["https://openalex.org/I4210114444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xiao Sun","raw_affiliation_strings":["Meta Platforms, Inc., Menlo Park, CA, USA"],"affiliations":[{"raw_affiliation_string":"Meta Platforms, Inc., Menlo Park, CA, USA","institution_ids":["https://openalex.org/I4210114444"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100343287","display_name":"Yan Zheng","orcid":"https://orcid.org/0000-0002-9754-9264"},"institutions":[{"id":"https://openalex.org/I4210114444","display_name":"Meta (United States)","ror":"https://ror.org/01zbnvs85","country_code":"US","type":"company","lineage":["https://openalex.org/I4210114444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zheng Yan","raw_affiliation_strings":["Meta Platforms, Inc., Menlo Park, CA, USA"],"affiliations":[{"raw_affiliation_string":"Meta Platforms, Inc., Menlo Park, CA, USA","institution_ids":["https://openalex.org/I4210114444"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100324323","display_name":"Fu Li","orcid":"https://orcid.org/0009-0004-1141-0870"},"institutions":[{"id":"https://openalex.org/I4210114444","display_name":"Meta (United States)","ror":"https://ror.org/01zbnvs85","country_code":"US","type":"company","lineage":["https://openalex.org/I4210114444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Fu Li","raw_affiliation_strings":["Meta Platforms, Inc., Menlo Park, CA, USA"],"affiliations":[{"raw_affiliation_string":"Meta Platforms, Inc., Menlo Park, CA, USA","institution_ids":["https://openalex.org/I4210114444"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100381490","display_name":"Xing Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210114444","display_name":"Meta (United States)","ror":"https://ror.org/01zbnvs85","country_code":"US","type":"company","lineage":["https://openalex.org/I4210114444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xing Liu","raw_affiliation_strings":["Meta Platforms, Inc., Menlo Park, CA, USA"],"affiliations":[{"raw_affiliation_string":"Meta Platforms, Inc., Menlo Park, CA, USA","institution_ids":["https://openalex.org/I4210114444"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5100349821"],"corresponding_institution_ids":["https://openalex.org/I4210114444"],"apc_list":null,"apc_paid":null,"fwci":8.1827,"has_fulltext":true,"cited_by_count":18,"citation_normalized_percentile":{"value":0.97494821,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"5520","last_page":"5531"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7743083238601685},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.6627546548843384},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.6187268495559692},{"id":"https://openalex.org/keywords/dot-product","display_name":"Dot product","score":0.6123409271240234},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.5774039030075073},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.5657511949539185},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.5217074751853943},{"id":"https://openalex.org/keywords/rank","display_name":"Rank (graph theory)","score":0.5141287446022034},{"id":"https://openalex.org/keywords/product","display_name":"Product (mathematics)","score":0.4817885756492615},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.46204277873039246},{"id":"https://openalex.org/keywords/latency","display_name":"Latency (audio)","score":0.43600893020629883},{"id":"https://openalex.org/keywords/popularity","display_name":"Popularity","score":0.4271582067012787},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3420169949531555},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.10291793942451477}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7743083238601685},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.6627546548843384},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.6187268495559692},{"id":"https://openalex.org/C32900221","wikidata":"https://www.wikidata.org/wiki/Q181365","display_name":"Dot product","level":2,"score":0.6123409271240234},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.5774039030075073},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.5657511949539185},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.5217074751853943},{"id":"https://openalex.org/C164226766","wikidata":"https://www.wikidata.org/wiki/Q7293202","display_name":"Rank (graph theory)","level":2,"score":0.5141287446022034},{"id":"https://openalex.org/C90673727","wikidata":"https://www.wikidata.org/wiki/Q901718","display_name":"Product (mathematics)","level":2,"score":0.4817885756492615},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.46204277873039246},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.43600893020629883},{"id":"https://openalex.org/C2780586970","wikidata":"https://www.wikidata.org/wiki/Q1357284","display_name":"Popularity","level":2,"score":0.4271582067012787},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3420169949531555},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.10291793942451477},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3580305.3599897","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3580305.3599897","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3580305.3599897","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 29th ACM SIGKDD Conference on Knowledge Discovery and Data Mining","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2306.04039","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2306.04039","pdf_url":"https://arxiv.org/pdf/2306.04039","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-sa","license_id":"https://openalex.org/licenses/cc-by-nc-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"doi:10.1145/3580305.3599897","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3580305.3599897","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3580305.3599897","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 29th ACM SIGKDD Conference on Knowledge Discovery and Data Mining","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4379933301.pdf","grobid_xml":"https://content.openalex.org/works/W4379933301.grobid-xml"},"referenced_works_count":62,"referenced_works":["https://openalex.org/W1522301498","https://openalex.org/W1852777783","https://openalex.org/W1978475816","https://openalex.org/W2002555321","https://openalex.org/W2010416066","https://openalex.org/W2093270024","https://openalex.org/W2137983211","https://openalex.org/W2150884987","https://openalex.org/W2163605009","https://openalex.org/W2169054943","https://openalex.org/W2171034893","https://openalex.org/W2295739661","https://openalex.org/W2475334473","https://openalex.org/W2512971201","https://openalex.org/W2548339725","https://openalex.org/W2548570154","https://openalex.org/W2559655401","https://openalex.org/W2597851033","https://openalex.org/W2604662567","https://openalex.org/W2605350416","https://openalex.org/W2605800822","https://openalex.org/W2606722458","https://openalex.org/W2610550445","https://openalex.org/W2723293840","https://openalex.org/W2763421725","https://openalex.org/W2770285862","https://openalex.org/W2783666221","https://openalex.org/W2896457183","https://openalex.org/W2917898551","https://openalex.org/W2937556626","https://openalex.org/W2962834855","https://openalex.org/W2963367478","https://openalex.org/W2963537482","https://openalex.org/W2963601856","https://openalex.org/W2963921057","https://openalex.org/W2964052347","https://openalex.org/W2964182926","https://openalex.org/W2970821029","https://openalex.org/W2972132054","https://openalex.org/W2982902390","https://openalex.org/W2982930951","https://openalex.org/W2984100107","https://openalex.org/W2987999026","https://openalex.org/W2998702515","https://openalex.org/W3023045848","https://openalex.org/W3034853385","https://openalex.org/W3036320503","https://openalex.org/W3037556679","https://openalex.org/W3088777230","https://openalex.org/W3098468692","https://openalex.org/W3106181667","https://openalex.org/W3116048950","https://openalex.org/W3118280765","https://openalex.org/W3153940464","https://openalex.org/W3171249018","https://openalex.org/W3185773347","https://openalex.org/W3201149665","https://openalex.org/W3209710210","https://openalex.org/W4250531751","https://openalex.org/W4283767616","https://openalex.org/W4297812065","https://openalex.org/W4385245566"],"related_works":["https://openalex.org/W2368605798","https://openalex.org/W2518037665","https://openalex.org/W2348524959","https://openalex.org/W2477036161","https://openalex.org/W2368049389","https://openalex.org/W2384861574","https://openalex.org/W4294565801","https://openalex.org/W2170801710","https://openalex.org/W2952704802","https://openalex.org/W2741781807"],"abstract_inverted_index":{"Retrieval":[0],"finds":[1],"a":[2,9,121,137,164],"small":[3],"number":[4],"of":[5,21,37,82,94,104,154],"relevant":[6],"candidates":[7],"from":[8],"large":[10,165],"corpus":[11,135],"for":[12],"information":[13],"retrieval":[14,22,75,123],"and":[15,67,79,111,174,183],"recommendation":[16,166],"applications.":[17],"A":[18],"key":[19],"component":[20],"is":[23,30,101],"to":[24,114,129,133,143,152,156],"model":[25],"(user,":[26,87,108],"item)":[27,88,109],"similarity,":[28],"which":[29,64,85],"commonly":[31,46],"represented":[32],"as":[33,48,90],"the":[34,115,179],"dot":[35,57],"product":[36],"two":[38],"learned":[39],"embeddings.":[40],"This":[41,98],"formulation":[42,100],"permits":[43],"efficient":[44],"inference,":[45],"known":[47],"Maximum":[49],"Inner":[50],"Product":[51],"Search":[52],"(MIPS).":[53],"Despite":[54],"its":[55],"popularity,":[56],"products":[58],"cannot":[59],"capture":[60],"complex":[61],"user-item":[62],"interactions,":[63,110],"are":[65,127],"multifaceted":[66],"likely":[68],"high":[69,106],"rank.":[70],"We":[71],"hence":[72],"examine":[73],"non-dot-product":[74],"settings":[76],"on":[77,136,163],"accelerators,":[78],"propose":[80],"mixture":[81],"logits":[83],"(MoL),":[84],"models":[86],"similarity":[89,96],"an":[91],"adaptive":[92],"composition":[93],"elementary":[95],"functions.":[97],"new":[99],"expressive,":[102],"capable":[103],"modeling":[105],"rank":[107],"further":[112],"generalizes":[113],"long":[116],"tail.":[117],"When":[118],"combined":[119],"with":[120,140],"hierarchical":[122],"strategy,":[124],"h-indexer,":[125],"we":[126],"able":[128],"scale":[130],"up":[131,155],"MoL":[132],"100M":[134],"single":[138],"GPU":[139],"latency":[141],"comparable":[142],"MIPS":[144],"baselines.":[145],"On":[146],"public":[147],"datasets,":[148],"our":[149],"approach":[150],"leads":[151],"uplifts":[153],"77.3%":[157],"in":[158],"hit":[159],"rate":[160],"(HR).":[161],"Experiments":[162],"surface":[167],"at":[168],"Meta":[169],"showed":[170],"strong":[171],"metric":[172],"gains":[173],"reduced":[175],"popularity":[176],"bias,":[177],"validating":[178],"proposed":[180],"approach's":[181],"performance":[182],"improved":[184],"generalization.":[185]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":12},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":1}],"updated_date":"2026-04-06T07:47:59.780226","created_date":"2025-10-10T00:00:00"}
