{"id":"https://openalex.org/W4396988516","doi":"https://doi.org/10.1145/3639856.3639878","title":"Hetero-Rec++: Modelling-based Robust and Optimal Deployment of Embeddings Recommendations","display_name":"Hetero-Rec++: Modelling-based Robust and Optimal Deployment of Embeddings Recommendations","publication_year":2023,"publication_date":"2023-10-25","ids":{"openalex":"https://openalex.org/W4396988516","doi":"https://doi.org/10.1145/3639856.3639878"},"language":"en","primary_location":{"id":"doi:10.1145/3639856.3639878","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3639856.3639878","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The Third International Conference on Artificial Intelligence and Machine Learning Systems","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5072133698","display_name":"Ashwin Krishnan","orcid":"https://orcid.org/0000-0002-8592-3132"},"institutions":[{"id":"https://openalex.org/I4210104194","display_name":"Tennessee Cancer Specialists","ror":"https://ror.org/01krbfc31","country_code":"US","type":"healthcare","lineage":["https://openalex.org/I4210104194"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ashwin Krishnan","raw_affiliation_strings":["TCS Research, IN"],"raw_orcid":"https://orcid.org/0000-0002-8592-3132","affiliations":[{"raw_affiliation_string":"TCS Research, IN","institution_ids":["https://openalex.org/I4210104194"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070564061","display_name":"Manoj Nambiar","orcid":"https://orcid.org/0000-0002-9001-0629"},"institutions":[{"id":"https://openalex.org/I4210104194","display_name":"Tennessee Cancer Specialists","ror":"https://ror.org/01krbfc31","country_code":"US","type":"healthcare","lineage":["https://openalex.org/I4210104194"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Manoj Nambiar","raw_affiliation_strings":["TCS, IN"],"raw_orcid":"https://orcid.org/0000-0002-9001-0629","affiliations":[{"raw_affiliation_string":"TCS, IN","institution_ids":["https://openalex.org/I4210104194"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5086400313","display_name":"Rekha Singhal","orcid":"https://orcid.org/0000-0002-3712-1784"},"institutions":[{"id":"https://openalex.org/I4210104194","display_name":"Tennessee Cancer Specialists","ror":"https://ror.org/01krbfc31","country_code":"US","type":"healthcare","lineage":["https://openalex.org/I4210104194"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Rekha Singhal","raw_affiliation_strings":["TCS, IN"],"raw_orcid":"https://orcid.org/0000-0002-3712-1784","affiliations":[{"raw_affiliation_string":"TCS, IN","institution_ids":["https://openalex.org/I4210104194"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.4314,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.74436812,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"9"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11478","display_name":"Caching and Content Delivery","score":0.994700014591217,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11165","display_name":"Image and Video Quality Assessment","score":0.9934999942779541,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8087173700332642},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.805996298789978},{"id":"https://openalex.org/keywords/latency","display_name":"Latency (audio)","score":0.6702569723129272},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.6492841839790344},{"id":"https://openalex.org/keywords/cas-latency","display_name":"CAS latency","score":0.5868165493011475},{"id":"https://openalex.org/keywords/field-programmable-gate-array","display_name":"Field-programmable gate array","score":0.5051320195198059},{"id":"https://openalex.org/keywords/heuristic","display_name":"Heuristic","score":0.4707636833190918},{"id":"https://openalex.org/keywords/dram","display_name":"Dram","score":0.4584166407585144},{"id":"https://openalex.org/keywords/software-deployment","display_name":"Software deployment","score":0.45049160718917847},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.40156108140945435},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.3256884813308716},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.3249443769454956},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2717387080192566},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.18984049558639526},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.08090391755104065}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8087173700332642},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.805996298789978},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.6702569723129272},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.6492841839790344},{"id":"https://openalex.org/C189930140","wikidata":"https://www.wikidata.org/wiki/Q1112878","display_name":"CAS latency","level":4,"score":0.5868165493011475},{"id":"https://openalex.org/C42935608","wikidata":"https://www.wikidata.org/wiki/Q190411","display_name":"Field-programmable gate array","level":2,"score":0.5051320195198059},{"id":"https://openalex.org/C173801870","wikidata":"https://www.wikidata.org/wiki/Q201413","display_name":"Heuristic","level":2,"score":0.4707636833190918},{"id":"https://openalex.org/C7366592","wikidata":"https://www.wikidata.org/wiki/Q1255620","display_name":"Dram","level":2,"score":0.4584166407585144},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.45049160718917847},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.40156108140945435},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.3256884813308716},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3249443769454956},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2717387080192566},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.18984049558639526},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.08090391755104065},{"id":"https://openalex.org/C98986596","wikidata":"https://www.wikidata.org/wiki/Q1143031","display_name":"Semiconductor memory","level":2,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C100800780","wikidata":"https://www.wikidata.org/wiki/Q1175867","display_name":"Memory controller","level":3,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3639856.3639878","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3639856.3639878","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The Third International Conference on Artificial Intelligence and Machine Learning Systems","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":22,"referenced_works":["https://openalex.org/W2723293840","https://openalex.org/W2775287056","https://openalex.org/W2899457523","https://openalex.org/W2962745591","https://openalex.org/W2979719709","https://openalex.org/W3033065823","https://openalex.org/W3042495273","https://openalex.org/W3043433718","https://openalex.org/W3089344842","https://openalex.org/W3096737792","https://openalex.org/W3101707147","https://openalex.org/W3155243801","https://openalex.org/W3166863226","https://openalex.org/W3188766293","https://openalex.org/W3200211247","https://openalex.org/W3206393216","https://openalex.org/W4221074182","https://openalex.org/W4285361428","https://openalex.org/W4285703993","https://openalex.org/W4287643650","https://openalex.org/W4376852218","https://openalex.org/W4380881110"],"related_works":["https://openalex.org/W4293430534","https://openalex.org/W2342813629","https://openalex.org/W3150934690","https://openalex.org/W4297812927","https://openalex.org/W2335743642","https://openalex.org/W2800412005","https://openalex.org/W1976244802","https://openalex.org/W1992487929","https://openalex.org/W2083934844","https://openalex.org/W4386903460"],"abstract_inverted_index":{"Deep":[0],"Neural":[1],"Network":[2],"(DNN)-based":[3],"recommendation":[4],"models":[5,23],"(RMs)":[6],"are":[7,35],"widely":[8],"adopted":[9],"in":[10,57,72,119],"enterprise":[11],"applications":[12],"to":[13,20,37,53,62,84,89],"suggest":[14],"products,":[15],"videos,":[16],"tweets,":[17],"and":[18,34,94,107,126],"posts":[19],"users.":[21],"These":[22],"heavily":[24],"rely":[25],"on":[26,135],"embedding":[27,32,50,86,92],"tables,":[28,93],"which":[29],"contain":[30],"latent":[31],"vectors":[33],"accessed":[36,69],"evaluate":[38,95],"the":[39,49,64,80,96,121,129],"probability":[40],"of":[41,66,82,110],"user":[42],"interactions.":[43],"Recently":[44],"published,":[45],"Hetero-Rec":[46,83],"framework":[47],"leverages":[48],"access":[51],"history":[52],"allocate":[54],"storage":[55],"partitions":[56],"heterogeneous":[58,142],"memory":[59,143],"architecture,":[60],"aiming":[61],"maximize":[63],"chance":[65],"having":[67],"frequently":[68],"embeddings":[70],"available":[71],"faster":[73],"memory.":[74],"In":[75],"this":[76],"work,":[77],"we":[78,100,115],"extend":[79],"study":[81],"larger":[85],"tables":[87],"(up":[88],"350),":[90],"low-hot":[91],"end-to-end":[97],"speedups.":[98],"Consequently,":[99],"present":[101],"Hetro-Rec++":[102],"with":[103,141],"heuristic":[104],"based":[105],"pre-optimizer":[106],"advanced":[108],"formulation":[109],"optimizer\u2019s":[111],"cost":[112],"function.":[113],"Further,":[114],"demonstrate":[116],"its":[117],"effectiveness":[118],"reducing":[120],"embedding\u2019s":[122],"average":[123],"fetch":[124],"latency":[125,131],"hence,":[127],"improving":[128],"inference":[130],"for":[132],"RMs":[133],"deployed":[134],"Field":[136],"Programmable":[137],"Gate":[138],"Arrays":[139],"(FPGAs)":[140],"architectures.":[144]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
