{"id":"https://openalex.org/W7140316646","doi":"https://doi.org/10.48550/arxiv.2603.22325","title":"Hybrid Associative Memories","display_name":"Hybrid Associative Memories","publication_year":2026,"publication_date":"2026-03-20","ids":{"openalex":"https://openalex.org/W7140316646","doi":"https://doi.org/10.48550/arxiv.2603.22325"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.22325","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.22325","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.22325","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5130562396","display_name":"Leon Lufkin","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Lufkin, Leon","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052793754","display_name":"Tomas Figliolia","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Figliolia, Tom\u00e1s","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048239223","display_name":"Beren Millidge","orcid":"https://orcid.org/0000-0003-1872-5635"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Millidge, Beren","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5130564279","display_name":"Kamesh Krishnamurthy","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Krishnamurthy, Kamesh","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5130562396"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.32510000467300415,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.32510000467300415,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12808","display_name":"Ferroelectric and Negative Capacitance Devices","score":0.06279999762773514,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.05469999834895134,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/recurrent-neural-network","display_name":"Recurrent neural network","score":0.8166999816894531},{"id":"https://openalex.org/keywords/interleaving","display_name":"Interleaving","score":0.682699978351593},{"id":"https://openalex.org/keywords/recall","display_name":"Recall","score":0.548799991607666},{"id":"https://openalex.org/keywords/content-addressable-memory","display_name":"Content-addressable memory","score":0.5214999914169312},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.47290000319480896},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.45019999146461487},{"id":"https://openalex.org/keywords/associative-property","display_name":"Associative property","score":0.4478999972343445},{"id":"https://openalex.org/keywords/cache","display_name":"Cache","score":0.4007999897003174}],"concepts":[{"id":"https://openalex.org/C147168706","wikidata":"https://www.wikidata.org/wiki/Q1457734","display_name":"Recurrent neural network","level":3,"score":0.8166999816894531},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8068000078201294},{"id":"https://openalex.org/C28034677","wikidata":"https://www.wikidata.org/wiki/Q17092530","display_name":"Interleaving","level":2,"score":0.682699978351593},{"id":"https://openalex.org/C100660578","wikidata":"https://www.wikidata.org/wiki/Q18733","display_name":"Recall","level":2,"score":0.548799991607666},{"id":"https://openalex.org/C53442348","wikidata":"https://www.wikidata.org/wiki/Q745101","display_name":"Content-addressable memory","level":3,"score":0.5214999914169312},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5069000124931335},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.47290000319480896},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.45019999146461487},{"id":"https://openalex.org/C159423971","wikidata":"https://www.wikidata.org/wiki/Q177251","display_name":"Associative property","level":2,"score":0.4478999972343445},{"id":"https://openalex.org/C115537543","wikidata":"https://www.wikidata.org/wiki/Q165596","display_name":"Cache","level":2,"score":0.4007999897003174},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.3871000111103058},{"id":"https://openalex.org/C120620853","wikidata":"https://www.wikidata.org/wiki/Q506355","display_name":"Bidirectional associative memory","level":4,"score":0.3287000060081482},{"id":"https://openalex.org/C2778618852","wikidata":"https://www.wikidata.org/wiki/Q1128613","display_name":"Content-addressable storage","level":4,"score":0.32409998774528503},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.32089999318122864},{"id":"https://openalex.org/C82687282","wikidata":"https://www.wikidata.org/wiki/Q66221","display_name":"Auxiliary memory","level":2,"score":0.2994999885559082},{"id":"https://openalex.org/C2779602883","wikidata":"https://www.wikidata.org/wiki/Q15544750","display_name":"Memory architecture","level":2,"score":0.29739999771118164},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.2766999900341034},{"id":"https://openalex.org/C133488467","wikidata":"https://www.wikidata.org/wiki/Q6673524","display_name":"Long short term memory","level":4,"score":0.25929999351501465}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.22325","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.22325","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.22325","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.22325","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Recurrent":[0],"neural":[1],"networks":[2],"(RNNs)":[3],"and":[4,59,74,87,126,204,220],"self-attention":[5,125],"are":[6,79],"both":[7],"widely":[8],"used":[9],"sequence-mixing":[10],"layers":[11,62,165],"that":[12,146,188,209],"maintain":[13],"an":[14],"internal":[15],"memory.":[16],"However,":[17],"this":[18,189],"memory":[19,73],"is":[20,147,155],"constructed":[21],"using":[22],"two":[23],"orthogonal":[24,57],"mechanisms:":[25],"RNNs":[26,78,127,219],"compress":[27],"the":[28,51,68,117,133,136,150,157,170,179,193],"entire":[29,137],"past":[30,40],"into":[31],"a":[32,182,199],"fixed-size":[33],"state,":[34],"whereas":[35],"self-attention's":[36],"state":[37,45],"stores":[38],"every":[39],"time":[41],"step":[42],"growing":[43],"its":[44],"(the":[46],"KV":[47,171,194],"cache)":[48],"linearly":[49],"with":[50,144,181,202],"sequence":[52],"length.":[53],"This":[54],"results":[55],"in":[56,67],"strengths":[58],"weaknesses.":[60],"Self-attention":[61],"excel":[63],"at":[64,223],"retrieving":[65],"information":[66,145,160],"context":[69],"but":[70,82],"have":[71],"large":[72],"computational":[75,107],"costs,":[76],"while":[77,128,139],"more":[80],"efficient":[81],"degrade":[83],"over":[84],"longer":[85],"contexts":[86],"underperform":[88],"for":[89,149],"precise":[90],"recall":[91],"tasks.":[92],"Prior":[93],"work":[94],"combining":[95],"these":[96],"mechanisms":[97],"has":[98,198],"focused":[99],"primarily":[100],"on":[101],"naively":[102],"interleaving":[103],"them":[104],"to":[105,111,152,161,218],"reduce":[106],"cost":[108],"without":[109],"regard":[110],"their":[112,130],"complementary":[113],"mechanisms.":[114],"We":[115,186],"propose":[116],"Hybrid":[118],"Associative":[119],"Memory":[120],"(HAM)":[121],"layer,":[122],"which":[123,154,173],"combines":[124],"leveraging":[129],"individual":[131],"strengths:":[132],"RNN":[134,151],"compresses":[135],"sequence,":[138],"attention":[140],"supplements":[141],"it":[142],"*only*":[143],"difficult":[148],"predict,":[153],"hence":[156],"most":[158],"valuable":[159],"explicitly":[162],"store.":[163],"HAM":[164],"enable":[166],"data-dependent":[167],"growth":[168,196],"of":[169,192],"cache,":[172],"can":[174],"be":[175],"precisely":[176],"controlled":[177],"by":[178],"user":[180],"single,":[183],"continuous":[184],"threshold.":[185],"find":[187],"fine-grained":[190],"control":[191],"cache":[195],"rate":[197],"smooth":[200],"trade-off":[201],"loss":[203],"performance.":[205],"Empirically,":[206],"we":[207],"show":[208],"our":[210],"hybrid":[211],"architecture":[212],"offers":[213],"strong,":[214],"competitive":[215],"performance":[216],"relative":[217],"Transformers":[221],"even":[222],"substantially":[224],"lower":[225],"KV-cache":[226],"usage.":[227]},"counts_by_year":[],"updated_date":"2026-03-26T06:10:45.909354","created_date":"2026-03-26T00:00:00"}
