{"id":"https://openalex.org/W7101582257","doi":"https://doi.org/10.48550/arxiv.2510.21908","title":"Enabling Robust In-Context Memory and Rapid Task Adaptation in Transformers with Hebbian and Gradient-Based Plasticity","display_name":"Enabling Robust In-Context Memory and Rapid Task Adaptation in Transformers with Hebbian and Gradient-Based Plasticity","publication_year":2025,"publication_date":"2025-10-24","ids":{"openalex":"https://openalex.org/W7101582257","doi":"https://doi.org/10.48550/arxiv.2510.21908"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2510.21908","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2510.21908","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2510.21908","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Chaudhary, Siddharth","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Chaudhary, Siddharth","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":true,"primary_topic":{"id":"https://openalex.org/T12660","display_name":"Plant Disease Management Techniques","score":0.12759999930858612,"subfield":{"id":"https://openalex.org/subfields/1110","display_name":"Plant Science"},"field":{"id":"https://openalex.org/fields/11","display_name":"Agricultural and Biological Sciences"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T12660","display_name":"Plant Disease Management Techniques","score":0.12759999930858612,"subfield":{"id":"https://openalex.org/subfields/1110","display_name":"Plant Science"},"field":{"id":"https://openalex.org/fields/11","display_name":"Agricultural and Biological Sciences"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10771","display_name":"Wound Healing and Treatments","score":0.09719999879598618,"subfield":{"id":"https://openalex.org/subfields/2742","display_name":"Rehabilitation"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T10729","display_name":"Electrospun Nanofibers in Biomedical Applications","score":0.09610000252723694,"subfield":{"id":"https://openalex.org/subfields/2502","display_name":"Biomaterials"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/hebbian-theory","display_name":"Hebbian theory","score":0.9721999764442444},{"id":"https://openalex.org/keywords/plasticity","display_name":"Plasticity","score":0.7853000164031982},{"id":"https://openalex.org/keywords/salient","display_name":"Salient","score":0.489300012588501},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.4790000021457672},{"id":"https://openalex.org/keywords/leabra","display_name":"Leabra","score":0.40380001068115234},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.37709999084472656},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.36419999599456787}],"concepts":[{"id":"https://openalex.org/C111437709","wikidata":"https://www.wikidata.org/wiki/Q1277874","display_name":"Hebbian theory","level":3,"score":0.9721999764442444},{"id":"https://openalex.org/C79186407","wikidata":"https://www.wikidata.org/wiki/Q472074","display_name":"Plasticity","level":2,"score":0.7853000164031982},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6265000104904175},{"id":"https://openalex.org/C2780719617","wikidata":"https://www.wikidata.org/wiki/Q1030752","display_name":"Salient","level":2,"score":0.489300012588501},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.4790000021457672},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4339999854564667},{"id":"https://openalex.org/C97108695","wikidata":"https://www.wikidata.org/wiki/Q6508265","display_name":"Leabra","level":5,"score":0.40380001068115234},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.37709999084472656},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.36419999599456787},{"id":"https://openalex.org/C98229152","wikidata":"https://www.wikidata.org/wiki/Q1551556","display_name":"Synaptic plasticity","level":3,"score":0.3499999940395355},{"id":"https://openalex.org/C2779127903","wikidata":"https://www.wikidata.org/wiki/Q6510194","display_name":"Learning rule","level":3,"score":0.3366999924182892},{"id":"https://openalex.org/C159919123","wikidata":"https://www.wikidata.org/wiki/Q7577157","display_name":"Spike-timing-dependent plasticity","level":4,"score":0.329800009727478},{"id":"https://openalex.org/C86878447","wikidata":"https://www.wikidata.org/wiki/Q5266812","display_name":"Developmental plasticity","level":3,"score":0.32919999957084656},{"id":"https://openalex.org/C47611674","wikidata":"https://www.wikidata.org/wiki/Q849491","display_name":"Neuroplasticity","level":2,"score":0.3237000107765198},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.295199990272522},{"id":"https://openalex.org/C89611455","wikidata":"https://www.wikidata.org/wiki/Q6804646","display_name":"Mechanism (biology)","level":2,"score":0.288100004196167},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.26649999618530273}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2510.21908","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2510.21908","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2510.21908","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2510.21908","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.5521637201309204,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"language":[1],"models":[2],"display":[3],"in-context":[4],"learning":[5],"as":[6],"an":[7],"emergent":[8],"effect":[9],"of":[10,67,120],"scale,":[11],"but":[12],"they":[13],"rely":[14],"on":[15,96],"static":[16,107],"weights":[17,108],"during":[18],"inference.":[19],"In":[20],"contrast,":[21],"biological":[22],"systems":[23],"continually":[24],"adapt":[25],"via":[26],"synaptic":[27],"plasticity.":[28],"We":[29],"investigate":[30],"whether":[31],"explicit,":[32],"biologically":[33],"inspired":[34],"plasticity":[35,65,82,117,134,147,159],"can":[36],"endow":[37],"Transformers":[38,49],"with":[39,50],"faster":[40],"in-sequence":[41],"adaptation.":[42],"To":[43],"this":[44],"end,":[45],"we":[46],"augment":[47],"decoder-only":[48],"fast-weight":[51],"modules":[52],"updated":[53],"either":[54],"by":[55,150],"(i)":[56],"a":[57,111],"neuromodulated":[58],"Hebbian":[59,81,133],"rule":[60],"or":[61],"(ii)":[62],"the":[63],"gradient-based":[64,92,126],"mechanism":[66],"Duan":[68],"et":[69],"al.":[70],"(2023).":[71],"Across":[72],"copying,":[73],"regression,":[74],"and":[75,87,104,155],"few-shot":[76,89],"classification":[77],"tasks":[78],"(CIFAR-FS,":[79],"Omniglot),":[80],"consistently":[83],"achieves":[84],"lower":[85],"loss":[86],"stronger":[88],"generalization,":[90],"while":[91],"updates":[93],"perform":[94],"best":[95],"long-horizon":[97],"credit":[98],"assignment.":[99],"When":[100],"associations":[101],"are":[102,161],"short":[103],"linearly":[105],"separable,":[106],"suffice,":[109],"defining":[110],"clear":[112],"boundary":[113],"condition":[114],"for":[115],"when":[116,157],"helps.":[118],"Analysis":[119],"learned":[121],"modulatory":[122],"signals":[123],"reveals":[124],"that":[125,145],"rules":[127],"maintain":[128],"large,":[129],"persistent":[130],"updates,":[131],"whereas":[132],"is":[135],"sharply":[136],"gated":[137],"around":[138],"salient":[139],"events.":[140],"Together,":[141],"these":[142],"results":[143],"show":[144],"explicit":[146],"complements":[148],"attention":[149],"enabling":[151],"rapid,":[152],"task-specific":[153],"adaptation,":[154],"clarify":[156],"different":[158],"mechanisms":[160],"most":[162],"effective.":[163]},"counts_by_year":[],"updated_date":"2025-11-06T06:51:31.235846","created_date":"2025-10-29T00:00:00"}
