{"id":"https://openalex.org/W7134943437","doi":"https://doi.org/10.48550/arxiv.2603.09576","title":"Routing without Forgetting","display_name":"Routing without Forgetting","publication_year":2026,"publication_date":"2026-03-10","ids":{"openalex":"https://openalex.org/W7134943437","doi":"https://doi.org/10.48550/arxiv.2603.09576"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.09576","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.09576","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.09576","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5120450541","display_name":"Alessio Masano","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Masano, Alessio","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083136342","display_name":"Giovanni Bellitto","orcid":"https://orcid.org/0000-0002-1333-8348"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bellitto, Giovanni","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128747623","display_name":"Dipam Goswani","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Goswani, Dipam","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128792333","display_name":"Joost Van de Weijer","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Van de Weijer, Joost","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5075815307","display_name":"Concetto Spampinato","orcid":"https://orcid.org/0000-0001-6653-2577"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Spampinato, Concetto","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5120450541"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9587000012397766,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9587000012397766,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.013100000098347664,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.002899999963119626,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/forgetting","display_name":"Forgetting","score":0.6513000130653381},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.6187000274658203},{"id":"https://openalex.org/keywords/subspace-topology","display_name":"Subspace topology","score":0.48429998755455017},{"id":"https://openalex.org/keywords/associative-property","display_name":"Associative property","score":0.42809998989105225},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.4253999888896942},{"id":"https://openalex.org/keywords/encode","display_name":"ENCODE","score":0.4214000105857849},{"id":"https://openalex.org/keywords/identifier","display_name":"Identifier","score":0.38690000772476196},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.3840999901294708},{"id":"https://openalex.org/keywords/routing","display_name":"Routing (electronic design automation)","score":0.3758000135421753}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7325999736785889},{"id":"https://openalex.org/C7149132","wikidata":"https://www.wikidata.org/wiki/Q1377840","display_name":"Forgetting","level":2,"score":0.6513000130653381},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.6187000274658203},{"id":"https://openalex.org/C32834561","wikidata":"https://www.wikidata.org/wiki/Q660730","display_name":"Subspace topology","level":2,"score":0.48429998755455017},{"id":"https://openalex.org/C159423971","wikidata":"https://www.wikidata.org/wiki/Q177251","display_name":"Associative property","level":2,"score":0.42809998989105225},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.4253999888896942},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.4214000105857849},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4090000092983246},{"id":"https://openalex.org/C154504017","wikidata":"https://www.wikidata.org/wiki/Q853614","display_name":"Identifier","level":2,"score":0.38690000772476196},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.3840999901294708},{"id":"https://openalex.org/C74172769","wikidata":"https://www.wikidata.org/wiki/Q1446839","display_name":"Routing (electronic design automation)","level":2,"score":0.3758000135421753},{"id":"https://openalex.org/C53442348","wikidata":"https://www.wikidata.org/wiki/Q745101","display_name":"Content-addressable memory","level":3,"score":0.3675000071525574},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3594000041484833},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.35920000076293945},{"id":"https://openalex.org/C184896649","wikidata":"https://www.wikidata.org/wiki/Q290066","display_name":"Routing table","level":4,"score":0.34470000863075256},{"id":"https://openalex.org/C147764199","wikidata":"https://www.wikidata.org/wiki/Q6865248","display_name":"Minification","level":2,"score":0.3303000032901764},{"id":"https://openalex.org/C40506919","wikidata":"https://www.wikidata.org/wiki/Q7452469","display_name":"Sequence learning","level":2,"score":0.3253999948501587},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.32409998774528503},{"id":"https://openalex.org/C2778618852","wikidata":"https://www.wikidata.org/wiki/Q1128613","display_name":"Content-addressable storage","level":4,"score":0.3075000047683716},{"id":"https://openalex.org/C46421273","wikidata":"https://www.wikidata.org/wiki/Q1407668","display_name":"Hopfield network","level":3,"score":0.3043000102043152},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.2996000051498413},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.29170000553131104},{"id":"https://openalex.org/C117619785","wikidata":"https://www.wikidata.org/wiki/Q6094414","display_name":"Iterative learning control","level":3,"score":0.2851000130176544},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.28439998626708984},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.2766999900341034},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.27079999446868896},{"id":"https://openalex.org/C168993435","wikidata":"https://www.wikidata.org/wiki/Q6501125","display_name":"Ground","level":2,"score":0.26440000534057617},{"id":"https://openalex.org/C89305328","wikidata":"https://www.wikidata.org/wiki/Q1755411","display_name":"Link-state routing protocol","level":4,"score":0.2621999979019165},{"id":"https://openalex.org/C46686674","wikidata":"https://www.wikidata.org/wiki/Q466303","display_name":"Boosting (machine learning)","level":2,"score":0.2556999921798706},{"id":"https://openalex.org/C157972887","wikidata":"https://www.wikidata.org/wiki/Q463359","display_name":"Convex optimization","level":3,"score":0.2515999972820282}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.09576","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.09576","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.09576","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.09576","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.7392132878303528,"display_name":"Affordable and clean energy","id":"https://metadata.un.org/sdg/7"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Continual":[0,41],"learning":[1,62,186],"in":[2,26,39,63,184],"transformers":[3,64],"is":[4],"commonly":[5],"addressed":[6],"through":[7,124],"parameter-efficient":[8],"adaptation:":[9],"prompts,":[10,119],"adapters,":[11],"or":[12,89,116],"LoRA":[13],"modules":[14],"are":[15],"specialized":[16],"per":[17],"task":[18,87],"while":[19],"the":[20,73,78,129,139,198],"backbone":[21,200],"remains":[22],"frozen.":[23],"Although":[24],"effective":[25,205],"controlled":[27],"multi-epoch":[28],"settings,":[29],"these":[30],"approaches":[31,178],"rely":[32],"on":[33],"gradual":[34],"gradient-based":[35],"specialization":[36],"and":[37,51,172,204],"struggle":[38],"Online":[40],"Learning":[42],"(OCL),":[43],"where":[44],"data":[45],"arrive":[46],"as":[47,65],"a":[48,66,99,143,180,202],"non-stationary":[49],"stream":[50],"each":[52,83,134,152],"sample":[53],"may":[54],"be":[55],"observed":[56],"only":[57],"once.":[58],"We":[59,92],"recast":[60],"continual":[61],"routing":[67,150,195],"problem:":[68],"under":[69],"strict":[70],"online":[71],"constraints,":[72],"model":[74],"must":[75],"dynamically":[76],"select":[77],"appropriate":[79],"representational":[80],"subspace":[81],"for":[82,207],"input":[84],"without":[85,96],"explicit":[86],"identifiers":[88],"repeated":[90],"optimization.":[91],"thus":[93],"introduce":[94],"Routing":[95],"Forgetting":[97],"(RwF),":[98],"transformer":[100,130,199],"architecture":[101],"augmented":[102],"with":[103],"energy-based":[104,193],"associative":[105,126,194],"retrieval":[106,127],"layers":[107],"inspired":[108],"by":[109,179],"Modern":[110],"Hopfield":[111],"Networks.":[112],"Instead":[113],"of":[114,142,156],"storing":[115],"merging":[117],"task-specific":[118],"RwF":[120,164,174],"generates":[121],"dynamic":[122],"prompts":[123],"single-step":[125],"over":[128,166],"token":[131],"embeddings":[132],"at":[133],"layer.":[135],"Retrieval":[136],"corresponds":[137],"to":[138],"closed-form":[140],"minimization":[141],"strictly":[144],"convex":[145],"free-energy":[146],"functional,":[147],"enabling":[148],"input-conditioned":[149],"within":[151,197],"forward":[153],"pass,":[154],"independently":[155],"iterative":[157],"gradient":[158],"refinement.":[159],"Across":[160],"challenging":[161],"class-incremental":[162],"benchmarks,":[163],"improves":[165],"existing":[167],"prompt-based":[168,177],"methods.":[169],"On":[170],"Split-ImageNet-R":[171],"Split-ImageNet-S,":[173],"outperforms":[175],"prior":[176],"large":[181],"margin,":[182],"even":[183],"few-shot":[185],"regimes.":[187],"These":[188],"results":[189],"indicate":[190],"that":[191],"embedding":[192],"directly":[196],"provides":[201],"principled":[203],"foundation":[206],"OCL.":[208]},"counts_by_year":[],"updated_date":"2026-05-05T08:41:31.759640","created_date":"2026-03-12T00:00:00"}
