Recurrent fast-weight memories and selective state-space models compress a growing context into a bounded state; their writes can therefore be viewed as online continual-learning rules.
Date: March 9, 2026
[Project Page] [Webpage] [Paper]

% Citation for the "Fast Weight Attention for Continual Learning" project.
% The collective author is double-braced so BibTeX keeps it as one indivisible
% name, and the month uses the standard three-letter macro (unquoted).
@article{zhang2026fast,
  author  = {{FWA Authors}},
  title   = {Fast Weight Attention for Continual Learning},
  journal = {yifanzhang-pro.github.io},
  year    = {2026},
  month   = mar,
  url     = {https://github.com/yifanzhang-pro/fast-weight-attention},
}