% Griffin: arXiv preprint 2402.19427 (2024).
% The arXiv identifier is stored in the eprint fields rather than in a
% journal field, so that styles can format and hyperlink it themselves.
% The author list is intentionally truncated with "and others" (rendered as et al.).
@misc{de2024griffin,
  author        = {De, Soham and Smith, Samuel L. and Fernando, Anushan and Botev, Aleksandar and Cristian-Muraru, George and Gu, Albert and Haroun, Ruba and Berrada, Leonard and Chen, Yutian and Srinivasan, Srivatsan and others},
  title         = {{Griffin}: Mixing Gated Linear Recurrences with Local Attention for Efficient Language Models},
  year          = {2024},
  eprint        = {2402.19427},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2402.19427},
}