% Raposo et al. (2024), "Mixture-of-Depths" -- arXiv preprint 2404.02258.
% Recorded as a misc entry with eprint fields: the work is a preprint, so the
% arXiv identifier belongs in eprint/archiveprefix rather than in volume or
% journal. The citation key is unchanged so existing citations keep working.
% NOTE(review): primaryclass (cs.LG) and the expanded given name "Timothy"
% are taken from the arXiv listing as recalled -- confirm against the listing.
@misc{Raposo2024MixtureofDepthsDA,
  author        = {Raposo, David and Ritter, Sam and Richards, Blake and Lillicrap, Timothy and Humphreys, Peter and Santoro, Adam},
  title         = {{Mixture-of-Depths}: Dynamically allocating compute in transformer-based language models},
  year          = {2024},
  eprint        = {2404.02258},
  archiveprefix = {arXiv},
  primaryclass  = {cs.LG},
  url           = {https://arxiv.org/abs/2404.02258},
}