license: apache-2.0 | |
[MambaInLlama](https://arxiv.org/abs/2408.15237) | |
``` | |
% arXiv preprint: the identifier is stored in the eprint fields, not in a journal name.
@misc{junxiongdaniele2024mambainllama,
  author        = {Wang, Junxiong and Paliotta, Daniele and May, Avner and Rush, Alexander M. and Dao, Tri},
  title         = {The {Mamba} in the {Llama}: Distilling and Accelerating Hybrid Models},
  year          = {2024},
  eprint        = {2408.15237},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2408.15237},
}
``` |