% arXiv preprint, recorded as a misc entry with eprint metadata; the
% identifier and subject class are taken from the original url and series
% fields. NOTE(review): if a peer-reviewed version exists, switch this to an
% inproceedings entry with a proper booktitle -- confirm before camera-ready.
@misc{Zhenmei-gem,
  author        = {Shi, Zhenmei and Ming, Yifei and Nguyen, Xuan-Phi and Liang, Yingyu and Joty, Shafiq},
  title         = {Discovering the Gems in Early Layers: Accelerating Long-Context {LLMs} with 1000x Input Token Reduction},
  year          = {2024},
  eprint        = {2409.17422},
  archiveprefix = {arXiv},
  primaryclass  = {cs.CL},
  url           = {https://arxiv.org/abs/2409.17422},
}