% Conference paper entry; the url field points to the arXiv abstract page.
% NOTE(review): booktitle names the main ACL proceedings while series says
% "Findings" -- confirm which venue is correct before publishing.
@inproceedings{Zhenmei-gem,
  author    = {Shi, Zhenmei and Ming, Yifei and Nguyen, Xuan-Phi and Liang, Yingyu and Joty, Shafiq},
  title     = {Discovering the Gems in Early Layers: Accelerating Long-Context {LLMs} with 1000x Input Token Reduction},
  booktitle = {Proceedings of the 64th Annual Meeting of the Association for Computational Linguistics},
  series    = {ACL-26 Findings},
  year      = {2026},
  url       = {https://arxiv.org/abs/2409.17422},
}