% arXiv preprint (no journal venue recorded): the identifier is stored in the
% eprint/archiveprefix fields instead of being embedded in a journal string.
% Braced title words keep their capitalisation under sentence-casing styles.
@misc{kim2026fast,
  author        = {Kim, Jang-Hyun and Han, Dongyoon and Yun, Sangdoo},
  title         = {Fast {KVzip}: Efficient and Accurate {LLM} Inference with Gated {KV} Eviction},
  year          = {2026},
  eprint        = {2601.17668},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2601.17668},
}