% arXiv preprint. Braced words in the title keep their capitalisation under
% styles that sentence-case titles. The identifier is stored in eprint and
% archiveprefix for eprint-aware styles; the journal text is kept so styles
% that ignore those fields still print it.
@article{kim2026fastkvzip,
  author        = {Kim, Jang-Hyun and Han, Dongyoon and Yun, Sangdoo},
  title         = {Fast {KVzip}: Efficient and Accurate {LLM} Inference with Gated {KV} Eviction},
  journal       = {arXiv preprint arXiv:2601.17668},
  year          = {2026},
  eprint        = {2601.17668},
  archiveprefix = {arXiv},
}