% Journal article: Transactions of the Association for Computational Linguistics, vol. 13 (2025).
% Title words that must keep their capitalisation (TALE, KVCache) are braced as
% whole words so that sentence-casing bibliography styles do not lowercase them.
@article{lee-etal-2025-tale,
  author    = {Lee, Jaeseong and Hwang, Seung-won and Qiao, Aurick and Campos, Daniel and Yao, Zhewei and He, Yuxiong},
  title     = {{TALE}: Token-Adaptive Low-Rank {KVCache} Approximation with Reconstruction Elimination},
  journal   = {Transactions of the Association for Computational Linguistics},
  volume    = {13},
  pages     = {1298--1318},
  year      = {2025},
  publisher = {MIT Press},
  address   = {Cambridge, MA},
  doi       = {10.1162/tacl.a.39},
  url       = {https://aclanthology.org/2025.tacl-1.59/},
}