% Workshop paper; ACL Anthology ID 2021.sustainlp-1.5 (see url/doi fields below).
@inproceedings{gupta-etal-2021-memory,
  author    = {Gupta, Ankit and Dar, Guy and Goodman, Shaya and Ciprut, David and Berant, Jonathan},
  title     = {Memory-efficient Transformers via Top-k Attention},
  editor    = {Moosavi, Nafise Sadat and Gurevych, Iryna and Fan, Angela and Wolf, Thomas and Hou, Yufang and Marasovi{\'c}, Ana and Ravi, Sujith},
  booktitle = {Proceedings of the Second Workshop on Simple and Efficient Natural Language Processing},
  publisher = {Association for Computational Linguistics},
  address   = {Virtual},
  month     = nov,
  year      = {2021},
  pages     = {39--52},
  doi       = {10.18653/v1/2021.sustainlp-1.5},
  url       = {https://aclanthology.org/2021.sustainlp-1.5/},
}