% Workshop paper (WNGT 2020, ACL Anthology ID 2020.ngt-1.4) on 4-bit compression of NMT models.
@inproceedings{aji-heafield-2020-compressing,
  author    = {Aji, Alham Fikri and Heafield, Kenneth},
  title     = {Compressing Neural Machine Translation Models with 4-bit Precision},
  editor    = {Birch, Alexandra and Finch, Andrew and Hayashi, Hiroaki and Heafield, Kenneth and Junczys-Dowmunt, Marcin and Konstas, Ioannis and Li, Xian and Neubig, Graham and Oda, Yusuke},
  booktitle = {Proceedings of the Fourth Workshop on Neural Generation and Translation},
  month     = jul,
  year      = {2020},
  address   = {Online},
  publisher = {Association for Computational Linguistics},
  pages     = {35--42},
  doi       = {10.18653/v1/2020.ngt-1.4},
  url       = {https://aclanthology.org/2020.ngt-1.4/},
}