% Conference paper from the LREC-COLING 2024 proceedings (ACL Anthology record).
% Field values are stored verbatim; only layout and delimiters are normalised.
@inproceedings{sun-etal-2024-decoding,
  author    = {Sun, Chenxi and Zhang, Hongzhi and Lin, Zijia and Zhang, Jingyuan and Zhang, Fuzheng and Wang, Zhongyuan and Chen, Bin and Song, Chengru and Zhang, Di and Gai, Kun and Xiong, Deyi},
  title     = {Decoding at the Speed of Thought: Harnessing Parallel Decoding of Lexical Units for {LLM}s},
  editor    = {Calzolari, Nicoletta and Kan, Min-Yen and Hoste, Veronique and Lenci, Alessandro and Sakti, Sakriani and Xue, Nianwen},
  booktitle = {Proceedings of the 2024 Joint International Conference on Computational Linguistics, Language Resources and Evaluation (LREC-COLING 2024)},
  year      = {2024},
  month     = may,
  publisher = {ELRA and ICCL},
  address   = {Torino, Italia},
  pages     = {4476--4487},
  url       = {https://aclanthology.org/2024.lrec-main.401/},
}