% Conference paper from the 37th Pacific Asia Conference on Language,
% Information and Computation; the url field points at ACL Anthology
% record 2023.paclic-1.53. Text outside an entry is ignored by BibTeX.
@inproceedings{zhu-etal-2023-estimating,
  author    = {Zhu, Tong and Irwin, Derek and Zhang, Yanhui and Wu, Renjie and Jiang, Xiaoyi},
  title     = {Estimating the Likelihood of Words Being Known with Corpus Analysis and K-Means Clustering Algorithm},
  editor    = {Huang, Chu-Ren and Harada, Yasunari and Kim, Jong-Bok and Chen, Si and Hsu, Yu-Yin and Chersoni, Emmanuele and A, Pranav and Zeng, Winnie Huiheng and Peng, Bo and Li, Yuxi and Li, Junlin},
  booktitle = {Proceedings of the 37th Pacific Asia Conference on Language, Information and Computation},
  month     = dec,
  year      = {2023},
  address   = {Hong Kong, China},
  publisher = {Association for Computational Linguistics},
  pages     = {535--542},
  url       = {https://aclanthology.org/2023.paclic-1.53/},
}