% Journal article: Computational Linguistics, volume 51, issue 4 (December 2025).
@article{cognetta-okazaki-2025-tokenization,
  author    = {Cognetta, Marco and Okazaki, Naoaki},
  title     = {Tokenization as Finite-State Transduction},
  journal   = {Computational Linguistics},
  volume    = {51},
  number    = {4},
  pages     = {1119--1149},
  month     = dec,
  year      = {2025},
  publisher = {MIT Press},
  address   = {Cambridge, MA},
  doi       = {10.1162/coli.a.23},
  url       = {https://aclanthology.org/2025.cl-4.2/},
}