% Tay et al. (2023): conference paper in the EMNLP 2023 proceedings.
% Field values are kept verbatim; the url points at the ACL Anthology record.
@inproceedings{tay-etal-2023-transcending,
  author    = {Tay, Yi and Wei, Jason and Chung, Hyung and Tran, Vinh and So, David and Shakeri, Siamak and Garcia, Xavier and Zheng, Steven and Rao, Jinfeng and Chowdhery, Aakanksha and Zhou, Denny and Metzler, Donald and Petrov, Slav and Houlsby, Neil and Le, Quoc and Dehghani, Mostafa},
  title     = {Transcending Scaling Laws with 0.1{\%} Extra Compute},
  editor    = {Bouamor, Houda and Pino, Juan and Bali, Kalika},
  booktitle = {Proceedings of the 2023 Conference on Empirical Methods in Natural Language Processing},
  publisher = {Association for Computational Linguistics},
  address   = {Singapore},
  month     = dec,
  year      = {2023},
  pages     = {1471--1486},
  doi       = {10.18653/v1/2023.emnlp-main.91},
  url       = {https://aclanthology.org/2023.emnlp-main.91/},
}