@inproceedings{wang-etal-2025-faster,
  author    = {Wang, Zili and Zhang, Tianyu and Bai, Haoli and Hou, Lu and Yu, Xianzhi and Liu, Wulong and Xiang, Shiming and Zhu, Lei},
  title     = {Faster and Better {LLM}s via Latency-Aware Test-Time Scaling},
  editor    = {Christodoulopoulos, Christos and Chakraborty, Tanmoy and Rose, Carolyn and Peng, Violet},
  booktitle = {Findings of the Association for Computational Linguistics: EMNLP 2025},
  publisher = {Association for Computational Linguistics},
  address   = {Suzhou, China},
  month     = nov,
  year      = {2025},
  pages     = {17124--17137},
  isbn      = {979-8-89176-335-7},
  url       = {https://aclanthology.org/2025.findings-emnlp.928/},
}