% SafeConf paper (Zhang et al.), Findings of ACL: EMNLP 2025, pages 3483--3495; see the url field for the ACL Anthology record.
% NOTE(review): address presumably holds the conference venue rather than the publisher's city -- confirm against the target style.
@inproceedings{zhang-etal-2025-safeconf,
  title     = {{SafeConf}: A Confidence-Calibrated Safety Self-Evaluation Method for Large Language Models},
  author    = {Zhang, Bo and
               Gao, Cong and
               Yang, Linkang and
               Han, Bingxu and
               Hu, Minghao and
               Luo, Zhunchen and
               Geng, Guotong and
               Bai, Xiaoying and
               Zhang, Jun and
               Yao, Wen and
               Wang, Zhong},
  editor    = {Christodoulopoulos, Christos and
               Chakraborty, Tanmoy and
               Rose, Carolyn and
               Peng, Violet},
  booktitle = {Findings of the Association for Computational Linguistics: EMNLP 2025},
  month     = nov,
  year      = {2025},
  address   = {Suzhou, China},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2025.findings-emnlp.186/},
  pages     = {3483--3495},
  isbn      = {979-8-89176-335-7},
}