% DORM paper, Findings of EMNLP 2025 (record hosted on the ACL Anthology).
@inproceedings{zhang-etal-2025-dorm,
  author    = {Zhang, Rongzhi and
               Zhang, Chenwei and
               Zhang, Xinyang and
               Qiu, Liang and
               Jiang, Haoming and
               Zhuang, Yuchen and
               Zhang, Qingru and
               Yun, Hyokun and
               Li, Xian and
               Yin, Bing and
               Zhao, Tuo and
               Zhang, Chao},
  title     = {{DORM}: Preference Data Weights Optimization for Reward Modeling in {LLM} Alignment},
  editor    = {Christodoulopoulos, Christos and
               Chakraborty, Tanmoy and
               Rose, Carolyn and
               Peng, Violet},
  booktitle = {Findings of the Association for Computational Linguistics: EMNLP 2025},
  publisher = {Association for Computational Linguistics},
  address   = {Suzhou, China},
  month     = nov,
  year      = {2025},
  pages     = {22721--22739},
  isbn      = {979-8-89176-335-7},
  url       = {https://aclanthology.org/2025.findings-emnlp.1237/},
}