% Wei et al. (2024): conference paper in the EMNLP 2024 proceedings
% (ACL Anthology identifier 2024.emnlp-main.775).
@inproceedings{wei-etal-2024-structured,
  author    = {Wei, Jiateng and
               Lu, Quan and
               Jiang, Ning and
               Li, Siqi and
               Xiang, Jingyang and
               Chen, Jun and
               Liu, Yong},
  title     = {Structured Optimal Brain Pruning for Large Language Models},
  editor    = {Al-Onaizan, Yaser and
               Bansal, Mohit and
               Chen, Yun-Nung},
  booktitle = {Proceedings of the 2024 Conference on Empirical Methods in Natural Language Processing},
  month     = nov,
  year      = {2024},
  address   = {Miami, Florida, USA},
  publisher = {Association for Computational Linguistics},
  pages     = {13991--14007},
  doi       = {10.18653/v1/2024.emnlp-main.775},
  url       = {https://aclanthology.org/2024.emnlp-main.775/},
}