% Conference paper from the ACL 2024 long-papers proceedings.
% Braces inside the title protect words that must keep their capital letter
% when a bibliography style sentence-cases titles: the proper noun, the first
% word after the question mark, and the acronym.
% NOTE(review): address holds the conference location rather than the
% publisher's city (looks like an ACL Anthology export) -- confirm the target
% style expects that.
@inproceedings{fan-etal-2024-muffin,
  author    = {Fan, Yue and Gu, Jing and Zhou, Kaiwen and Yan, Qianqi and Jiang, Shan and Kuo, Ching-Chen and Zhao, Yang and Guan, Xinze and Wang, Xin},
  title     = {Muffin or {Chihuahua}? {Challenging} Multimodal Large Language Models with Multipanel {VQA}},
  editor    = {Ku, Lun-Wei and Martins, Andre and Srikumar, Vivek},
  booktitle = {Proceedings of the 62nd Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)},
  month     = aug,
  year      = {2024},
  address   = {Bangkok, Thailand},
  publisher = {Association for Computational Linguistics},
  pages     = {6845--6863},
  doi       = {10.18653/v1/2024.acl-long.370},
  url       = {https://aclanthology.org/2024.acl-long.370/},
}