% Workshop paper (MM-NLG 2023). In the title, ViLBERT is braced as a whole word
% and the subtitle-initial A is braced so that sentence-casing styles keep
% both capitalised.
@inproceedings{voloshina-etal-2023-language,
  title     = {Are Language-and-Vision Transformers Sensitive to Discourse? {A} Case Study of {ViLBERT}},
  author    = {Voloshina, Ekaterina and Ilinykh, Nikolai and Dobnik, Simon},
  editor    = {Gatt, Albert and Gardent, Claire and Cripwell, Liam and Belz, Anya and Borg, Claudia and Erdem, Aykut and Erdem, Erkut},
  booktitle = {Proceedings of the Workshop on Multimodal, Multilingual Natural Language Generation and Multilingual WebNLG Challenge (MM-NLG 2023)},
  month     = sep,
  year      = {2023},
  address   = {Prague, Czech Republic},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2023.mmnlg-1.4/},
  pages     = {28--38},
}