% Workshop paper, pages 10--20 of the proceedings named in booktitle.
% Editors are written in "Last, First" form; the two-part surnames of the
% last two editors are kept together before the comma so they are parsed,
% sorted and abbreviated as surnames rather than as given names.
% NOTE(review): address appears to hold the conference venue and publisher
% carries its own city; both values are kept verbatim -- confirm against
% the target style before normalising.
@inproceedings{ditchfield-ogle-mitkov-2025-comparative,
  author    = {Ditchfield-Ogle, Tomas and Mitkov, Ruslan},
  title     = {A Comparative Study of Vision Transformers and Multimodal Language Models for Violence Detection in Videos},
  editor    = {Picazo-Izquierdo, Alicia and
               Estevanell-Valladares, Ernesto Luis and
               Mitkov, Ruslan and
               Mu{\~n}oz Guillena, Rafael and
               Garc{\'i}a Cerd{\'a}, Ra{\'u}l},
  booktitle = {Proceedings of the First Workshop on Comparative Performance Evaluation: From Rules to Language Models},
  month     = sep,
  year      = {2025},
  address   = {Varna, Bulgaria},
  publisher = {INCOMA Ltd., Shoumen, Bulgaria},
  pages     = {10--20},
  url       = {https://aclanthology.org/2025.r2lm-1.2/},
}