% Conference paper in the EACL 2024 long-papers proceedings (record URL points at the ACL Anthology).
% Note: `address` carries the location string exactly as supplied by the original record.
@inproceedings{li-etal-2024-localization,
  author    = {Li, Zhuowan and Xie, Cihang and Van Durme, Benjamin and Yuille, Alan},
  title     = {Localization vs. Semantics: Visual Representations in Unimodal and Multimodal Models},
  editor    = {Graham, Yvette and Purver, Matthew},
  booktitle = {Proceedings of the 18th Conference of the European Chapter of the Association for Computational Linguistics (Volume 1: Long Papers)},
  publisher = {Association for Computational Linguistics},
  address   = {St. Julian{'}s, Malta},
  month     = mar,
  year      = {2024},
  pages     = {2378--2390},
  url       = {https://aclanthology.org/2024.eacl-long.146/},
}