% Findings of ACL 2024 paper: text compression of tokenizers and its correlation with model performance.
@inproceedings{goldman-etal-2024-unpacking,
  author    = {Goldman, Omer and Caciularu, Avi and Eyal, Matan and Cao, Kris and Szpektor, Idan and Tsarfaty, Reut},
  title     = {Unpacking Tokenization: Evaluating Text Compression and its Correlation with Model Performance},
  editor    = {Ku, Lun-Wei and Martins, Andre and Srikumar, Vivek},
  booktitle = {Findings of the Association for Computational Linguistics: ACL 2024},
  publisher = {Association for Computational Linguistics},
  address   = {Bangkok, Thailand},
  month     = aug,
  year      = {2024},
  pages     = {2274--2286},
  doi       = {10.18653/v1/2024.findings-acl.134},
  url       = {https://aclanthology.org/2024.findings-acl.134/},
}