% Le Scao et al. (2022), Findings of the ACL: EMNLP 2022, pp. 765--782.
@inproceedings{le-scao-etal-2022-language,
  author    = {Le Scao, Teven and
               Wang, Thomas and
               Hesslow, Daniel and
               Bekman, Stas and
               Bari, M Saiful and
               Biderman, Stella and
               Elsahar, Hady and
               Muennighoff, Niklas and
               Phang, Jason and
               Press, Ofir and
               Raffel, Colin and
               Sanh, Victor and
               Shen, Sheng and
               Sutawika, Lintang and
               Tae, Jaesung and
               Yong, Zheng Xin and
               Launay, Julien and
               Beltagy, Iz},
  title     = {What Language Model to Train if You Have One Million {GPU} Hours?},
  editor    = {Goldberg, Yoav and
               Kozareva, Zornitsa and
               Zhang, Yue},
  booktitle = {Findings of the Association for Computational Linguistics: EMNLP 2022},
  year      = {2022},
  month     = dec,
  address   = {Abu Dhabi, United Arab Emirates},
  publisher = {Association for Computational Linguistics},
  pages     = {765--782},
  doi       = {10.18653/v1/2022.findings-emnlp.54},
  url       = {https://aclanthology.org/2022.findings-emnlp.54/},
}