% Jo and Myaeng, ACL 2020 (paper 2020.acl-main.311 in the ACL Anthology).
% "Transformer" is brace-protected in the title so that sentence-casing
% bibliography styles do not lowercase the architecture name.
@inproceedings{jo-myaeng-2020-roles,
  author    = {Jo, Jae-young and Myaeng, Sung-Hyon},
  editor    = {Jurafsky, Dan and Chai, Joyce and Schluter, Natalie and Tetreault, Joel},
  title     = {Roles and Utilization of Attention Heads in {Transformer}-based Neural Language Models},
  booktitle = {Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics},
  month     = jul,
  year      = {2020},
  address   = {Online},
  publisher = {Association for Computational Linguistics},
  pages     = {3404--3417},
  doi       = {10.18653/v1/2020.acl-main.311},
  url       = {https://aclanthology.org/2020.acl-main.311/},
}