% Garg et al., 57th Annual Meeting of the ACL, 2019 (Anthology ID P19-1660).
@inproceedings{garg-etal-2019-learning,
  author    = {Garg, Sarthak and Moniz, Joel Ruben Antony and Aviral, Anshu and Bollimpalli, Priyatham},
  title     = {Learning to Relate from Captions and Bounding Boxes},
  editor    = {Korhonen, Anna and Traum, David and M{\`a}rquez, Llu{\'i}s},
  booktitle = {Proceedings of the 57th Annual Meeting of the Association for Computational Linguistics},
  year      = {2019},
  month     = jul,
  address   = {Florence, Italy},
  publisher = {Association for Computational Linguistics},
  pages     = {6597--6603},
  doi       = {10.18653/v1/P19-1660},
  url       = {https://aclanthology.org/P19-1660/},
}