% arXiv preprint (identified via eprint/archivePrefix/primaryClass below).
% The ampersand in the title is escaped so LaTeX does not read it as an alignment tab.
@misc{cascantebonilla2023going,
  title         = {Going Beyond Nouns With Vision \& Language Models Using Synthetic Data},
  author        = {Cascante-Bonilla, Paola and
                   Shehada, Khaled and
                   Smith, James Seale and
                   Doveh, Sivan and
                   Kim, Donghyun and
                   Panda, Rameswar and
                   Varol, G{\"u}l and
                   Oliva, Aude and
                   Ordonez, Vicente and
                   Feris, Rogerio and
                   Karlinsky, Leonid},
  year          = {2023},
  eprint        = {2303.17590},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CV},
}