@comment{arXiv preprint 2410.22315. Author names are stored in "Last, First"
  form; a stray "au2" token that followed "III" in the author list was removed,
  and the accented letter is written as a LaTeX escape so the entry works with
  both classic BibTeX and Biber.}
@misc{cascantebonilla2024naturallanguageinferenceimproves,
  author        = {Cascante-Bonilla, Paola and Hou, Yu and Cao, Yang Trista and Daum{\'e} III, Hal and Rudinger, Rachel},
  title         = {Natural Language Inference Improves Compositionality in Vision-Language Models},
  year          = {2024},
  eprint        = {2410.22315},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
  url           = {https://arxiv.org/abs/2410.22315},
}