% ECCV 2024 conference paper; the url field points to the arXiv preprint.
@inproceedings{lin24eccv,
  author    = {Lin, Zhiqiu and Pathak, Deepak and Li, Baiqi and Li, Jiayao and Xia, Xide and Neubig, Graham and Zhang, Pengchuan and Ramanan, Deva},
  title     = {Evaluating Text-to-Visual Generation with Image-to-Text Generation},
  booktitle = {The European Conference on Computer Vision ({ECCV})},
  address   = {Milan, Italy},
  month     = sep,
  year      = {2024},
  url       = {https://arxiv.org/abs/2404.01291},
}