% Technical report IC-PFG-22-36, Institute of Computing, University of Campinas.
% The abstract is kept in its own `abstract` field so the bibliography style
% decides whether and how to print it; `note` carries only the short
% language/length remark and no hard-coded LaTeX formatting.
@techreport{TR-IC-PFG-22-36,
  author      = {Almeida, Thales Rog{\'e}rio Sales and
                 Nogueira, Rodrigo Frasseto and
                 Pedrini, H{\'e}lio},
  title       = {An Analysis of the Currently Available Text-to-Image Models},
  institution = {Institute of Computing, University of Campinas},
  number      = {IC-PFG-22-36},
  year        = {2022},
  month       = dec,
  note        = {In English, 11 pages.},
  abstract    = {This work aims to study some of the most prominent publicly available models for the text-to-image generation task. In addition, we investigated whether an ensemble of these models can achieve better results using a CLIP model as a ranker. To perform these experiments, we selected two available models that performed well on the public MS-COCO benchmark. We also experimented with Stable Diffusion, a diffusion model that became popular due to the quality of the images it generates. We evaluated each model and the ensembles in subsets of the MS-COCO and FLICKR datasets.},
}