% GlueGen arXiv preprint. The arXiv identifier lives in eprint/archiveprefix
% rather than in a fake journal name; url is a fallback for styles that
% ignore eprint. NOTE(review): if a peer-reviewed version exists, prefer
% citing that venue instead -- confirm before submission.
@misc{qin2023gluegen,
  author        = {Qin, Can and Yu, Ning and Xing, Chen and Zhang, Shu and Chen, Zeyuan and Ermon, Stefano and Fu, Yun and Xiong, Caiming and Xu, Ran},
  title         = {{GlueGen}: Plug and Play Multi-modal Encoders for {X-to-image} Generation},
  year          = {2023},
  eprint        = {2303.10056},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2303.10056},
}