{"article":{"@attributes":{"key":"journals\/corr\/abs-2205-09256","publtype":"informal","mdate":"2024-04-11"},"author":["Liangke Gui","Qiuyuan Huang","Alex Hauptmann 0001","Yonatan Bisk","Jianfeng Gao 0001"],"title":"Training Vision-Language Transformers from Captions Alone.","year":"2022","volume":"abs\/2205.09256","journal":"CoRR","ee":"https:\/\/doi.org\/10.48550\/arXiv.2205.09256","url":"db\/journals\/corr\/corr2205.html#abs-2205-09256"}}