@comment{
  Dataset Groups Activity Stream
  YFCC15M
  Mid-scale 15M data is a good balance of the training cost and performance.
  The dataset is used for Contrastive Language-Image Pretraining (CLIP) and its variants.
  BibTex:
}

@dataset{Yufeng_Cui_and_Lichen_Zhao_and_Feng_Liang_and_Yangguang_Li_and_Jing_Shao_2024,
  author    = {Cui, Yufeng and Zhao, Lichen and Liang, Feng and Li, Yangguang and Shao, Jing},
  title     = {{YFCC15M}},
  year      = {2024},
  month     = dec,
  publisher = {TIB},
  doi       = {10.57702/9tsbls5f},
  url       = {https://service.tib.eu/ldmservice/dataset/yfcc15m},
  keywords  = {Contrastive Learning, Image-Text Pre-training, Visual Models},
  abstract  = {Mid-scale 15M data is a good balance of the training cost and performance. The dataset is used for Contrastive Language-Image Pretraining (CLIP) and its variants.},
}