@comment{
  Citation record for the "LAION COCO 600M" dataset entry published by TIB.

  Page text that preceded the record in the original listing:
    Dataset Groups Activity Stream LAION COCO 600M
    The dataset used for training the text-to-video model consists of
    20 million videos and 600 million images.
    BibTex:

  Notes for maintainers:
    - The citation key is kept exactly as exported so existing citations resolve.
    - The exported institution value "No Organization" is a placeholder, not a
      real institution, and is therefore omitted from the entry.
    - month uses the predefined three-letter macro and must stay unbraced.
}

@dataset{Haoxin_Chen_and_Menghan_Xia_and_Yingqing_He_and_Yong_Zhang_and_Xiaodong_Cun_and_Shaoshu_Yang_and_Jinbo_Xing_and_Yaofang_Liu_and_Qifeng_Chen_and_Xintao_Wang_and_Ying_Shan_2024,
  author    = {Chen, Haoxin and Xia, Menghan and He, Yingqing and Zhang, Yong and Cun, Xiaodong and Yang, Shaoshu and Xing, Jinbo and Liu, Yaofang and Chen, Qifeng and Wang, Xintao and Shan, Ying},
  title     = {{LAION} {COCO} {600M}},
  publisher = {TIB},
  year      = {2024},
  month     = dec,
  doi       = {10.57702/nofk4rod},
  url       = {https://service.tib.eu/ldmservice/dataset/laion-coco-600m},
  keywords  = {dataset, image, large-scale, video},
  abstract  = {The dataset used for training the text-to-video model consists of 20 million videos and 600 million images.},
}