% Dataset Groups Activity Stream
% Webvid-10M
% The dataset used for training the video model consists of Webvid-10M, a
% large-scale dataset of short videos with textual descriptions.
%
% BibTeX:
% Dataset record for Webvid-10M (publisher TIB; see the doi and url fields).
%
% Maintainer notes:
%   - The citation key is kept exactly as exported, including its non-ASCII
%     diaeresis character, so that existing citations keep resolving. Prefer
%     an ASCII-only key if this record is ever re-keyed.
%   - The author name is written with the escape {\"u}, which is a BibTeX
%     "special character" and therefore sorts and labels correctly under
%     both classic BibTeX and Biber.
%   - The title is brace-protected as a whole because it is a single proper
%     name whose capital "M" must survive sentence-casing styles.
%   - "No Organization" in the institution field is the exporter's
%     placeholder value; it is retained as exported.
@dataset{Max_Bain_and_Arsha_Nagrani_and_G¨ul_Varol_and_Andrew_Zisserman_2024,
  author      = {Bain, Max and Nagrani, Arsha and Varol, G{\"u}l and Zisserman, Andrew},
  title       = {{Webvid-10M}},
  year        = {2024},
  month       = dec,
  publisher   = {TIB},
  institution = {No Organization},
  doi         = {10.57702/lral74s0},
  url         = {https://service.tib.eu/ldmservice/dataset/webvid-10m},
  keywords    = {dataset, large-scale, short videos, video},
  abstract    = {The dataset used for training the video model consists of Webvid-10M, a large-scale dataset of short videos with textual descriptions.},
}