Dataset | Groups | Activity Stream

Microsoft Video Description Corpus (MSVD)

The MSVD dataset is a public video captioning benchmark that contains 1,970 short video clips with 80,000 descriptions.

BibTeX:

@comment{
  Review notes for the entry below (text outside an entry is ignored by BibTeX):
  - The citation key is unchanged so existing cite commands keep resolving.
  - month uses the predefined macro dec (unbraced) so styles can localise it.
  - keywords is a plain comma-separated list; the quote characters from the
    export were removed.
  - Microsoft and MSVD are brace-protected in the title so sentence-casing
    styles do not lowercase them.
  - NOTE(review): institution holds the export placeholder "No Organization";
    confirm whether a real institution exists or the field should be dropped.
  - NOTE(review): the authors are those listed on the TIB record; the corpus
    itself is presumably due to Chen and Dolan (2011). Confirm which work
    should be cited.
}

@dataset{Yuyu_Guo_and_Jingqiu_Zhang_and_Lianli_Gao_2024,
  author      = {Guo, Yuyu and Zhang, Jingqiu and Gao, Lianli},
  title       = {{Microsoft} Video Description Corpus ({MSVD})},
  publisher   = {TIB},
  institution = {No Organization},
  year        = {2024},
  month       = dec,
  doi         = {10.57702/0two3jmq},
  url         = {https://service.tib.eu/ldmservice/dataset/microsoft-video-description-corpus--msvd-},
  keywords    = {Corpus, Description, Video Captioning},
  abstract    = {The MSVD dataset is a public video captioning benchmark that contains 1,970 short video clips with 80,000 descriptions.},
}