Dataset Groups Activity Stream MSVD-QA The MSVD-QA dataset is a benchmark for video question answering, containing 1,970 videos with multiple-choice questions. BibTex:

@comment{
  Citation record for the MSVD-QA video question answering dataset,
  published by TIB under DOI 10.57702/ugauh7lr.
  - The citation key is kept exactly as exported so existing cite commands
    keep resolving.
  - Authors are separated by the word and (with surrounding spaces), which is
    the only name separator BibTeX and Biber recognise.
  - Given names are stored as initials because that is all the exported
    record provides.
  - month is the bare macro dec rather than a braced string, so the style
    decides how the month is rendered.
  - The title is an acronym and is brace-protected against sentence casing.
}
@dataset{Xu_D;_Zhao_Z;_Xiao_J;_Wu_F;_Zhang_H;_He_X;_and_Zhuang_Y_2024,
  author    = {Xu, D. and Zhao, Z. and Xiao, J. and Wu, F. and Zhang, H. and He, X. and Zhuang, Y.},
  title     = {{MSVD-QA}},
  publisher = {TIB},
  year      = {2024},
  month     = dec,
  doi       = {10.57702/ugauh7lr},
  url       = {https://service.tib.eu/ldmservice/dataset/msvd-qa},
  abstract  = {The MSVD-QA dataset is a benchmark for video question answering, containing 1,970 videos with multiple-choice questions.},
  keywords  = {Multimodal Learning, Multiple-Choice Questions, Question Answering, Video Question Answering, VideoQA, multimodal learning, natural language form, video question answering, video-language},
}