Dataset | Groups | Activity Stream

DiDeMo

The DiDeMo dataset is a large-scale video-text dataset containing 10,000 videos and 40,000 annotations.

BibTeX:

@dataset{H_Luo_and_L_Ji_and_M_Zhong_and_Y_Chen_and_W_Lei_and_D_Duan_and_T_Li_and_J_Bharti_and_M_Zhou_2024,
  abstract = {The DiDeMo dataset is a large-scale video-text dataset, containing 10,000 videos and 40,000 annotations.},
  author = {H. Luo and L. Ji and M. Zhong and Y. Chen and W. Lei and D. Duan and T. Li and J. Bharti and M. Zhou},
  doi = {10.57702/d8wjkgdy},
  institution = {No Organization},
  keyword = {DiDeMo, Large-Scale Dataset, Text Video Retrieval, Video-Text Retrieval, multimodal learning, temporal activity localization, text-video retrieval, video analysis},
  month = {dec},
  publisher = {TIB},
  title = {DiDeMo},
  url = {https://service.tib.eu/ldmservice/dataset/didemo},
  year = {2024}
}