Dataset Groups Activity Stream VILLA The dataset used in the paper for vision-and-language representation learning. BibTex:

% Citation record for the VILLA dataset (DOI and landing-page URL below).
% Text outside the entry is ignored by BibTeX/Biber.
% NOTE(review): `institution` holds what looks like an exporter placeholder
% ("No Organization") -- confirm whether it should be kept or removed.
@dataset{Zhe_Gan_and_Yen-Chun_Chen_and_Linjie_Li_and_Chen_Zhu_and_Yu_Cheng_and_Jingjing_Liu_2024,
  author      = {Gan, Zhe and Chen, Yen-Chun and Li, Linjie and Zhu, Chen and Cheng, Yu and Liu, Jingjing},
  title       = {{VILLA}},
  abstract    = {The dataset used in the paper for vision-and-language representation learning.},
  keywords    = {adversarial training, representation learning, vision-and-language},
  institution = {No Organization},
  publisher   = {TIB},
  year        = {2024},
  month       = dec,
  doi         = {10.57702/1i9ozblf},
  url         = {https://service.tib.eu/ldmservice/dataset/villa},
}