Dataset Groups Activity Stream CC3M and CC12M CC3M and CC12M are used as datasets for training and evaluation BibTex:

% Dataset record for "CC3M and CC12M", published by TIB (DOI 10.57702/bq2f1bvq).
% The citation key is kept exactly as exported so existing citations still resolve.
% Cleanup relative to the raw export:
%   - month uses the bare three-letter macro so the style can expand it;
%   - acronyms in the title are brace-protected against sentence-casing;
%   - keywords is a plain comma-separated list (exporter quote marks removed);
%   - the exporter's placeholder institution value (No Organization) is omitted.
@dataset{Chenhao_Zheng_and_Jieyu_Zhang_and_Aniruddha_Kembhavi_and_Ranjay_Krishna_2024,
  author    = {Zheng, Chenhao and Zhang, Jieyu and Kembhavi, Aniruddha and Krishna, Ranjay},
  title     = {{CC3M} and {CC12M}},
  publisher = {TIB},
  year      = {2024},
  month     = dec,
  doi       = {10.57702/bq2f1bvq},
  url       = {https://service.tib.eu/ldmservice/dataset/cc3m-and-cc12m},
  keywords  = {CC12M, CC3M, compositionality, vision-language models},
  abstract  = {CC3M and CC12M are used as datasets for training and evaluation},
}