Dataset Groups Activity Stream TaoMultimodal Dataset A large-scale dataset for multi-modal pretraining in Chinese, consisting of 3.1M image-text pairs from the mobile Taobao platform. BibTex:

% Citation record for the TaoMultimodal Dataset as published by TIB.
% The citation key is kept exactly as exported so existing citations keep resolving.
% month uses the predefined macro (nov) so styles can expand and localise it.
% The camelCase name in the title is brace-protected against sentence-casing styles.
% NOTE(review): institution "No Organization" looks like an export placeholder; confirm before relying on it.
@dataset{Junyang_Lin_and_An_Yang_and_Yichang_Zhang_and_Jie_Liu_and_Jingren_Zhou_and_Hongxia_Yang_2024,
  author      = {Lin, Junyang and Yang, An and Zhang, Yichang and Liu, Jie and Zhou, Jingren and Yang, Hongxia},
  title       = {{TaoMultimodal} Dataset},
  year        = {2024},
  month       = nov,
  publisher   = {TIB},
  institution = {No Organization},
  doi         = {10.57702/q49virdf},
  url         = {https://service.tib.eu/ldmservice/dataset/taomultimodal-dataset},
  abstract    = {A large-scale dataset for multi-modal pretraining in Chinese, consisting of 3.1M image-text pairs from the mobile Taobao platform.},
}