% Dataset Groups Activity Stream
% High Quality Image Text Pairs
% The High Quality Image Text Pairs (HQITP-134M) dataset consists of 134 million
% diverse and high-quality images paired with descriptive captions and titles.
%
% BibTeX record for the dataset (text outside the entry is ignored by BibTeX).
% NOTE(review): institution = {No Organization} looks like an export placeholder;
% it is kept unchanged here -- confirm whether it should be dropped or replaced.
@dataset{Kanchana_Ranasinghe_and_Brandon_McKinzie_and_Sachin_Ravi_and_Yinfei_Yang_and_Alexander_Toshev_and_Jonathon_Shlens_2024,
  author      = {Ranasinghe, Kanchana and McKinzie, Brandon and Ravi, Sachin and Yang, Yinfei and Toshev, Alexander and Shlens, Jonathon},
  title       = {High Quality Image Text Pairs},
  institution = {No Organization},
  publisher   = {TIB},
  year        = {2024},
  month       = dec,
  doi         = {10.57702/3jwb7syv},
  url         = {https://service.tib.eu/ldmservice/dataset/high-quality-image-text-pairs},
  keywords    = {image captioning, large-scale image-text pairs, visual question answering},
  abstract    = {The High Quality Image Text Pairs (HQITP-134M) dataset consists of 134 million diverse and high-quality images paired with descriptive captions and titles.},
}