% Laion-5b -- a large-scale dataset of text and images for training
% next-generation language models.
%
% Citation record for the dataset page given in the url field below.
% The words "Dataset", "Groups" and "Activity Stream" that preceded this
% entry in the original text look like page navigation labels rather than
% citation data (NOTE(review): confirm against the source page).
%
% Cleanup applied to the exported entry (citation key and data unchanged):
%   - month uses the bare three-letter macro so styles can expand it;
%   - keywords is a plain comma-separated list, without the quote
%     characters left over from the export;
%   - the placeholder institution value "No Organization" was dropped;
%   - author names are written in the unambiguous "Last, First" form.
@dataset{C_Schuhmann_and_R_Beaumont_and_R_Vencu_and_C_Gordon_and_R_Wightman_and_M_Cherti_and_T_Coombes_and_A_Katta_and_C_Mullis_and_M_Wortsman_2024,
  author    = {Schuhmann, C. and Beaumont, R. and Vencu, R. and Gordon, C. and Wightman, R. and Cherti, M. and Coombes, T. and Katta, A. and Mullis, C. and Wortsman, M.},
  title     = {Laion-5b},
  year      = {2024},
  month     = dec,
  publisher = {TIB},
  doi       = {10.57702/a73taznq},
  url       = {https://service.tib.eu/ldmservice/dataset/laion-5b},
  keywords  = {Language Models, Scene Understanding, Text-Image Models},
  abstract  = {A large-scale dataset of text and images for training next-generation language models.},
}