Dataset Groups Activity Stream

MARIO-LAION

The MARIO-LAION dataset is a subset of the LAION-400M dataset, containing 9,194,613 high-quality text images with corresponding captions.

BibTeX:

@dataset{Christoph_Schuhmann_and_Richard_Vencu_and_Romain_Beaumont_and_Robert_Kaczmarczyk_and_Clayton_Mullis_and_Aarush_Katta_and_Theo_Coombes_and_Jenia_Jitsev_and_Aran_Komatsuzaki_2024,
  author      = {Schuhmann, Christoph and Vencu, Richard and Beaumont, Romain and Kaczmarczyk, Robert and Mullis, Clayton and Katta, Aarush and Coombes, Theo and Jitsev, Jenia and Komatsuzaki, Aran},
  title       = {{MARIO-LAION}},
  year        = {2024},
  month       = dec,
  publisher   = {TIB},
  institution = {No Organization},
  doi         = {10.57702/nirgollz},
  url         = {https://service.tib.eu/ldmservice/dataset/mario-laion},
  keywords    = {captions, image-text pairs, text recognition},
  abstract    = {The MARIO-LAION dataset is a subset of the LAION-400M dataset, containing 9,194,613 high-quality text images with corresponding captions.},
}