Dataset Groups Activity Stream WikiWeb2M WikiWeb2M is a page-level multimodal Wikipedia dataset. BibTex:

% Citation record for the WikiWeb2M dataset (DOI 10.57702/8b7m43mm, publisher TIB).
% Text outside an entry is ignored by BibTeX, so these notes and the page text
% above do not affect the parsed record.
%
% Conventions applied to this entry:
%   - author names use the unambiguous "Last, First" form, joined with " and ";
%   - the title is brace-protected so sentence-casing styles keep "WikiWeb2M" intact;
%   - month uses the bare three-letter macro so each style can expand or localise it;
%   - keywords is a plain comma-separated list in the biblatex "keywords" field.
%
% NOTE(review): the "dataset" entry type is a biblatex type; classic BibTeX styles
% may not know it and may fall back to a generic layout -- confirm the target toolchain.
% NOTE(review): institution "No Organization" looks like an export placeholder;
% kept unchanged here -- confirm whether it should be removed.
% The citation key is left exactly as exported so existing citations keep resolving.

@dataset{Andrea_Burns_and_Krishna_Srinivasan_and_Joshua_Ainslie_and_Geoff_Brown_and_Bryan_A_Plummer_and_Kate_Saenko_and_Jianmo_Ni_and_Mandy_Guo_2025,
  author      = {Burns, Andrea and Srinivasan, Krishna and Ainslie, Joshua and Brown, Geoff and Plummer, Bryan A. and Saenko, Kate and Ni, Jianmo and Guo, Mandy},
  title       = {{WikiWeb2M}},
  year        = {2025},
  month       = jan,
  publisher   = {TIB},
  institution = {No Organization},
  doi         = {10.57702/8b7m43mm},
  url         = {https://service.tib.eu/ldmservice/dataset/wikiweb2m},
  keywords    = {multimodal wikipedia, page-level dataset, question answering},
  abstract    = {WikiWeb2M is a page-level multimodal Wikipedia dataset.},
}