@comment{
  UKWaC and Wackypedia corpora.
  The dataset used in this paper is a large text corpus compiled from
  UKWaC and Wackypedia corpora.

  Notes on the record below:
  - The citation key is kept exactly as exported so existing citations resolve.
  - The exporter's placeholder institution value "No Organization" was dropped;
    add a real institution/organization field if one is known.
  - month uses the predefined dec macro (unbraced) so styles can localise it.
}

@dataset{Ka_Chun_Lam_and_Francisco_Pereira_and_Maryam_Vaziri-Pashkam_and_Kristin_Woodard_and_Emalie_McMahon_2024,
  author    = {Lam, Ka Chun and Pereira, Francisco and Vaziri-Pashkam, Maryam and Woodard, Kristin and McMahon, Emalie},
  title     = {{UKWaC} and {Wackypedia} corpora},
  publisher = {TIB},
  year      = {2024},
  month     = dec,
  doi       = {10.57702/dr3xmeq3},
  url       = {https://service.tib.eu/ldmservice/dataset/ukwac-and-wackypedia-corpora},
  keywords  = {corpus, natural language processing, text analysis, text corpora},
  abstract  = {The dataset used in this paper is a large text corpus compiled from UKWaC and Wackypedia corpora.},
}