% Dataset Groups Activity Stream
% OSCAR corpus
% The dataset used in this study is the OSCAR corpus, which is a multilingual
% corpus that is obtained by filtering of the Common Crawl corpus.
%
% BibTeX record for the dataset described above.
%
% Notes for maintainers:
%   - The citation key is kept exactly as exported so that existing citations
%     keep resolving. It contains a non-ASCII character, so it needs a
%     UTF-8-aware backend (e.g. Biber); classic 8-bit BibTeX may reject it.
%   - The author field also uses raw UTF-8, for the same reason.
%   - The export carried a placeholder institution value of 'No Organization';
%     it is omitted here because it is not real metadata.
%   - month uses the predefined macro (bare, no braces) so styles can
%     localise or abbreviate it.
@dataset{Cagri_Toraman_and_Eyup_Halit_Yilmaz_and_Furkan_Şahinuç_and_Oguzan_Ozcelik_2024,
  author    = {Toraman, Cagri and Yilmaz, Eyup Halit and Şahinuç, Furkan and Ozcelik, Oguzan},
  title     = {{OSCAR} corpus},
  abstract  = {The dataset used in this study is the OSCAR corpus, which is a multilingual corpus that is obtained by filtering of the Common Crawl corpus.},
  keywords  = {Corpus, Multilingual, OSCAR},
  publisher = {TIB},
  year      = {2024},
  month     = dec,
  doi       = {10.57702/o8r3jeh0},
  url       = {https://service.tib.eu/ldmservice/dataset/oscar-corpus},
}