@comment{
  Dataset Groups Activity Stream CCNet
  The dataset used in the paper to train the Toolformer model.
  BibTeX:

  Notes for maintainers:
  - The citation key below is kept exactly as exported so existing \cite
    commands keep resolving. It contains non-ASCII characters, so it needs a
    UTF-8-aware toolchain (biblatex + Biber); classic BibTeX may reject it.
  - The export carried the placeholder institution value "No Organization";
    it is omitted from the entry because it is not real bibliographic data.
}

@dataset{Julien_Launay_and_Elena_Tommasone_and_Baptiste_Pannier_and_François_Boniface_and_Amélie_Chatelain_and_Alessandro_Cappelli_and_Iacopo_Poli_and_Djamé_Seddah_2024,
  author    = {Launay, Julien and Tommasone, Elena and Pannier, Baptiste and Boniface, François and Chatelain, Amélie and Cappelli, Alessandro and Poli, Iacopo and Seddah, Djamé},
  title     = {{CCNet}},
  publisher = {TIB},
  year      = {2024},
  month     = dec,
  doi       = {10.57702/ud3pyqy2},
  url       = {https://service.tib.eu/ldmservice/dataset/ccnet},
  keywords  = {CCNet, French Language, Language models, Text Data, Text datasets},
  abstract  = {The dataset used in the paper to train the Toolformer model.},
}