Dataset Groups Activity Stream
1 Billion Word Language Model Benchmark
The 1 Billion Word Language Model Benchmark is a dataset used for measuring progress in statistical language modeling, consisting of a large collection of text data.
BibTex:

@comment{
  Citation record for the 1 Billion Word Language Model Benchmark dataset.
  The citation key below is kept exactly as in the original record so that
  existing cite commands continue to resolve.
  The month is given as the bare three-letter macro (nov) so that the
  bibliography style, not this file, decides how it is rendered.
  NOTE(review): "Phillipp Koehn" may be a misspelling of "Philipp Koehn" --
  confirm against the upstream record before changing; the key embeds the
  same spelling.
  NOTE(review): the institution value "No Organization" looks like an export
  placeholder -- confirm, and drop the field if so.
}

@dataset{Ciprian_Chelba_and_Tomas_Mikolov_and_Mike_Schuster_and_Qi_Ge_and_Thorsten_Brants_and_Phillipp_Koehn_and_Tony_Robinson_2024,
  author      = {Chelba, Ciprian and Mikolov, Tomas and Schuster, Mike and Ge, Qi and Brants, Thorsten and Koehn, Phillipp and Robinson, Tony},
  title       = {1 Billion Word Language Model Benchmark},
  publisher   = {TIB},
  institution = {No Organization},
  year        = {2024},
  month       = nov,
  doi         = {10.57702/969ckti0},
  url         = {https://service.tib.eu/ldmservice/dataset/1-billion-word-language-model-benchmark},
  abstract    = {The 1 Billion Word Language Model Benchmark is a dataset used for measuring progress in statistical language modeling, consisting of a large collection of text data.},
}