Dataset Groups Activity Stream
Language Models of Spoken Dutch
The dataset consists of subtitles of television shows provided by the Flemish public-service broadcaster VRT. The dataset is used to train language models of spoken Dutch.
BibTeX:

@dataset{Lyan_Verwimp_and_Joris_Pelemans_and_Marieke_Lycke_and_Hugo_Van_hamme_and_Patrick_Wambacq_2024,
  author      = {Verwimp, Lyan and Pelemans, Joris and Lycke, Marieke and {Van hamme}, Hugo and Wambacq, Patrick},
  title       = {Language Models of Spoken {Dutch}},
  abstract    = {The dataset consists of subtitles of television shows provided by the Flemish public-service broadcaster VRT. The dataset is used to train language models of spoken Dutch.},
  keywords    = {language models, natural language processing, speech recognition, spoken Dutch},
  institution = {No Organization},
  publisher   = {{TIB}},
  year        = {2024},
  month       = dec,
  doi         = {10.57702/i8b340q8},
  url         = {https://service.tib.eu/ldmservice/dataset/language-models-of-spoken-dutch},
}