Dataset Groups Activity Stream Open Subtitles dataset The Open Subtitles dataset consists of transcriptions of spoken dialog in movies and television shows. BibTeX: @dataset{Pavel_Sountsov_and_Sunita_Sarawagi_2024, abstract = {The Open Subtitles dataset consists of transcriptions of spoken dialog in movies and television shows.}, author = {Pavel Sountsov and Sunita Sarawagi}, doi = {10.57702/g079m54y}, institution = {No Organization}, keyword = {Natural Language Processing, Speech Recognition}, month = {dec}, publisher = {TIB}, title = {Open Subtitles dataset}, url = {https://service.tib.eu/ldmservice/dataset/open-subtitles-dataset}, year = {2024} }