@comment{
  Librispeech: The Librispeech dataset is a large-scale speaker-dependent
  speech corpus containing 1080 hours of speech, 5600 utterances, and
  1000 speakers.

  The BibTeX entry below was exported from the dataset landing page given
  in its url field.

  NOTE(review): the description and the abstract are reproduced as exported;
  the figures quoted in them have not been checked against the original
  corpus publication -- confirm before relying on them.
}

@dataset{Vassil_Panayotov_and_Guoguo_Chen_and_Daniel_Povey_and_Sanjeev_Khudanpur_2024,
  author    = {Panayotov, Vassil and Chen, Guoguo and Povey, Daniel and Khudanpur, Sanjeev},
  title     = {Librispeech},
  year      = {2024},
  month     = nov,
  publisher = {TIB},
  doi       = {10.57702/q6hix4xm},
  url       = {https://service.tib.eu/ldmservice/dataset/librispeech},
  keywords  = {ASR, ASR corpus, Audio, Audio Book Recordings, Audio Data, Audio Recordings, Corpus, Large-scale, Librispeech, Machine Translation, Multilingual, Public Domain, Recognition, Speech, Speech Recognition, Speech Research, Unlabeled Data, audio, audio books, audio corpus, audio dataset, audio processing, corpus, domain mismatch, librispeech, recognition, self-supervised learning, speech, speech recognition},
  abstract  = {The Librispeech dataset is a large-scale speaker-dependent speech corpus containing 1080 hours of speech, 5600 utterances, and 1000 speakers.},
}