% Page text that accompanied this record (it sits outside the entry, so BibTeX ignores it):
%   Dataset Groups Activity Stream
%   CoVoST2
%   The dataset used for the speech translation task, which consists of multilingual speech data.
%   BibTeX:

@dataset{Puyuan_Peng_and_Brian_Yan_and_Shinji_Watanabe_and_David_Harwath_2025,
  author      = {Peng, Puyuan and Yan, Brian and Watanabe, Shinji and Harwath, David},
  title       = {{CoVoST2}},
  publisher   = {TIB},
  institution = {No Organization},
  year        = {2025},
  month       = jan,
  doi         = {10.57702/c686okph},
  url         = {https://service.tib.eu/ldmservice/dataset/covost2},
  keywords    = {CoVoST2, Speech Recognition, multilingual speech, translation},
  abstract    = {The dataset used for the speech translation task, which consists of multilingual speech data.},
}