@comment{
  Text captured from the dataset landing page along with the entry below.
  Page header: Dataset | Groups | Activity Stream
  TED: The dataset is used for document-level neural machine translation.
  It contains 0.23M training sentences, 0.31M development sentences, and
  0.21M test sentences.

  The citation key is the one exported by the page; it is kept unchanged so
  existing citations of this entry still resolve.

  NOTE(review): the development split (0.31M) is listed as larger than the
  training split (0.23M). Figures are reproduced as exported; confirm them
  against the dataset record before relying on them.
}

@dataset{Xiaomian_Kang_and_Yang_Zhao_and_Jiajun_Zhang_and_Chengqing_Zong_2024,
  author    = {Kang, Xiaomian and Zhao, Yang and Zhang, Jiajun and Zong, Chengqing},
  title     = {{TED}},
  publisher = {TIB},
  year      = {2024},
  month     = dec,
  doi       = {10.57702/3qf38r9f},
  url       = {https://service.tib.eu/ldmservice/dataset/ted},
  keywords  = {Corpus, Document-level Neural Machine Translation, Machine Translation, TED},
  abstract  = {The dataset is used for document-level neural machine translation. It contains 0.23M training sentences, 0.31M development sentences, and 0.21M test sentences.},
}