Dataset Groups Activity Stream
Lang-84
The dataset used in this paper is a collection of parallel sentence pairs from 96 different native languages, with at least 10,000 sentence pairs per language.
BibTeX:

@comment{
  The free text above lies outside any entry and is ignored by BibTeX and Biber.
  Citation record for the Lang-84 dataset as published by TIB.
  NOTE(review): the institution value "No Organization" looks like an export
  placeholder; confirm with the data provider before relying on it.
}

@dataset{Yuanyuan_Zhao_and_Weiwei_Sun_and_Xiaojun_Wan_2025,
  author      = {Zhao, Yuanyuan and Sun, Weiwei and Wan, Xiaojun},
  title       = {Lang-84},
  institution = {No Organization},
  publisher   = {TIB},
  year        = {2025},
  month       = jan,
  doi         = {10.57702/uyqnrio1},
  url         = {https://service.tib.eu/ldmservice/dataset/lang-84},
  keywords    = {native languages, parallel sentence pairs, second language acquisition},
  abstract    = {The dataset used in this paper is a collection of parallel sentence pairs from 96 different native languages, with at least 10,000 sentence pairs per language.},
}