Dataset Groups Activity Stream

Scientific Articles Corpus

The dataset used in this research is a large-scale academic corpus containing titles and abstracts of approximately 70 million scientific articles.

BibTeX:

@comment{
  Citation record for the "Scientific Articles Corpus" dataset
  (publisher TIB, DOI 10.57702/afihonf6).
  The citation key is kept exactly as exported so existing \cite commands
  continue to resolve.
  NOTE(review): institution = "No Organization" looks like an export
  placeholder rather than a real affiliation -- confirm, then correct or
  remove it.
  NOTE(review): given names are only available as initials in the export;
  replace them with full given names if they can be confirmed.
}

@dataset{HJ_Meijer_and_J_Truong_and_R_Karimi_2024,
  author      = {Meijer, H. J. and Truong, J. and Karimi, R.},
  title       = {Scientific Articles Corpus},
  year        = {2024},
  month       = dec,
  publisher   = {TIB},
  institution = {No Organization},
  doi         = {10.57702/afihonf6},
  url         = {https://service.tib.eu/ldmservice/dataset/scientific-articles-corpus},
  keywords    = {Academic Corpus, Scientific Articles, TFIDF, Word Embeddings},
  abstract    = {The dataset used in this research is a large-scale academic corpus containing titles and abstracts of approximately 70 million scientific articles.},
}