@comment{
  English Noun Dataset

  The dataset used for clustering contains the 2000 most frequent nouns in
  the British National Corpus (BNC) and the English Gigaword corpus.

  Page text captured together with this record: "Dataset Groups Activity Stream".

  Notes for maintainers:
  - The citation key is kept exactly as exported so existing citations keep resolving.
  - month uses the bare macro dec so each style can expand it.
  - institution holds the value "No Organization", which looks like an
    exporter placeholder -- TODO confirm before relying on it.
}

@dataset{Ekaterina_Shutova_and_Patricia_Lichtenstein_2024,
  author      = {Shutova, Ekaterina and Lichtenstein, Patricia},
  title       = {{English} Noun Dataset},
  year        = {2024},
  month       = dec,
  publisher   = {TIB},
  institution = {No Organization},
  doi         = {10.57702/uoj6k3ha},
  url         = {https://service.tib.eu/ldmservice/dataset/english-noun-dataset},
  keywords    = {natural language processing, noun clustering, text mining},
  abstract    = {The dataset used for clustering contains the 2000 most frequent nouns in the British National Corpus (BNC) and the English Gigaword corpus.},
}