Dataset Groups Activity Stream OntoNotes dataset The OntoNotes dataset contains 3.4M automatically labeled entity mentions for training and 11k manually annotated instances that are split into 8k for dev set and 2k for test set. BibTex:

% Citation record for the OntoNotes dataset published by TIB (DOI 10.57702/tle1s0pp).
% The citation key is kept exactly as exported so existing citations keep resolving.
% The exporter placeholder institution value (No Organization) is dropped: it carries no information.
% The month uses the bare three-letter macro so the style can localise and format it.
@dataset{Bangzheng_Li_and_Wenpeng_Yin_and_Muhao_Chen_2024,
  author    = {Li, Bangzheng and Yin, Wenpeng and Chen, Muhao},
  title     = {{OntoNotes} dataset},
  year      = {2024},
  month     = dec,
  publisher = {TIB},
  doi       = {10.57702/tle1s0pp},
  url       = {https://service.tib.eu/ldmservice/dataset/ontonotes-dataset},
  keywords  = {OntoNotes, dataset, named entity recognition},
  abstract  = {The OntoNotes dataset contains 3.4M automatically labeled entity mentions for training and 11k manually annotated instances that are split into 8k for dev set and 2k for test set.},
}