Dataset Groups Activity Stream SIGHAN Datasets The SIGHAN datasets are used for the Chinese Spelling Check (CSC) task, with a limited number of Chinese characters and their corresponding errors. BibTeX: @dataset{Wangxuan_Institute_of_Computer_Technology_Peking_University_and_Center_for_Data_Science_Peking_University_and_The_MOE_Key_Laboratory_of_Computational_Linguistics_Peking_University_2024, abstract = {The SIGHAN datasets are used for Chinese Spelling Check (CSC) task, with a limited number of Chinese characters and their corresponding errors.}, author = {Wangxuan Institute of Computer Technology, Peking University and Center for Data Science, Peking University and The MOE Key Laboratory of Computational Linguistics, Peking University}, doi = {10.57702/yoqrix0i}, institution = {No Organization}, keyword = {'Chinese Language Processing', 'Chinese Spelling Check', 'Natural Language Processing'}, month = {dec}, publisher = {TIB}, title = {SIGHAN Datasets}, url = {https://service.tib.eu/ldmservice/dataset/sighan-datasets}, year = {2024} }