Dataset Groups Activity Stream

AISHELL-1

The AISHELL-1 dataset is a Mandarin speech corpus, consisting of 178 hours of speech, with 11 domains and 400 speakers from different accent areas in China.

BibTeX:

@comment{
  Citation record for the AISHELL-1 Mandarin speech corpus.
  Notes for maintainers:
  - The citation key is kept exactly as originally exported so existing
    cite commands keep resolving.
  - month uses the bare dec macro (not a braced string) so each style can
    expand it to its own month name.
  - keywords is a plain comma-separated list; the exported value was a
    quoted list stored under the unrecognised field name keyword.
  - The exported institution value (No Organization) was a placeholder for
    a missing value and has been dropped.
  - The title is wrapped in an extra brace pair because it is an acronym
    that sentence-casing styles would otherwise lowercase.
}

@dataset{Hui_Bu_and_Jiayu_Du_and_Xingyu_Na_and_Bengu_Wu_and_Hao_Zheng_2024,
  author    = {Bu, Hui and Du, Jiayu and Na, Xingyu and Wu, Bengu and Zheng, Hao},
  title     = {{AISHELL-1}},
  year      = {2024},
  month     = dec,
  publisher = {TIB},
  doi       = {10.57702/625tb6gv},
  url       = {https://service.tib.eu/ldmservice/dataset/aishell-1},
  keywords  = {AISHELL, AISHELL-1, ASR, Audio, Chinese Speech, Mandarin, Mandarin speech corpus, Speech Corpus, Speech Recognition},
  abstract  = {The AISHELL-1 dataset is a Mandarin speech corpus, consisting of 178 hours of speech, with 11 domains and 400 speakers from different accent areas in China.},
}