Dataset Groups Activity Stream CMB-Exam A large-scale Chinese benchmark for evaluating medical large language models. The dataset consists of 280,839 samples, with 74 tasks, and covers 24 departments and 150 diseases. BibTex:

@comment{
  Citation record for the CMB-Exam dataset, published by TIB (see the doi and url fields).
  The citation key is kept exactly as exported so that existing cite commands keep resolving.
  The exporter's placeholder institution value "No Organization" is omitted: it carries no
  information and would print as if it were a real institution.
}
@dataset{Junling_Liu_and_Peilin_Zhou_and_Yining_Hua_and_Dading_Chong_and_Zhongyu_Tian_and_Andrew_Liu_and_Helin_Wang_and_Chenyu_You_and_Zhenhua_Guo_and_Lei_Zhu_2024,
  author    = {Liu, Junling and Zhou, Peilin and Hua, Yining and Chong, Dading and Tian, Zhongyu and Liu, Andrew and Wang, Helin and You, Chenyu and Guo, Zhenhua and Zhu, Lei},
  title     = {{CMB-Exam}},
  year      = {2024},
  month     = dec,
  publisher = {TIB},
  doi       = {10.57702/06b9aln5},
  url       = {https://service.tib.eu/ldmservice/dataset/cmb-exam},
  keywords  = {Medical Diagnosis, Question Answering},
  abstract  = {A large-scale Chinese benchmark for evaluating medical large language models. The dataset consists of 280,839 samples, with 74 tasks, and covers 24 departments and 150 diseases.},
}