Dataset Groups Activity Stream BIG-Bench Hard The BIG-Bench Hard dataset is derived from the original BIG-Bench evaluation suite, focusing on tasks that pose challenges to existing language models. BibTex:

% Citation record for the BIG-Bench Hard dataset (publisher: TIB; see the doi and url fields).
% The citation key is kept exactly as exported so existing cite commands keep resolving.
% Authors are stored in "Last, First" form so that no lowercase name token is
% mistaken for a "von" particle when the names are parsed.
% NOTE(review): the umlaut in Scharli and the hyphen in Huai-hsin were restored from the
% published author list -- confirm against the DOI landing page.
% NOTE(review): institution "No Organization" looks like an exporter placeholder; kept
% as-is -- drop it if the target style prints it.
@dataset{Mirac_Suzgun_and_Nathan_Scales_and_Nathanael_Scharli_and_Sebastian_Gehrmann_and_Yi_Tay_and_Hyung_Won_Chung_and_Aakanksha_Chowdhery_and_Quoc_V_Le_and_Ed_Huai_hsin_Chi_and_Denny_Zhou_and_Jason_Wei_2024,
  author      = {Suzgun, Mirac and Scales, Nathan and Sch{\"a}rli, Nathanael and Gehrmann, Sebastian and Tay, Yi and Chung, Hyung Won and Chowdhery, Aakanksha and Le, Quoc V. and Chi, Ed Huai-hsin and Zhou, Denny and Wei, Jason},
  title       = {{BIG-Bench} {Hard}},
  year        = {2024},
  month       = dec,
  publisher   = {TIB},
  institution = {No Organization},
  doi         = {10.57702/jczynul3},
  url         = {https://service.tib.eu/ldmservice/dataset/big-bench-hard},
  keywords    = {Benchmark, Language Models, Natural Language Processing, challenges, language models},
  abstract    = {The BIG-Bench Hard dataset is derived from the original BIG-Bench evaluation suite, focusing on tasks that pose challenges to existing language models.},
}