% Text that preceded the entry in the original export, kept verbatim.
% BibTeX ignores it because it sits outside any entry:
%   Dataset Groups Activity Stream
%   UltraRM-13B
%   The UltraRM-13B dataset is a collection of human feedback for language model training.
%   BibTex:
%
% Dataset record for UltraRM-13B (publisher field: TIB; DOI and landing URL below).
% Review notes:
%   - The citation key is kept exactly as exported so existing \cite commands
%     still resolve.
%   - Author names use the "Last, First" form so name parsing is unambiguous.
%   - The title is brace-protected so sentence-casing styles keep "UltraRM-13B".
%   - month uses the predefined macro (unbraced) so styles can localise it.
%   - institution holds the value "No Organization"; presumably an exporter
%     placeholder rather than a real organization -- TODO confirm or remove.
@dataset{Zeqiu_Wu_and_Yushi_Hu_and_Weijia_Shi_and_Nouha_Dziri_and_Alane_Suhr_and_Prithviraj_Ammanabrolu_and_Noah_A_Smith_and_Mari_Ostendorf_and_Hannaneh_Hajishirzi_2024,
  author      = {Wu, Zeqiu and Hu, Yushi and Shi, Weijia and Dziri, Nouha and Suhr, Alane and Ammanabrolu, Prithviraj and Smith, Noah A. and Ostendorf, Mari and Hajishirzi, Hannaneh},
  title       = {{UltraRM-13B}},
  publisher   = {TIB},
  institution = {No Organization},
  year        = {2024},
  month       = dec,
  doi         = {10.57702/qljyhr74},
  url         = {https://service.tib.eu/ldmservice/dataset/ultrarm-13b},
  keywords    = {Human Feedback, Language Model Training},
  abstract    = {The UltraRM-13B dataset is a collection of human feedback for language model training.},
}