Dataset Groups Activity Stream
AlpacaFarm
The AlpacaFarm dataset is a large-scale dataset for preference optimization, which consists of a set of instructions and their corresponding responses.
BibTex:

% Review notes (text outside an entry is ignored by BibTeX and Biber):
%  - The citation key is unchanged so existing cite commands keep resolving.
%  - Authors are stored in the unambiguous "Last, First" form.
%  - The title is brace-protected so sentence-casing styles keep the camelCase.
%  - month uses the predefined bare macro rather than a braced literal.
%  - keywords is a plain comma-separated list; the exporter had wrapped each
%    item in single quotes, which made the quotes part of every keyword.
%    All original keyword strings are kept, including the case variants.
%  - NOTE(review): the exporter emitted an institution field whose value was
%    "No Organization"; it looked like a placeholder and was dropped so it
%    cannot be printed as a real institution. Confirm against the record.
@dataset{Simeng_Sun_and_Dhawal_Gupta_and_Mohit_Iyyer_2024,
  author    = {Sun, Simeng and Gupta, Dhawal and Iyyer, Mohit},
  title     = {{AlpacaFarm}},
  publisher = {TIB},
  year      = {2024},
  month     = dec,
  doi       = {10.57702/mm36ydlf},
  url       = {https://service.tib.eu/ldmservice/dataset/alpacafarm},
  keywords  = {Human Feedback, Language Model Alignment, Language Model Training, Preference Optimization, human feedback, instruction following, language model, question answering, task-oriented dialogue},
  abstract  = {The AlpacaFarm dataset is a large-scale dataset for preference optimization, which consists of a set of instructions and their corresponding responses.},
}