Dataset Groups Activity Stream Okapi
The dataset is used for instruction-tuning of LLMs in multiple languages using reinforcement learning from human feedback.
BibTeX:

Text outside an entry is ignored by BibTeX, so the lines above and this note act as comments.
Entry for the Okapi dataset record published by TIB (DOI 10.57702/veefae2j).
NOTE(review): institution = {No Organization} looks like an export placeholder; confirm or drop before citing.
NOTE(review): the surname of the third author is taken to be the compound "Pouran Ben Veyseh"; confirm.

@dataset{Viet_Dac_Lai_and_Nghia_Trung_Ngo_and_Amir_Pouran_Ben_Veyseh_and_Hieu_Man_and_Franck_Dernoncourt_and_Trung_Bui_and_Thien_Huu_Nguyen_2024,
  author      = {Lai, Viet Dac and Ngo, Nghia Trung and Pouran Ben Veyseh, Amir and Man, Hieu and Dernoncourt, Franck and Bui, Trung and Nguyen, Thien Huu},
  title       = {Okapi},
  abstract    = {The dataset is used for instruction-tuning of LLMs in multiple languages using reinforcement learning from human feedback.},
  keywords    = {Human Feedback, Instruction Tuning, LLMs, Reinforcement Learning},
  institution = {No Organization},
  publisher   = {TIB},
  year        = {2024},
  month       = dec,
  doi         = {10.57702/veefae2j},
  url         = {https://service.tib.eu/ldmservice/dataset/okapi},
}