Dataset Groups Activity Stream LAMBADA The dataset used in the paper is a corpus of text containing approximately 10,000 examples, each a sequence of sentences extracted from books. BibTex:

% Citation record for the LAMBADA dataset as published through the TIB
% data-manager service (see the doi and url fields below).
%
% Maintenance notes:
%   * The citation key is kept exactly as exported so that existing cite
%     commands keep resolving. It contains non-ASCII characters, and the
%     dataset entry type is a biblatex type, so process this file with
%     biblatex + Biber in UTF-8 rather than classic 8-bit BibTeX.
%   * Author names are stored in "Last, First" form; the name parts are the
%     same as in the exported "First Last" form.
%   * The month uses the bare three-letter macro so styles can localise it.
%   * The title acronym is brace-protected against sentence-casing styles.
%   * The exporter's placeholder institution value ("No Organization") was
%     dropped, and the quoted list in the nonstandard "keyword" field was
%     rewritten as a plain comma-separated "keywords" field.
@dataset{Denis_Paperno_and_Germán_Kruszewski_and_Angeliki_Lazaridou_and_Quan_Ngoc_Pham_and_Raffaella_Bernardi_and_Sandro_Pezzelle_and_Marco_Baroni_and_Gemma_Boleda_and_Raquel_Fernández_2024,
  author    = {Paperno, Denis and
               Kruszewski, Germán and
               Lazaridou, Angeliki and
               Pham, Quan Ngoc and
               Bernardi, Raffaella and
               Pezzelle, Sandro and
               Baroni, Marco and
               Boleda, Gemma and
               Fernández, Raquel},
  title     = {{LAMBADA}},
  publisher = {TIB},
  year      = {2024},
  month     = dec,
  doi       = {10.57702/vh6wq2i6},
  url       = {https://service.tib.eu/ldmservice/dataset/lambada},
  keywords  = {Conversational AI, LAMBADA, Natural Language Processing, Question Answering, Text Data, discourse context, word prediction},
  abstract  = {The dataset used in the paper is a corpus of text containing approximately 10,000 examples, each a sequence of sentences extracted from books.},
}