Dataset Groups Activity Stream FastText

The FastText dataset is a subword token embedding model. It produces a vector representation of a word based on composing embeddings of the character n-grams composing the word.

BibTeX:

% Citation record for the FastText dataset as published by TIB (see doi/url below).
% Review notes:
%   - authors are stored in "Last, First" form so name parsing is unambiguous
%   - the title is brace-protected so styles that re-case titles keep "FastText" intact
%   - month uses the bare predefined macro rather than a braced string
%   - keywords is a plain comma-separated list (quote characters removed and the
%     case-only duplicate "text classification" collapsed into one item)
%   - the placeholder institution value "No Organization" is omitted
@dataset{Piotr_Bojanowski_and_Edouard_Grave_and_Armand_Joulin_and_Tomas_Mikolov_2024,
  author    = {Bojanowski, Piotr and Grave, Edouard and Joulin, Armand and Mikolov, Tomas},
  title     = {{FastText}},
  year      = {2024},
  month     = dec,
  publisher = {TIB},
  doi       = {10.57702/ce7c3j4u},
  url       = {https://service.tib.eu/ldmservice/dataset/fasttext},
  keywords  = {FastText, Subword Modeling, Text Classification, Word Embeddings, language modeling, subword token embeddings},
  abstract  = {The FastText dataset is a subword token embedding model. It produces a vector representation of a word based on composing embeddings of the character n-grams composing the word.},
}