% Page text captured together with this record:
%   Dataset Groups Activity Stream
%   FIT: Far-reaching Interleaved Transformers
%   We present FIT: a transformer-based architecture with efficient
%   self-attention and adaptive computation.
%   BibTeX:
%
% The citation key below is kept exactly as exported so that existing
% citations of this record continue to resolve.
@dataset{Ting_Chen_and_Lala_Li_2024,
  author    = {Chen, Ting and Li, Lala},
  title     = {{FIT}: Far-reaching Interleaved Transformers},
  year      = {2024},
  month     = dec,
  publisher = {TIB},
  doi       = {10.57702/gnm0np91},
  url       = {https://service.tib.eu/ldmservice/dataset/fit--far-reaching-interleaved-transformers},
  keywords  = {image generation, image understanding, transformer-based architecture},
  abstract  = {We present FIT: a transformer-based architecture with efficient self-attention and adaptive computation.},
}