Dataset Groups Activity Stream Sparse-MLP Mixture-of-Experts (MoE) architecture, conditional computing, cross-token modeling, Sparse-MLP model BibTex:

@comment{
  Citation record for the Sparse-MLP dataset entry published by TIB.
  The first line of this file is page text carried over from the export;
  it lies outside the entry, so BibTeX ignores it.

  Notes on the entry below:
  - Author names use the unambiguous Last, First form.
  - The title word is wrapped in an extra brace pair so that styles which
    apply sentence casing do not lowercase the MLP acronym.
  - month uses the predefined three-letter macro, unquoted.
  - keywords is a plain comma-separated list.
  - NOTE(review): institution still holds the exporter's placeholder value;
    confirm whether it should be replaced or dropped.
}

@dataset{Yuxuan_Lou_and_Fuzhao_Xue_and_Zangwei_Zheng_and_Yang_You_2024,
  author      = {Lou, Yuxuan and Xue, Fuzhao and Zheng, Zangwei and You, Yang},
  title       = {{Sparse-MLP}},
  abstract    = {Mixture-of-Experts (MoE) architecture, conditional computing, cross-token modeling, Sparse-MLP model},
  keywords    = {Conditional computing, Cross-token modeling, MoE, Sparse-MLP},
  institution = {No Organization},
  publisher   = {TIB},
  year        = {2024},
  month       = dec,
  doi         = {10.57702/02fcg827},
  url         = {https://service.tib.eu/ldmservice/dataset/sparse-mlp},
}