% Scraped page header, kept verbatim. It lies outside any entry, so BibTeX
% and Biber ignore it.
%
%   Dataset Groups Activity Stream
%   Noisy MNIST
%   The MNIST environment does not elicit any actions from an agent. Instead,
%   the prediction network simply needs to learn one step mappings between
%   pairs of MNIST handwritten digits.
%   BibTex:
%
% Citation record for the "Noisy MNIST" dataset (DOI 10.57702/kvnobzaf),
% published by TIB in December 2024.
%
% Review notes:
%   - The citation key is unchanged so existing citations keep resolving.
%   - Authors are stored in "Last, First" form so the hyphenated surname and
%     the middle initials are parsed unambiguously.
%   - MNIST is brace-protected in the title so sentence-casing styles do not
%     lowercase the acronym.
%   - month uses the predefined dec macro (unbraced) instead of the literal
%     string "dec", so styles can localise or abbreviate it.
%   - The keyword list had Python-style single quotes around each item; they
%     are removed and the field is renamed to the standard "keywords".
%   - The export carried institution = "No Organization", a placeholder that
%     names no real body; it is dropped so it cannot be printed.
%     NOTE(review): restore it if a downstream tool relies on that field.
@dataset{Augustine_N_Mavor-Parker_and_Kimberly_A_Young_and_Caswell_Barry_and_Lewis_D_Griffin_2024,
  author    = {Mavor-Parker, Augustine N. and Young, Kimberly A. and Barry, Caswell and Griffin, Lewis D.},
  title     = {Noisy {MNIST}},
  year      = {2024},
  month     = dec,
  publisher = {TIB},
  doi       = {10.57702/kvnobzaf},
  url       = {https://service.tib.eu/ldmservice/dataset/noisy-mnist},
  keywords  = {MNIST, Noisy MNIST, Reinforcement Learning},
  abstract  = {The MNIST environment does not elicit any actions from an agent. Instead, the prediction network simply needs to learn one step mappings between pairs of MNIST handwritten digits.},
}