Dataset Groups Activity Stream

Grid World

The dataset used in the paper is a reinforcement learning dataset, specifically a Markov Decision Process (MDP) with a finite set of states and actions.

NOTE(review): the institution value in the entry below looks like an exporter placeholder rather than a real affiliation; confirm before relying on it.

BibTeX:

@dataset{Andrew_Cohen_and_Lei_Yu_and_Robert_Wright_2025,
  author      = {Cohen, Andrew and Yu, Lei and Wright, Robert},
  title       = {Grid World},
  publisher   = {TIB},
  institution = {No Organization},
  year        = {2025},
  month       = jan,
  doi         = {10.57702/smu7zene},
  url         = {https://service.tib.eu/ldmservice/dataset/grid-world},
  keywords    = {Grid World, Markov Decision Process, Reinforcement Learning, grid world, reinforcement learning, uncertainty},
  abstract    = {The dataset used in the paper is a reinforcement learning dataset, specifically a Markov Decision Process (MDP) with a finite set of states and actions.},
}