Dataset Groups Activity Stream

Gridworld Dataset

The dataset used for the Gridworld tasks, consisting of 10K episodes of the agent following a uniform random policy.

BibTeX:

@dataset{James_McCarthy_and_Rahul_Nair_and_Elizabeth_Daly_and_Radu_Marinescu_and_Ivana_Dusparic_2024,
  author    = {McCarthy, James and Nair, Rahul and Daly, Elizabeth and Marinescu, Radu and Dusparic, Ivana},
  title     = {Gridworld Dataset},
  publisher = {TIB},
  year      = {2024},
  month     = dec,
  doi       = {10.57702/8t5d6vj4},
  url       = {https://service.tib.eu/ldmservice/dataset/gridworld-dataset},
  abstract  = {The dataset used for the Gridworld tasks, consisting of 10K episodes of the agent following a uniform random policy.},
  keywords  = {DQN policy, Discrete Actions, Gridworld, Reinforcement Learning, gridworld, state-action pairs},
}