Dataset Groups Activity Stream Random Walk dataset
The dataset used in the paper is a collection of states sampled from a Markov Decision Process (MDP) using the random walk exploration method.
BibTeX:

@comment{
  Citation record for the Random Walk dataset as exported by the TIB data
  service. The citation key is kept exactly as exported so existing citations
  keep resolving. Cleanup applied to the export: month uses the built-in dec
  macro, the keyword list is a plain comma-separated list, authors are in
  Last, First form, and the exporter placeholder institution value
  (No Organization) was dropped because it is not a real institution.
}

@dataset{Alexis_Jacq_and_Manu_Orsini_and_Gabriel_Dulac-Arnold_and_Olivier_Pietquin_and_Matthieu_Geist_and_Olivier_Bachem_2024,
  author    = {Jacq, Alexis and Orsini, Manu and Dulac-Arnold, Gabriel and Pietquin, Olivier and Geist, Matthieu and Bachem, Olivier},
  title     = {Random Walk dataset},
  year      = {2024},
  month     = dec,
  publisher = {TIB},
  doi       = {10.57702/bpx1qazg},
  url       = {https://service.tib.eu/ldmservice/dataset/random-walk-dataset},
  keywords  = {Exploration, MDP, Random Walk, Reinforcement Learning},
  abstract  = {The dataset used in the paper is a collection of states sampled from a Markov Decision Process (MDP) using the random walk exploration method.},
}