% Dataset Groups Activity Stream
% SMM dataset
% The dataset used in the paper is a collection of states sampled from a
% Markov Decision Process (MDP) using the SMM exploration method.
%
% BibTeX record for the dataset (biblatex "dataset" entry type).
% The citation key is kept exactly as exported so existing citations resolve.
% NOTE(review): the institution value "No Organization" looks like an export
% placeholder rather than a real affiliation; kept as-is, confirm before use.
@dataset{Alexis_Jacq_and_Manu_Orsini_and_Gabriel_Dulac-Arnold_and_Olivier_Pietquin_and_Matthieu_Geist_and_Olivier_Bachem_2024,
  author      = {Jacq, Alexis and Orsini, Manu and Dulac-Arnold, Gabriel and Pietquin, Olivier and Geist, Matthieu and Bachem, Olivier},
  title       = {{SMM} Dataset},
  year        = {2024},
  month       = dec,
  publisher   = {TIB},
  institution = {No Organization},
  doi         = {10.57702/o25vxt9l},
  url         = {https://service.tib.eu/ldmservice/dataset/smm-dataset},
  keywords    = {Exploration, MDP, Reinforcement Learning, SMM},
  abstract    = {The dataset used in the paper is a collection of states sampled from a Markov Decision Process (MDP) using the SMM exploration method.},
}