% Dataset Groups Activity Stream
%
% Chain MDP
% The dataset used in the Generative Adversarial Exploration for Reinforcement Learning paper.
%
% BibTeX:
%
% The lines above are page text kept outside the entry, where BibTeX ignores them.
% The citation key is left unchanged so existing citations keep resolving.
% NOTE(review): institution = {No Organization} looks like an export placeholder;
% confirm whether it should be dropped or replaced with the real institution.

@dataset{Weijun_Hong_and_Weinan_Zhang_and_Menghui_Zhu_and_Ming_Zhou_and_Peng_Sun_and_Minghuan_Liu_and_Yong_Yu_2024,
  author      = {Hong, Weijun and Zhang, Weinan and Zhu, Menghui and Zhou, Ming and Sun, Peng and Liu, Minghuan and Yu, Yong},
  title       = {Chain {MDP}},
  publisher   = {TIB},
  institution = {No Organization},
  year        = {2024},
  month       = dec,
  doi         = {10.57702/p0xy3z4u},
  url         = {https://service.tib.eu/ldmservice/dataset/chain-mdp},
  keywords    = {Exploration, Markov Decision Process, Reinforcement Learning},
  abstract    = {The dataset used in the Generative Adversarial Exploration for Reinforcement Learning paper.}
}