Dataset Groups Activity Stream Reinforcement Re-ranking with 2D Grid-based Recommendation Panels A novel Markov decision process (MDP)-based re-ranking model for final-stage recommendation, called Panel-MDP. BibTex: @dataset{Xiao_Zhang_and_Xu_Chen_and_Sirui_Chen_and_Zhiyu_Li_and_Yuan_Wang_and_Quan_Lin_and_Jun_Xu_2024, abstract = {A novel Markov decision process (MDP)-based re-ranking model for final-stage recommendation, called Panel-MDP.}, author = {Xiao Zhang and Xu Chen and Sirui Chen and Zhiyu Li and Yuan Wang and Quan Lin and Jun Xu}, doi = {10.57702/4j50d4qz}, institution = {No Organization}, keyword = {'2D Grid-based Recommendation Panels', 'Recommendation Systems', 'Reinforcement Learning'}, month = {dec}, publisher = {TIB}, title = {Reinforcement Re-ranking with 2D Grid-based Recommendation Panels}, url = {https://service.tib.eu/ldmservice/dataset/reinforcement-re-ranking-with-2d-grid-based-recommendation-panels}, year = {2024} }