% Interactive Scoring IRL -- dataset record published by TIB.
% The dataset used in the paper is a set of trajectories and scores provided by
% human teachers to train a behavioral policy in a sparse reward environment.
%
% Notes on this entry:
%   - The citation key is kept exactly as exported so existing citations resolve.
%   - The exported placeholder institution "No Organization" is omitted because
%     it carries no bibliographic information.
%   - The month uses the predefined macro (bare, unbraced) so styles can
%     localise it.
%
% BibTeX:
@dataset{Shukai_Liu_and_Chenming_Wu_and_Ying_Li_and_Liangjun_Zhang_2024,
  author    = {Liu, Shukai and Wu, Chenming and Li, Ying and Zhang, Liangjun},
  title     = {Interactive Scoring {IRL}},
  year      = {2024},
  month     = dec,
  publisher = {TIB},
  doi       = {10.57702/c3yk3v1d},
  url       = {https://service.tib.eu/ldmservice/dataset/interactive-scoring-irl},
  keywords  = {Policy Learning, Reward Function, Scores, Trajectories},
  abstract  = {The dataset used in the paper is a set of trajectories and scores provided by human teachers to train a behavioral policy in a sparse reward environment.},
}