Dataset Groups Activity Stream
Audio Visual Scene-aware Dialog dataset
The Audio Visual Scene-aware Dialog (AVSD) dataset requires systems to generate answers about events observed in a video through previous dialogs.
BibTeX:

@dataset{C_Hori_and_H_Alamri_and_J_Wang_and_G_Wichern_and_T_Hori_and_A_Cherian_and_TK_Marks_and_V_Cartillier_and_RG_Lopes_and_A_Das_2024,
  author      = {Hori, C. and Alamri, H. and Wang, J. and Wichern, G. and Hori, T. and Cherian, A. and Marks, T. K. and Cartillier, V. and Lopes, R. G. and Das, A.},
  title       = {{Audio Visual Scene-aware Dialog} dataset},
  abstract    = {The Audio Visual Scene-aware Dialog (AVSD) dataset requires systems to generate answers about events observed in a video through previous dialogs.},
  publisher   = {TIB},
  institution = {No Organization},
  year        = {2024},
  month       = nov,
  doi         = {10.57702/b2ugxqvi},
  url         = {https://service.tib.eu/ldmservice/dataset/audio-visual-scene-aware-dialog-dataset},
}