Dataset Groups Activity Stream Cross-modal and hierarchical modeling of video and text Cross-modal and hierarchical modeling of video and text. BibTex:

@comment{Dataset record with publisher TIB; the doi and url fields below identify the record. The line above is page text carried over with the export and is ignored by BibTeX because it lies outside any entry.}

@dataset{Hang_Hua_and_Xingjian_Li_and_Dejing_Dou_and_Cheng-Zhong_Xu_and_Jiebo_Luo_2024,
  author      = {Hua, Hang and Li, Xingjian and Dou, Dejing and Xu, Cheng-Zhong and Luo, Jiebo},
  title       = {Cross-modal and hierarchical modeling of video and text},
  abstract    = {Cross-modal and hierarchical modeling of video and text.},
  keywords    = {cross-modal summarization, hierarchical modeling},
  institution = {No Organization},
  publisher   = {TIB},
  year        = {2024},
  month       = dec,
  doi         = {10.57702/9eiz0fzs},
  url         = {https://service.tib.eu/ldmservice/dataset/cross-modal-and-hierarchical-modeling-of-video-and-text},
}