Dataset Groups Activity Stream Vggsound: A large-scale audio-visual dataset A large-scale audio-visual dataset containing audio-visual pairs. BibTex:

% Citation record for the "Vggsound" audio-visual dataset as published by TIB
% (see the doi and url fields below). Text outside the entry, including the
% scraped page header above, is ignored by BibTeX and Biber.
%
% The citation key is kept exactly as exported so existing \cite commands
% continue to resolve.
%
% The exporter's placeholder institution ("No Organization") is intentionally
% omitted: it carries no information and would print under styles that
% render that field.
%
% NOTE(review): the author surname "Nagraani" (also embedded in the key) may
% be a misspelling of "Nagrani". The spelling is kept as exported; confirm
% against the DOI record before changing it.
@dataset{Honglie_Chen_and_Weidi_Xie_and_Triantafyllos_Afouras_and_Arsha_Nagraani_and_Andrea_Vedaldi_and_Andrew_Zisserman_2024,
  author    = {Chen, Honglie and Xie, Weidi and Afouras, Triantafyllos and Nagraani, Arsha and Vedaldi, Andrea and Zisserman, Andrew},
  title     = {Vggsound: A large-scale audio-visual dataset},
  abstract  = {A large-scale audio-visual dataset containing audio-visual pairs.},
  keywords  = {audio-visual, dataset, large-scale},
  publisher = {TIB},
  year      = {2024},
  month     = dec,
  doi       = {10.57702/cudxhw85},
  url       = {https://service.tib.eu/ldmservice/dataset/vggsound--a-large-scale-audio-visual-dataset},
}