Dataset Groups Activity Stream RWAVS Real-world Audio-Visual Scene (RWAVS) dataset offers realistic multi-modal training samples constituting camera poses, high-quality binaural audios, and images. BibTex:

@comment{Citation record for the RWAVS dataset. The page text before this comment lies outside any entry, so BibTeX ignores it. The placeholder value No Organization from the original institution field is intentionally omitted so that it cannot be printed as a real institution. The citation key is kept unchanged so existing citations continue to resolve.}

@dataset{Swapnil_Bhosale_and_Haosen_Yang_and_Diptesh_Kanojia_and_Jiankang_Deng_and_Xiatian_Zhu_2024,
  author    = {Bhosale, Swapnil and Yang, Haosen and Kanojia, Diptesh and Deng, Jiankang and Zhu, Xiatian},
  title     = {{RWAVS}},
  abstract  = {Real-world Audio-Visual Scene (RWAVS) dataset offers realistic multi-modal training samples constituting camera poses, high-quality binaural audios, and images.},
  keywords  = {Audio-Visual Scene Synthesis, Binaural Audio Synthesis, Real-World Dataset},
  publisher = {TIB},
  month     = dec,
  year      = {2024},
  doi       = {10.57702/jlung6ee},
  url       = {https://service.tib.eu/ldmservice/dataset/rwavs},
}