@comment{
  Dataset Groups Activity Stream
  Multi-clue-TSE-data
  A multi-modal target sound extraction dataset based on public corpora, Audioset and AudioCaps.
  BibTeX:
}

@dataset{Chenda_Li_and_Yao_Qian_and_Zhuo_Chen_and_Dongmei_Wang_and_Takuya_Yoshioka_and_Shujie_Liu_and_Yanmin_Qian_and_Michael_Zeng_2025,
  author      = {Li, Chenda and Qian, Yao and Chen, Zhuo and Wang, Dongmei and Yoshioka, Takuya and Liu, Shujie and Qian, Yanmin and Zeng, Michael},
  title       = {Multi-clue-{TSE}-data},
  year        = {2025},
  month       = jan,
  publisher   = {TIB},
  institution = {No Organization},
  doi         = {10.57702/1o7aiato},
  url         = {https://service.tib.eu/ldmservice/dataset/multi-clue-tse-data},
  keywords    = {audio processing, machine learning, multi-modal, target sound extraction},
  abstract    = {A multi-modal target sound extraction dataset based on public corpora, Audioset and AudioCaps.},
}