Dataset Groups Activity Stream Ref-Youtube-VOS Ref-Youtube-VOS is an extensive referring video object segmentation dataset that comprises approximately 15,000 referring expressions associated with more than 3,900 videos. BibTex:

@comment{
  Dataset record for Ref-Youtube-VOS.
  Notes for maintainers:
  - month uses the predefined three-letter macro, unbraced, so styles can format it.
  - keywords is a plain comma-separated list without quote characters.
  - The title is brace-protected so sentence-casing styles keep its capitalisation.
  - NOTE(review): the institution value looks like an exporter placeholder;
    confirm it before relying on it, or drop it if no organization applies.
}

@dataset{Zhuoyan_Luo_and_Yicheng_Xiao_and_Yong_Liu_and_Yitong_Wang_and_Yansong_Tang_and_Xiu_Li_and_Yujiu_Yang_2024,
  author      = {Luo, Zhuoyan and Xiao, Yicheng and Liu, Yong and Wang, Yitong and Tang, Yansong and Li, Xiu and Yang, Yujiu},
  title       = {{Ref-Youtube-VOS}},
  year        = {2024},
  month       = dec,
  publisher   = {TIB},
  institution = {No Organization},
  doi         = {10.57702/pomnivcs},
  url         = {https://service.tib.eu/ldmservice/dataset/ref-youtube-vos},
  keywords    = {Language Understanding, RVOS, Referring Video Object Segmentation, Segmentation, Video Object Segmentation},
  abstract    = {Ref-Youtube-VOS is an extensive referring video object segmentation dataset that comprises approximately 15,000 referring expressions associated with more than 3,900 videos.},
}