Dataset Groups Activity Stream ReferIt Referring image segmentation aims at localizing all pixels of the visual objects described by a natural language sentence. BibTeX:

@dataset{Zicheng_Zhang_and_Yi_Zhu_and_Jianzhuang_Liu_and_Xiaodan_Liang_and_Wei_Ke_2024,
  author    = {Zhang, Zicheng and Zhu, Yi and Liu, Jianzhuang and Liang, Xiaodan and Ke, Wei},
  title     = {{ReferIt}},
  year      = {2024},
  month     = dec,
  publisher = {TIB},
  doi       = {10.57702/14u0zl22},
  url       = {https://service.tib.eu/ldmservice/dataset/referit},
  keywords  = {Object Detection, Referring Image Segmentation, image captioning, referencing, visual grounding},
  abstract  = {Referring image segmentation aims at localizing all pixels of the visual objects described by a natural language sentence.},
}