Dataset Groups Activity Stream RefCOCO
The dataset used in the paper is a benchmark for referring expression grounding, containing 142,210 referring expressions for 50,000 referents in 19,994 images.
BibTex:

@comment{
  The three lines above sit outside any entry, so BibTeX ignores them.
  Record for the RefCOCO dataset (DOI 10.57702/w4gv8oxb, publisher TIB).
  - month uses the predefined, unbraced macro `dec` so styles can expand it.
  - keywords is a plain comma-separated list; case variants are kept as-is
    because keyword matching is case-sensitive.
  - The title is brace-protected so sentence-casing styles keep "RefCOCO".
  - NOTE(review): institution = "No Organization" looks like an export
    placeholder; confirm whether it can be dropped.
}

@dataset{Licheng_Yu_and_Patrick_Poirson_and_Shan_Yang_and_Alexander_C_Berg_and_Tamara_L_Berg_2024,
  author      = {Yu, Licheng and Poirson, Patrick and Yang, Shan and Berg, Alexander C. and Berg, Tamara L.},
  title       = {{RefCOCO}},
  publisher   = {TIB},
  institution = {No Organization},
  year        = {2024},
  month       = dec,
  doi         = {10.57702/w4gv8oxb},
  url         = {https://service.tib.eu/ldmservice/dataset/refcoco},
  abstract    = {The dataset used in the paper is a benchmark for referring expression grounding, containing 142,210 referring expressions for 50,000 referents in 19,994 images.},
  keywords    = {Keypoint detection, Language Understanding, Object Detection, Object detection, RefCOCO, Referring Expression Recognition, Referring Image Segmentation, Segmentation, benchmark, grounding, image annotation, image segmentation, natural language processing, object detection, refcoco, referencing, referring expressions, visual grounding},
}