f | { | f | { |
| "access_rights": "", | | "access_rights": "", |
n | "author": "Jun Yu", | n | "author": "Marc Tanti", |
| "author_email": "", | | "author_email": "", |
| "citation": [ | | "citation": [ |
n | "https://doi.org/10.18653/v1/D19-5627" | n | "https://doi.org/10.48550/arXiv.1712.02051", |
| | | "https://doi.org/10.48550/arXiv.1710.02534", |
| | | "https://doi.org/10.48550/arXiv.2304.02828", |
| | | "https://doi.org/10.48550/arXiv.2110.01705", |
| | | "https://doi.org/10.48550/arXiv.2101.09698", |
| | | "https://doi.org/10.48550/arXiv.1704.02798", |
| | | "https://doi.org/10.48550/arXiv.2210.12417", |
| | | "https://doi.org/10.48550/arXiv.1809.04144", |
| | | "https://doi.org/10.48550/arXiv.2405.16759", |
| | | "https://doi.org/10.48550/arXiv.2402.18969", |
| | | "https://doi.org/10.48550/arXiv.2402.15276", |
| | | "https://doi.org/10.48550/arXiv.2008.11073", |
| | | "https://doi.org/10.48550/arXiv.1811.04697", |
| | | "https://doi.org/10.1007/978-3-030-11018-5_11", |
| | | "https://doi.org/10.48550/arXiv.1903.02499", |
| | | "https://doi.org/10.1016/j.aiopen.2023.05.001", |
| | | "https://doi.org/10.48550/arXiv.1812.00235", |
| | | "https://doi.org/10.48550/arXiv.2404.03518", |
| | | "https://doi.org/10.48550/arXiv.2010.04963", |
| | | "https://doi.org/10.48550/arXiv.2306.07490", |
| | | "https://doi.org/10.48550/arXiv.2110.02623", |
| | | "https://doi.org/10.48550/arXiv.2006.11807", |
| | | "https://doi.org/10.48550/arXiv.2105.03889", |
| | | "https://doi.org/10.48550/arXiv.2312.08865", |
| | | "https://doi.org/10.48550/arXiv.2206.00621", |
| | | "https://doi.org/10.48550/arXiv.1908.04919", |
| | | "https://doi.org/10.48550/arXiv.2211.15398", |
| | | "https://doi.org/10.48550/arXiv.2310.19654", |
| | | "https://doi.org/10.1145/3664647.3681076" |
| ], | | ], |
| "creator_user_id": "17755db4-395a-4b3b-ac09-e8e3484ca700", | | "creator_user_id": "17755db4-395a-4b3b-ac09-e8e3484ca700", |
n | "defined_in": "https://doi.org/10.48550/arXiv.1905.07841", | n | "defined_in": "https://doi.org/10.48550/arXiv.2403.03715", |
| "doi": "10.57702/xriudzva", | | "doi": "10.57702/xriudzva", |
| "doi_date_published": "2024-11-25", | | "doi_date_published": "2024-11-25", |
| "doi_publisher": "TIB", | | "doi_publisher": "TIB", |
| "doi_status": true, | | "doi_status": true, |
| "domain": "https://service.tib.eu/ldmservice", | | "domain": "https://service.tib.eu/ldmservice", |
| "extra_authors": [ | | "extra_authors": [ |
| { | | { |
n | "extra_author": "Jing Li", | n | "extra_author": "Albert Gatt", |
| "orcid": "" | | "orcid": "" |
| }, | | }, |
| { | | { |
n | "extra_author": "Zhou Yu", | n | "extra_author": "Adrian Muscat", |
| "orcid": "" | | |
| }, | | |
| { | | |
| "extra_author": "Qingming Huang", | | |
| "orcid": "" | | "orcid": "" |
| } | | } |
| ], | | ], |
n | "groups": [], | n | "groups": [ |
| | | { |
| | | "description": "", |
| | | "display_name": "Human Attention", |
| | | "id": "03d143ba-0aca-42fc-9bee-d96f37b72948", |
| | | "image_display_url": "", |
| | | "name": "human-attention", |
| | | "title": "Human Attention" |
| | | }, |
| | | { |
| | | "description": "", |
| | | "display_name": "Human Pose Estimation", |
| | | "id": "e880ba2e-3294-47ab-85b0-f66ba44b38bc", |
| | | "image_display_url": "", |
| | | "name": "human-pose-estimation", |
| | | "title": "Human Pose Estimation" |
| | | }, |
| | | { |
| | | "description": "", |
| | | "display_name": "Image Captioning", |
| | | "id": "7a76ce67-2607-4da9-a837-d2017dc33ec6", |
| | | "image_display_url": "", |
| | | "name": "image-captioning", |
| | | "title": "Image Captioning" |
| | | }, |
| | | { |
| | | "description": "", |
| | | "display_name": "Image Description", |
| | | "id": "8d6198ce-1f41-404e-b100-82cb5c33d3d2", |
| | | "image_display_url": "", |
| | | "name": "image-description", |
| | | "title": "Image Description" |
| | | }, |
| | | { |
| | | "description": "", |
| | | "display_name": "Image Generation", |
| | | "id": "be25a76c-def1-4e73-8b1c-b81222d63867", |
| | | "image_display_url": "", |
| | | "name": "image-generation", |
| | | "title": "Image Generation" |
| | | }, |
| | | { |
| | | "description": "", |
| | | "display_name": "Image-Text Matching", |
| | | "id": "0635db3c-45c8-49b1-b083-80ec6966b144", |
| | | "image_display_url": "", |
| | | "name": "image-text-matching", |
| | | "title": "Image-Text Matching" |
| | | }, |
| | | { |
| | | "description": "", |
| | | "display_name": "Image-Text Retrieval", |
| | | "id": "28bbc5c8-e229-4df6-9cf1-d2040f80541a", |
| | | "image_display_url": "", |
| | | "name": "image-text-retrieval", |
| | | "title": "Image-Text Retrieval" |
| | | }, |
| | | { |
| | | "description": "", |
| | | "display_name": "Images", |
| | | "id": "45883730-52c6-44ac-bea8-d50c9cbc8882", |
| | | "image_display_url": "", |
| | | "name": "images", |
| | | "title": "Images" |
| | | }, |
| | | { |
| | | "description": "", |
| | | "display_name": "Instance Segmentation", |
| | | "id": "f856527a-3d35-4c73-8c09-bf3f4a3bbb9f", |
| | | "image_display_url": "", |
| | | "name": "instance-segmentation", |
| | | "title": "Instance Segmentation" |
| | | }, |
| | | { |
| | | "description": "", |
| | | "display_name": "Multimodal Learning", |
| | | "id": "a88cb918-103d-4226-a87d-9d9103c1f839", |
| | | "image_display_url": "", |
| | | "name": "multimodal-learning", |
| | | "title": "Multimodal Learning" |
| | | }, |
| | | { |
| | | "description": "", |
| | | "display_name": "Object Detection", |
| | | "id": "ca2cb1af-d31c-49b0-a1dd-62b22f2b9e20", |
| | | "image_display_url": "", |
| | | "name": "object-detection", |
| | | "title": "Object Detection" |
| | | }, |
| | | { |
| | | "description": "", |
| | | "display_name": "Paraphrase Generation", |
| | | "id": "fdd2258a-e7c3-4fe5-b9bc-5005937d6431", |
| | | "image_display_url": "", |
| | | "name": "paraphrase-generation", |
| | | "title": "Paraphrase Generation" |
| | | }, |
| | | { |
| | | "description": "", |
| | | "display_name": "Semantic Segmentation", |
| | | "id": "8c3f2eee-f5f9-464d-9c0a-1a5e7a925c0e", |
| | | "image_display_url": "", |
| | | "name": "semantic-segmentation", |
| | | "title": "Semantic Segmentation" |
| | | }, |
| | | { |
| | | "description": "", |
| | | "display_name": "Text-to-Image", |
| | | "id": "c68d7763-4eaf-4b60-a763-d8a968e4245e", |
| | | "image_display_url": "", |
| | | "name": "text-to-image", |
| | | "title": "Text-to-Image" |
| | | }, |
| | | { |
| | | "description": "", |
| | | "display_name": "Vision-and-Language Models", |
| | | "id": "8859491a-95fd-495f-9e99-91165571544a", |
| | | "image_display_url": "", |
| | | "name": "vision-and-language-models", |
| | | "title": "Vision-and-Language Models" |
| | | }, |
| | | { |
| | | "description": "", |
| | | "display_name": "Visual Question Answering", |
| | | "id": "e15f82e8-481e-43a8-8a39-d6e0751ace6c", |
| | | "image_display_url": "", |
| | | "name": "visual-question-answering", |
| | | "title": "Visual Question Answering" |
| | | } |
| | | ], |
| "id": "b55ff6e8-0c5e-49c7-9281-f8b174aa09f3", | | "id": "b55ff6e8-0c5e-49c7-9281-f8b174aa09f3", |
| "isopen": false, | | "isopen": false, |
n | "landing_page": "https://cocodataset.org/", | n | "landing_page": "https://mscoco.org/", |
| "license_title": null, | | "license_title": null, |
| "link_orkg": "", | | "link_orkg": "", |
| "metadata_created": "2024-11-25T14:18:37.775582", | | "metadata_created": "2024-11-25T14:18:37.775582", |
n | "metadata_modified": "2024-11-25T14:31:47.455333", | n | "metadata_modified": "2024-12-02T17:38:59.395188", |
| "name": "mscoco", | | "name": "mscoco", |
n | "notes": "MSCOCO is a benchmark dataset for various computer vision | n | "notes": "Human Pose Estimation (HPE) aims to estimate the position |
| tasks, including object detection, instance segmentation, and image | | of each joint point of the human body in a given image. HPE tasks |
| captioning. It contains 83k training images, 40k validation images, | | support a wide range of downstream tasks such as activity recognition, |
| and 81k test images, each associated with five captions.", | | motion capture, etc. Recently with the ViT model being proven |
| | | effective on many visual tasks, many transformer-based methods have |
| | | achieved excellent performance on HPE tasks.", |
| "num_resources": 1, | | "num_resources": 0, |
| "num_tags": 0, | | "num_tags": 49, |
| "organization": { | | "organization": { |
| "approval_status": "approved", | | "approval_status": "approved", |
| "created": "2024-11-25T12:11:38.292601", | | "created": "2024-11-25T12:11:38.292601", |
| "description": "", | | "description": "", |
| "id": "079d46db-32df-4b48-91f3-0a8bc8f69559", | | "id": "079d46db-32df-4b48-91f3-0a8bc8f69559", |
| "image_url": "", | | "image_url": "", |
| "is_organization": true, | | "is_organization": true, |
| "name": "no-organization", | | "name": "no-organization", |
| "state": "active", | | "state": "active", |
| "title": "No Organization", | | "title": "No Organization", |
| "type": "organization" | | "type": "organization" |
| }, | | }, |
| "owner_org": "079d46db-32df-4b48-91f3-0a8bc8f69559", | | "owner_org": "079d46db-32df-4b48-91f3-0a8bc8f69559", |
| "private": false, | | "private": false, |
| "relationships_as_object": [], | | "relationships_as_object": [], |
| "relationships_as_subject": [], | | "relationships_as_subject": [], |
n | "resources": [ | n | "resources": [], |
| { | | "services_used_list": "", |
| "cache_last_updated": null, | | |
| "cache_url": null, | | |
| "created": "2024-11-25T15:30:26", | | |
| "data": [ | | |
| "dcterms:title", | | |
| "dcterms:accessRights", | | |
| "dcterms:creator", | | |
| "dcterms:description", | | |
| "dcterms:issued", | | |
| "dcterms:language", | | |
| "dcterms:identifier", | | |
| "dcat:theme", | | |
| "dcterms:type", | | |
| "dcat:keyword", | | |
| "dcat:landingPage", | | |
| "dcterms:hasVersion", | | |
| "dcterms:format", | | |
| "mls:task", | | |
| "datacite:isDescribedBy" | | |
| ], | | |
| "description": "The json representation of the dataset with its | | |
| distributions based on DCAT.", | | |
| "format": "JSON", | | |
| "hash": "", | | |
| "id": "df12f624-61cf-441a-af25-2d04f3fec39a", | | |
| "last_modified": "2024-11-25T14:31:47.447621", | | |
| "metadata_modified": "2024-11-25T14:31:47.458648", | | |
| "mimetype": "application/json", | | |
| "mimetype_inner": null, | | |
| "name": "Original Metadata", | | |
| "package_id": "b55ff6e8-0c5e-49c7-9281-f8b174aa09f3", | | |
| "position": 0, | | |
| "resource_type": null, | | |
| "size": 1076, | | |
| "state": "active", | | "state": "active", |
| "url": | | "tags": [ |
| resource/df12f624-61cf-441a-af25-2d04f3fec39a/download/metadata.json", | | { |
| "url_type": "upload" | | "display_name": "Captioning", |
| | | "id": "99ec7549-b23a-432e-88f4-803dd8685b2c", |
| | | "name": "Captioning", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "Image Captioning", |
| | | "id": "c708cba4-0a1f-45c9-826f-898857783343", |
| | | "name": "Image Captioning", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "Image Description", |
| | | "id": "d3ef3b7e-c8b4-4a5e-be62-11eed53a5567", |
| | | "name": "Image Description", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "Image Retrieval", |
| | | "id": "4b81e5bb-1f8f-415b-a688-0e2d94b6d499", |
| | | "name": "Image Retrieval", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "Image-Text Matching", |
| | | "id": "84540152-adb0-4565-a5c1-cf49882b8caa", |
| | | "name": "Image-Text Matching", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "Images", |
| | | "id": "b653d5cb-88da-4373-ae34-3b0b41d37fad", |
| | | "name": "Images", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "Instance Segmentation", |
| | | "id": "b58d8dfe-1216-401d-8a2a-ceb09e07a013", |
| | | "name": "Instance Segmentation", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "Japanese", |
| | | "id": "e7a703ef-c107-49e5-b9c8-5b9a109cf39b", |
| | | "name": "Japanese", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "MSCOCO", |
| | | "id": "1405508e-1059-4b81-93e7-bdb979347d50", |
| | | "name": "MSCOCO", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "Multimodal Learning", |
| | | "id": "41329983-d90e-4560-a97d-7fa2ba0a1f92", |
| | | "name": "Multimodal Learning", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "Object Detection", |
| | | "id": "44adc011-570b-46cf-9a65-ab72ca690477", |
| | | "name": "Object Detection", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "Semantic Segmentation", |
| | | "id": "809ad6af-28cd-43bd-974d-055a5c0f2973", |
| | | "name": "Semantic Segmentation", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "Visual Question Answering", |
| | | "id": "d8aee55f-7e04-411f-8ce5-0794bc0406b0", |
| | | "name": "Visual Question Answering", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "Weakly Supervised Learning", |
| | | "id": "3bf0db7d-8b83-4928-bc08-62c0e97f7dfd", |
| | | "name": "Weakly Supervised Learning", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "computer vision", |
| | | "id": "f650b4e3-9955-49b0-ba7b-2d302a990978", |
| | | "name": "computer vision", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "dataset", |
| | | "id": "ce5ad030-ca3d-47e6-abd1-5c92a2806f1b", |
| | | "name": "dataset", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "diffusion models", |
| | | "id": "67686580-d41a-4e00-875a-494e99951342", |
| | | "name": "diffusion models", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "gender", |
| | | "id": "af90adbe-d62d-4309-ba7b-132696a7db64", |
| | | "name": "gender", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "human attention", |
| | | "id": "a4f7720f-dbdc-4830-a369-dacf1fd59bc9", |
| | | "name": "human attention", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "human pose estimation", |
| | | "id": "2ba9bb7a-941e-4f02-8376-06b50691a7dd", |
| | | "name": "human pose estimation", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "image captioning", |
| | | "id": "f1bbe827-a03a-4280-b9fa-0599ccfc0541", |
| | | "name": "image captioning", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "image classification", |
| | | "id": "34936550-ce1a-41b5-8c58-23081a6c673d", |
| | | "name": "image classification", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "image dataset", |
| | | "id": "d3acafab-ad07-46a1-88d5-540c2fd41466", |
| | | "name": "image dataset", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "image description", |
| | | "id": "99e3a7d7-7ee7-4f66-adf4-28ac19f60923", |
| | | "name": "image description", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "image generation", |
| | | "id": "96df81b4-32fd-4826-a903-affb005a0a60", |
| | | "name": "image generation", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "image processing", |
| | | "id": "12b6291b-2e80-4736-935f-cc942880df77", |
| | | "name": "image processing", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "image-text matching", |
| | | "id": "75c56b7d-ab6b-4dd8-88f8-67e92928dca0", |
| | | "name": "image-text matching", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "image-text pairs", |
| | | "id": "07cb3691-65c6-4b58-b3bf-5290980a86e3", |
| | | "name": "image-text pairs", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "image-text retrieval", |
| | | "id": "2ce62fa7-a31e-4be3-9312-92be69a8726b", |
| | | "name": "image-text retrieval", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "key-point based object detection", |
| | | "id": "510e6689-8d4d-4eee-9fbb-6c0d8f8c9ae9", |
| | | "name": "key-point based object detection", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "large-scale dataset", |
| | | "id": "a9c694bf-f591-4625-a20e-d53d3f90d489", |
| | | "name": "large-scale dataset", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "natural descriptions", |
| | | "id": "cc6fad82-69e6-4d60-bf91-fcb10fc975e1", |
| | | "name": "natural descriptions", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "natural language processing", |
| | | "id": "8af9c93a-1d87-41e0-83d9-f5d01a2bbd0c", |
| | | "name": "natural language processing", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "neural networks", |
| | | "id": "8ef5d32b-4073-4531-87bc-4b4676fd22b8", |
| | | "name": "neural networks", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "non-autoregressive", |
| | | "id": "a65d259a-0ed2-4b9f-b3cd-fc666dd6c6a5", |
| | | "name": "non-autoregressive", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "object detection", |
| | | "id": "607283c7-9e12-4167-9101-7f8078fb6537", |
| | | "name": "object detection", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "paraphrase generation", |
| | | "id": "32754920-b11e-4892-b082-84ade55232ba", |
| | | "name": "paraphrase generation", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "sequence generation", |
| | | "id": "92c922a0-5cdc-48db-be04-ea01a0fba058", |
| | | "name": "sequence generation", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "single-shot detectors", |
| | | "id": "714b183c-81a8-4198-bbd1-46ed5cda6f29", |
| | | "name": "single-shot detectors", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "skin-tone", |
| | | "id": "6687fb65-1ff2-43c4-944f-ea24297837f4", |
| | | "name": "skin-tone", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "synthetic pairs", |
| | | "id": "1aa7c615-584c-4798-8b2f-00cdfe43ae84", |
| | | "name": "synthetic pairs", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "text-only", |
| | | "id": "ef11147f-7893-48cd-adf6-414d9f971718", |
| | | "name": "text-only", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "text-to-image", |
| | | "id": "0b0e2f9a-321b-4b04-abc6-14130f66400c", |
| | | "name": "text-to-image", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "vision-and-language models", |
| | | "id": "7645deef-42d9-4294-a894-9829f9c04122", |
| | | "name": "vision-and-language models", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "vision-language pre-training", |
| | | "id": "fd01e9f9-7fca-46ce-83d8-ff81c76d8e7a", |
| | | "name": "vision-language pre-training", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "visual language grounding", |
| | | "id": "d2b22694-0a09-4953-9275-2ed27bfbab03", |
| | | "name": "visual language grounding", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "visual question answering", |
| | | "id": "8be24887-e029-464f-b56c-1d0a460e2005", |
| | | "name": "visual question answering", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "visual relationship detection", |
| | | "id": "e1f83c99-b862-498b-b955-ee73b1648e6f", |
| | | "name": "visual relationship detection", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "visual-textual embedding", |
| | | "id": "6ee32e99-b284-45d5-aeaf-59560d8ef3bb", |
| | | "name": "visual-textual embedding", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| } | | } |
| ], | | ], |
t | "services_used_list": "", | t | |
| "state": "active", | | |
| "tags": [], | | |
| "title": "MSCOCO", | | "title": "MSCOCO", |
| "type": "dataset", | | "type": "dataset", |
| "version": "" | | "version": "" |
| } | | } |