f | { | f | { |
| "access_rights": "", | | "access_rights": "", |
n | "author": "Jiafeng Mao", | n | "author": "Kun. Zhang", |
| "author_email": "", | | "author_email": "", |
| "citation": [ | | "citation": [ |
n | "https://doi.org/10.48550/arXiv.2304.13427", | n | "https://doi.org/10.48550/arXiv.2403.14944", |
| "https://doi.org/10.48550/arXiv.2205.09613", | | |
| "https://doi.org/10.48550/arXiv.2212.07629", | | "https://doi.org/10.1609/aaai.v38i5.28227", |
| "https://doi.org/10.48550/arXiv.2208.00817", | | |
| "https://doi.org/10.48550/arXiv.2111.02042", | | |
| "https://doi.org/10.48550/arXiv.2110.09779", | | |
| "https://doi.org/10.48550/arXiv.2406.05120", | | "https://doi.org/10.48550/arXiv.2406.11100", |
| "https://doi.org/10.48550/arXiv.1805.11850", | | "https://doi.org/10.1109/TIP.2021.3088605", |
| "https://doi.org/10.1561/116.00000057", | | |
| "https://doi.org/10.48550/arXiv.1505.01173", | | |
| "https://doi.org/10.48550/arXiv.2002.01205", | | "https://doi.org/10.48550/arXiv.2002.08510", |
| "https://doi.org/10.48550/arXiv.2201.09774", | | |
| "https://doi.org/10.1016/j.neucom.2024.127376", | | |
| "https://doi.org/10.48550/arXiv.2003.07516", | | |
| "https://doi.org/10.1016/j.patcog.2022.109018", | | |
| "https://doi.org/10.48550/arXiv.2208.09374", | | |
| "https://doi.org/10.48550/arXiv.2311.08223", | | |
| "https://doi.org/10.48550/arXiv.2304.04978", | | |
| "https://doi.org/10.48550/arXiv.1904.07642", | | "https://doi.org/10.48550/arXiv.1909.02622", |
| "https://doi.org/10.48550/arXiv.2004.04320", | | "https://doi.org/10.48550/arXiv.2212.10431", |
| "https://doi.org/10.48550/arXiv.2205.00363", | | |
| "https://doi.org/10.48550/arXiv.2311.14435", | | |
| "https://doi.org/10.48550/arXiv.1807.03470", | | "https://doi.org/10.48550/arXiv.1808.04537", |
| | | "https://doi.org/10.48550/arXiv.2307.15710", |
| | | "https://doi.org/10.48550/arXiv.1908.03675", |
| | | "https://doi.org/10.48550/arXiv.1612.03557", |
| | | "https://doi.org/10.48550/arXiv.1810.04101", |
| | | "https://doi.org/10.48550/arXiv.2303.12419", |
| | | "https://doi.org/10.48550/arXiv.2306.16805", |
| | | "https://doi.org/10.48550/arXiv.1802.09129", |
| | | "https://doi.org/10.48550/arXiv.2202.05451", |
| | | "https://doi.org/10.48550/arXiv.2305.04170", |
| | | "https://doi.org/10.48550/arXiv.2010.11686", |
| | | "https://doi.org/10.48550/arXiv.2407.12291", |
| "https://doi.org/10.48550/arXiv.2312.01987", | | "https://doi.org/10.48550/arXiv.2312.03517", |
| | | "https://doi.org/10.48550/arXiv.2305.11213", |
| | | "https://doi.org/10.48550/arXiv.2208.04060", |
| "https://doi.org/10.48550/arXiv.1901.00148", | | "https://doi.org/10.48550/arXiv.1711.08174", |
| | | "https://doi.org/10.48550/arXiv.2108.02456", |
| "https://doi.org/10.48550/arXiv.2307.08198", | | "https://doi.org/10.48550/arXiv.2305.01586", |
| "https://doi.org/10.48550/arXiv.1807.09434", | | "https://doi.org/10.48550/arXiv.2208.06140", |
| "https://doi.org/10.48550/arXiv.2209.12599", | | "https://doi.org/10.48550/arXiv.2009.14119", |
| "https://doi.org/10.48550/arXiv.1805.07009", | | |
| "https://doi.org/10.48550/arXiv.2101.00989", | | "https://doi.org/10.48550/arXiv.2011.00869", |
| "https://doi.org/10.48550/arXiv.2407.18559", | | "https://doi.org/10.48550/arXiv.2203.15859", |
| | | "https://doi.org/10.48550/arXiv.2106.06509", |
| | | "https://doi.org/10.1007/978-3-030-69535-4_7", |
| | | "https://doi.org/10.48550/arXiv.2306.04744", |
| | | "https://doi.org/10.48550/arXiv.2405.11574", |
| "https://doi.org/10.48550/arXiv.2302.03668" | | "https://doi.org/10.48550/arXiv.2303.08360", |
| | | "https://doi.org/10.1109/TPAMI.2021.3121705", |
| | | "https://doi.org/10.48550/arXiv.2204.08945", |
| | | "https://doi.org/10.48550/arXiv.2301.10051" |
| ], | | ], |
| "creator_user_id": "17755db4-395a-4b3b-ac09-e8e3484ca700", | | "creator_user_id": "17755db4-395a-4b3b-ac09-e8e3484ca700", |
n | "defined_in": "https://doi.org/10.48550/arXiv.2402.09315", | n | "defined_in": "https://doi.org/10.48550/arXiv.1812.02378", |
| "doi": "10.57702/d0h8si72", | | "doi": "10.57702/d0h8si72", |
| "doi_date_published": "2024-11-25", | | "doi_date_published": "2024-11-25", |
| "doi_publisher": "TIB", | | "doi_publisher": "TIB", |
| "doi_status": true, | | "doi_status": true, |
| "domain": "https://service.tib.eu/ldmservice", | | "domain": "https://service.tib.eu/ldmservice", |
| "extra_authors": [ | | "extra_authors": [ |
| { | | { |
n | | n | "extra_author": "Peng He", |
| | | "orcid": "" |
| | | }, |
| | | { |
| "extra_author": "Xueting Wang", | | "extra_author": "Ping Yao", |
| | | "orcid": "" |
| | | }, |
| | | { |
| | | "extra_author": "Ge Chen", |
| | | "orcid": "" |
| | | }, |
| | | { |
| | | "extra_author": "Rui Wu", |
| | | "orcid": "" |
| | | }, |
| | | { |
| | | "extra_author": "Min Du", |
| | | "orcid": "" |
| | | }, |
| | | { |
| | | "extra_author": "Huimin Li", |
| | | "orcid": "" |
| | | }, |
| | | { |
| | | "extra_author": "Li Fu", |
| | | "orcid": "" |
| | | }, |
| | | { |
| | | "extra_author": "Tianyao Zheng", |
| "orcid": "" | | "orcid": "" |
| } | | } |
| ], | | ], |
| "groups": [ | | "groups": [ |
| { | | { |
| "description": "", | | "description": "", |
| "display_name": "Computer Vision", | | "display_name": "Computer Vision", |
| "id": "d09caf7c-26c7-4e4d-bb8e-49476a90ba25", | | "id": "d09caf7c-26c7-4e4d-bb8e-49476a90ba25", |
| "image_display_url": "", | | "image_display_url": "", |
| "name": "computer-vision", | | "name": "computer-vision", |
| "title": "Computer Vision" | | "title": "Computer Vision" |
| }, | | }, |
| { | | { |
| "description": "", | | "description": "", |
n | | n | "display_name": "Cross-Modal Retrieval", |
| | | "id": "b9260717-40f6-4757-aba5-2be43503938d", |
| | | "image_display_url": "", |
| | | "name": "cross-modal-retrieval", |
| | | "title": "Cross-Modal Retrieval" |
| | | }, |
| | | { |
| | | "description": "", |
| "display_name": "Human Pose Estimation", | | "display_name": "Human Pose Estimation", |
| "id": "e880ba2e-3294-47ab-85b0-f66ba44b38bc", | | "id": "e880ba2e-3294-47ab-85b0-f66ba44b38bc", |
| "image_display_url": "", | | "image_display_url": "", |
| "name": "human-pose-estimation", | | "name": "human-pose-estimation", |
| "title": "Human Pose Estimation" | | "title": "Human Pose Estimation" |
| }, | | }, |
| { | | { |
| "description": "", | | "description": "", |
| "display_name": "Image Captioning", | | "display_name": "Image Captioning", |
| "id": "7a76ce67-2607-4da9-a837-d2017dc33ec6", | | "id": "7a76ce67-2607-4da9-a837-d2017dc33ec6", |
| "image_display_url": "", | | "image_display_url": "", |
| "name": "image-captioning", | | "name": "image-captioning", |
| "title": "Image Captioning" | | "title": "Image Captioning" |
| }, | | }, |
| { | | { |
| "description": "", | | "description": "", |
| "display_name": "Image Classification", | | "display_name": "Image Classification", |
| "id": "18b77292-26aa-4caf-89ed-cbd35fa60474", | | "id": "18b77292-26aa-4caf-89ed-cbd35fa60474", |
| "image_display_url": "", | | "image_display_url": "", |
| "name": "image-classification", | | "name": "image-classification", |
| "title": "Image Classification" | | "title": "Image Classification" |
| }, | | }, |
| { | | { |
| "description": "", | | "description": "", |
n | | n | "display_name": "Image Compression", |
| | | "id": "094941e1-ba8a-4742-a18e-4da139345758", |
| | | "image_display_url": "", |
| | | "name": "image-compression", |
| | | "title": "Image Compression" |
| | | }, |
| | | { |
| | | "description": "", |
| | | "display_name": "Image Dataset", |
| | | "id": "fc745cca-b21e-4ced-ba81-06a456938edf", |
| | | "image_display_url": "", |
| | | "name": "image-dataset", |
| | | "title": "Image Dataset" |
| | | }, |
| | | { |
| | | "description": "", |
| | | "display_name": "Image Generation", |
| | | "id": "be25a76c-def1-4e73-8b1c-b81222d63867", |
| | | "image_display_url": "", |
| | | "name": "image-generation", |
| | | "title": "Image Generation" |
| | | }, |
| | | { |
| | | "description": "", |
| "display_name": "Image Recognition", | | "display_name": "Image Recognition", |
| "id": "42c0f83b-b61c-4bbd-a704-133e4e4a0c15", | | "id": "42c0f83b-b61c-4bbd-a704-133e4e4a0c15", |
| "image_display_url": "", | | "image_display_url": "", |
| "name": "image-recognition", | | "name": "image-recognition", |
| "title": "Image Recognition" | | "title": "Image Recognition" |
| }, | | }, |
| { | | { |
| "description": "", | | "description": "", |
| "display_name": "Image Segmentation", | | "display_name": "Image Segmentation", |
| "id": "7c8cc5f1-a9b2-4924-82ec-9e3aa3049a04", | | "id": "7c8cc5f1-a9b2-4924-82ec-9e3aa3049a04", |
| "image_display_url": "", | | "image_display_url": "", |
| "name": "image-segmentation", | | "name": "image-segmentation", |
| "title": "Image Segmentation" | | "title": "Image Segmentation" |
| }, | | }, |
| { | | { |
| "description": "", | | "description": "", |
n | | n | "display_name": "Image Style Transfer", |
| | | "id": "c4992a33-c638-471f-8f28-f54ff55fbc32", |
| | | "image_display_url": "", |
| | | "name": "image-style-transfer", |
| | | "title": "Image Style Transfer" |
| | | }, |
| | | { |
| | | "description": "", |
| "display_name": "Image Understanding", | | "display_name": "Image-Text Matching", |
| "id": "638a25dd-1bfb-497e-89d2-287a377aa4f6", | | "id": "0635db3c-45c8-49b1-b083-80ec6966b144", |
| "image_display_url": "", | | "image_display_url": "", |
n | "name": "image-understanding", | n | "name": "image-text-matching", |
| "title": "Image Understanding" | | "title": "Image-Text Matching" |
| }, | | }, |
| { | | { |
| "description": "", | | "description": "", |
| "display_name": "Image-Text Retrieval", | | "display_name": "Image-Text Retrieval", |
| "id": "28bbc5c8-e229-4df6-9cf1-d2040f80541a", | | "id": "28bbc5c8-e229-4df6-9cf1-d2040f80541a", |
| "image_display_url": "", | | "image_display_url": "", |
| "name": "image-text-retrieval", | | "name": "image-text-retrieval", |
| "title": "Image-Text Retrieval" | | "title": "Image-Text Retrieval" |
| }, | | }, |
| { | | { |
| "description": "", | | "description": "", |
| "display_name": "Instance Segmentation", | | "display_name": "Instance Segmentation", |
| "id": "f856527a-3d35-4c73-8c09-bf3f4a3bbb9f", | | "id": "f856527a-3d35-4c73-8c09-bf3f4a3bbb9f", |
| "image_display_url": "", | | "image_display_url": "", |
| "name": "instance-segmentation", | | "name": "instance-segmentation", |
| "title": "Instance Segmentation" | | "title": "Instance Segmentation" |
| }, | | }, |
| { | | { |
| "description": "", | | "description": "", |
n | | n | "display_name": "Multi-Label Classification", |
| | | "id": "6f9e0de4-7c26-404c-af3c-2f4cca3ff39b", |
| | | "image_display_url": "", |
| | | "name": "multi-label-classification", |
| | | "title": "Multi-Label Classification" |
| | | }, |
| | | { |
| | | "description": "", |
| "display_name": "Object Detection", | | "display_name": "Object Detection", |
| "id": "ca2cb1af-d31c-49b0-a1dd-62b22f2b9e20", | | "id": "ca2cb1af-d31c-49b0-a1dd-62b22f2b9e20", |
| "image_display_url": "", | | "image_display_url": "", |
| "name": "object-detection", | | "name": "object-detection", |
| "title": "Object Detection" | | "title": "Object Detection" |
| }, | | }, |
| { | | { |
| "description": "", | | "description": "", |
n | "display_name": "Object Segmentation", | n | "display_name": "Semantic Compression", |
| "id": "da2dd0b7-d324-469d-92f8-0af74e1a1bae", | | "id": "ab70b341-9a9c-4551-bed9-db279f26181b", |
| "image_display_url": "", | | "image_display_url": "", |
n | "name": "object-segmentation", | n | "name": "semantic-compression", |
| "title": "Object Segmentation" | | "title": "Semantic Compression" |
| }, | | }, |
| { | | { |
| "description": "", | | "description": "", |
| "display_name": "Semantic Segmentation", | | "display_name": "Semantic Segmentation", |
| "id": "8c3f2eee-f5f9-464d-9c0a-1a5e7a925c0e", | | "id": "8c3f2eee-f5f9-464d-9c0a-1a5e7a925c0e", |
| "image_display_url": "", | | "image_display_url": "", |
| "name": "semantic-segmentation", | | "name": "semantic-segmentation", |
| "title": "Semantic Segmentation" | | "title": "Semantic Segmentation" |
| }, | | }, |
| { | | { |
| "description": "", | | "description": "", |
n | "display_name": "Text understanding", | n | "display_name": "Text-to-3D Generation", |
| "id": "45b4dd88-87d9-45de-bc51-fb07fe10880d", | | "id": "061d2d90-85de-40e4-88e5-b707757a8ce3", |
| "image_display_url": "", | | "image_display_url": "", |
n | "name": "text-understanding", | n | "name": "text-to-3d-generation", |
| "title": "Text understanding" | | "title": "Text-to-3D Generation" |
| }, | | }, |
| { | | { |
| "description": "", | | "description": "", |
| "display_name": "Visual Question Answering", | | "display_name": "Visual Question Answering", |
| "id": "e15f82e8-481e-43a8-8a39-d6e0751ace6c", | | "id": "e15f82e8-481e-43a8-8a39-d6e0751ace6c", |
| "image_display_url": "", | | "image_display_url": "", |
| "name": "visual-question-answering", | | "name": "visual-question-answering", |
| "title": "Visual Question Answering" | | "title": "Visual Question Answering" |
| } | | } |
| ], | | ], |
| "id": "79c51e3f-0168-45ce-a3f5-8e125e33295b", | | "id": "79c51e3f-0168-45ce-a3f5-8e125e33295b", |
| "isopen": false, | | "isopen": false, |
| "landing_page": "https://cocodataset.org/", | | "landing_page": "https://cocodataset.org/", |
| "license_title": null, | | "license_title": null, |
| "link_orkg": "", | | "link_orkg": "", |
| "metadata_created": "2024-11-25T14:44:47.163362", | | "metadata_created": "2024-11-25T14:44:47.163362", |
n | "metadata_modified": "2024-12-02T17:42:12.725790", | n | "metadata_modified": "2024-12-02T17:49:12.203135", |
| "name": "ms-coco", | | "name": "ms-coco", |
n | "notes": "MS COCO contains 80 object categories. Experimentally, a | n | "notes": "Large scale datasets [18, 17, 27, 6] boosted text |
| subset of the original large-scale is evaluated, which contain 39,107 | | conditional image generation quality. However, in some domains it |
| (40 classes) training samples, 5,895 validation samples (20 classes) | | could be difficult to make such datasets and usually it could be |
| and 9,763 testing samples (20 classes).", | | costly. Also, famous face datasets[7, 11, 13, 29] don\u2019t have |
| | | corresponding text captions, making it difficult to develop text |
| | | conditional image generation models on these datasets.", |
| "num_resources": 1, | | "num_resources": 0, |
| "num_tags": 53, | | "num_tags": 73, |
| "organization": { | | "organization": { |
| "approval_status": "approved", | | "approval_status": "approved", |
| "created": "2024-11-25T12:11:38.292601", | | "created": "2024-11-25T12:11:38.292601", |
| "description": "", | | "description": "", |
| "id": "079d46db-32df-4b48-91f3-0a8bc8f69559", | | "id": "079d46db-32df-4b48-91f3-0a8bc8f69559", |
| "image_url": "", | | "image_url": "", |
| "is_organization": true, | | "is_organization": true, |
| "name": "no-organization", | | "name": "no-organization", |
| "state": "active", | | "state": "active", |
| "title": "No Organization", | | "title": "No Organization", |
| "type": "organization" | | "type": "organization" |
| }, | | }, |
| "owner_org": "079d46db-32df-4b48-91f3-0a8bc8f69559", | | "owner_org": "079d46db-32df-4b48-91f3-0a8bc8f69559", |
| "private": false, | | "private": false, |
| "relationships_as_object": [], | | "relationships_as_object": [], |
| "relationships_as_subject": [], | | "relationships_as_subject": [], |
n | "resources": [ | n | "resources": [], |
| { | | |
| "cache_last_updated": null, | | |
| "cache_url": null, | | |
| "created": "2024-12-02T18:38:42", | | |
| "data": [ | | |
| "dcterms:title", | | |
| "dcterms:accessRights", | | |
| "dcterms:creator", | | |
| "dcterms:description", | | |
| "dcterms:issued", | | |
| "dcterms:language", | | |
| "dcterms:identifier", | | |
| "dcat:theme", | | |
| "dcterms:type", | | |
| "dcat:keyword", | | |
| "dcat:landingPage", | | |
| "dcterms:hasVersion", | | |
| "dcterms:format", | | |
| "mls:task", | | |
| "datacite:isDescribedBy" | | |
| ], | | |
| "description": "The json representation of the dataset with its | | |
| distributions based on DCAT.", | | |
| "format": "JSON", | | |
| "hash": "", | | |
| "id": "6ae4257b-d239-48d7-b954-d1c9e9bbb360", | | |
| "last_modified": "2024-12-02T17:42:12.711857", | | |
| "metadata_modified": "2024-12-02T17:42:12.728881", | | |
| "mimetype": "application/json", | | |
| "mimetype_inner": null, | | |
| "name": "Original Metadata", | | |
| "package_id": "79c51e3f-0168-45ce-a3f5-8e125e33295b", | | |
| "position": 0, | | |
| "resource_type": null, | | |
| "size": 3472, | | |
| "state": "active", | | |
| "url": | | |
| resource/6ae4257b-d239-48d7-b954-d1c9e9bbb360/download/metadata.json", | | |
| "url_type": "upload" | | |
| } | | |
| ], | | |
| "services_used_list": "", | | "services_used_list": "", |
| "state": "active", | | "state": "active", |
| "tags": [ | | "tags": [ |
| { | | { |
n | "display_name": "80 Classes", | n | |
| "id": "ae0598d9-c996-424a-8fef-40ac603d82aa", | | |
| "name": "80 Classes", | | |
| "state": "active", | | |
| "vocabulary_id": null | | |
| }, | | |
| { | | |
| "display_name": "COCO", | | "display_name": "COCO", |
| "id": "892a6596-c332-4778-b0bb-a1d1046c3cb8", | | "id": "892a6596-c332-4778-b0bb-a1d1046c3cb8", |
| "name": "COCO", | | "name": "COCO", |
| "state": "active", | | "state": "active", |
| "vocabulary_id": null | | "vocabulary_id": null |
| }, | | }, |
| { | | { |
n | "display_name": "COCO dataset", | n | |
| "id": "d3e1175b-c887-4a04-a77b-8ebe58dd7bd6", | | |
| "name": "COCO dataset", | | |
| "state": "active", | | |
| "vocabulary_id": null | | |
| }, | | |
| { | | |
| "display_name": "Computer Vision", | | |
| "id": "77b96eda-8a43-406f-9c54-d87b14f3f63e", | | |
| "name": "Computer Vision", | | |
| "state": "active", | | |
| "vocabulary_id": null | | |
| }, | | |
| { | | |
| "display_name": "Convolutional Neural Networks", | | "display_name": "Convolutional Neural Networks", |
| "id": "a167095b-f2a5-4c27-8f27-c413611cc4ee", | | "id": "a167095b-f2a5-4c27-8f27-c413611cc4ee", |
| "name": "Convolutional Neural Networks", | | "name": "Convolutional Neural Networks", |
| "state": "active", | | "state": "active", |
| "vocabulary_id": null | | "vocabulary_id": null |
| }, | | }, |
| { | | { |
n | "display_name": "Deep Learning", | n | |
| "id": "3feb7b21-e049-4dca-9372-0d438c483f6a", | | |
| "name": "Deep Learning", | | |
| "state": "active", | | |
| "vocabulary_id": null | | |
| }, | | |
| { | | |
| "display_name": "Depth Estimation", | | |
| "id": "559df65c-baac-4373-9e7e-6732051e61ec", | | |
| "name": "Depth Estimation", | | |
| "state": "active", | | |
| "vocabulary_id": null | | |
| }, | | |
| { | | |
| "display_name": "Detection", | | "display_name": "Dataset", |
| "id": "0a1e40c9-2571-474a-ae08-794f6233e3a4", | | "id": "81587eb2-9569-4a4b-83c8-0e2ac78e7e3b", |
| "name": "Detection", | | "name": "Dataset", |
| "state": "active", | | "state": "active", |
| "vocabulary_id": null | | "vocabulary_id": null |
| }, | | }, |
| { | | { |
n | "display_name": "Human Pose Estimation", | n | "display_name": "Image", |
| "id": "b8602e02-d7e3-4cd0-ad85-ba9ee8c2ad9d", | | "id": "ca701146-4139-43fe-a114-4f31ab3d20a1", |
| "name": "Human Pose Estimation", | | "name": "Image", |
| "state": "active", | | "state": "active", |
| "vocabulary_id": null | | "vocabulary_id": null |
| }, | | }, |
| { | | { |
| "display_name": "Image Captioning", | | "display_name": "Image Captioning", |
| "id": "c708cba4-0a1f-45c9-826f-898857783343", | | "id": "c708cba4-0a1f-45c9-826f-898857783343", |
| "name": "Image Captioning", | | "name": "Image Captioning", |
| "state": "active", | | "state": "active", |
| "vocabulary_id": null | | "vocabulary_id": null |
| }, | | }, |
| { | | { |
| "display_name": "Image Classification", | | "display_name": "Image Classification", |
| "id": "418e2ddf-a1d3-42ac-ad05-156f79ca8e22", | | "id": "418e2ddf-a1d3-42ac-ad05-156f79ca8e22", |
| "name": "Image Classification", | | "name": "Image Classification", |
| "state": "active", | | "state": "active", |
| "vocabulary_id": null | | "vocabulary_id": null |
| }, | | }, |
| { | | { |
n | | n | "display_name": "Image Compression", |
| | | "id": "9319a62c-672c-4d44-a6ef-7d18ec5ba2b7", |
| | | "name": "Image Compression", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| "display_name": "Image Matting", | | "display_name": "Image Dataset", |
| "id": "80d1252a-d83f-4e8a-a19d-3cd31ec90a9d", | | "id": "51aed645-6dd9-4e08-894a-10944ecefd8b", |
| "name": "Image Matting", | | "name": "Image Dataset", |
| "state": "active", | | "state": "active", |
| "vocabulary_id": null | | "vocabulary_id": null |
| }, | | }, |
| { | | { |
n | "display_name": "Image Processing", | n | "display_name": "Image Description", |
| "id": "38ebd60e-fd40-4275-a9d3-490f287011d6", | | "id": "d3ef3b7e-c8b4-4a5e-be62-11eed53a5567", |
| "name": "Image Processing", | | "name": "Image Description", |
| "state": "active", | | "state": "active", |
| "vocabulary_id": null | | "vocabulary_id": null |
| }, | | }, |
| { | | { |
n | "display_name": "Image Segmentation", | n | "display_name": "Image Generation", |
| "id": "f5603951-aef2-4539-8066-15e72f32271b", | | "id": "a0db1a78-8e9a-494f-8d75-462dc3a45472", |
| "name": "Image Segmentation", | | "name": "Image Generation", |
| "state": "active", | | "state": "active", |
| "vocabulary_id": null | | "vocabulary_id": null |
| }, | | }, |
| { | | { |
n | "display_name": "Image segmentation", | n | "display_name": "Image Recognition", |
| "id": "8ab34344-1929-4cd3-a55a-af732b0cf13b", | | "id": "2cc216cd-24af-483e-8e50-6fcd86cf89ac", |
| "name": "Image segmentation", | | "name": "Image Recognition", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "Image classification", |
| | | "id": "786db19f-59bd-48ee-96c8-dfff6df61746", |
| | | "name": "Image classification", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "Image recognition", |
| | | "id": "27490e3f-0c09-4b94-aa76-8c5f3ff69797", |
| | | "name": "Image recognition", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "ImageNet", |
| | | "id": "114653a3-d688-42fb-8e76-350752af988b", |
| | | "name": "ImageNet", |
| "state": "active", | | "state": "active", |
| "vocabulary_id": null | | "vocabulary_id": null |
| }, | | }, |
| { | | { |
| "display_name": "Instance Segmentation", | | "display_name": "Instance Segmentation", |
| "id": "b58d8dfe-1216-401d-8a2a-ceb09e07a013", | | "id": "b58d8dfe-1216-401d-8a2a-ceb09e07a013", |
| "name": "Instance Segmentation", | | "name": "Instance Segmentation", |
| "state": "active", | | "state": "active", |
| "vocabulary_id": null | | "vocabulary_id": null |
| }, | | }, |
| { | | { |
n | | n | "display_name": "Large-Scale Dataset", |
| | | "id": "f3f5ec8d-52e3-4bcf-84ee-2dbca89fc84a", |
| | | "name": "Large-Scale Dataset", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| "display_name": "Large Scale", | | "display_name": "Large-scale", |
| "id": "9d0a7af8-406e-4d7d-b558-ac2b45093bbf", | | "id": "9267d5a4-c0a1-4160-a509-c6db091b3758", |
| "name": "Large Scale", | | "name": "Large-scale", |
| "state": "active", | | "state": "active", |
| "vocabulary_id": null | | "vocabulary_id": null |
| }, | | }, |
| { | | { |
| "display_name": "Large-scale dataset", | | "display_name": "Large-scale dataset", |
| "id": "868f7828-1cf2-4bed-ba67-61c621bf1aa5", | | "id": "868f7828-1cf2-4bed-ba67-61c621bf1aa5", |
| "name": "Large-scale dataset", | | "name": "Large-scale dataset", |
| "state": "active", | | "state": "active", |
| "vocabulary_id": null | | "vocabulary_id": null |
| }, | | }, |
| { | | { |
n | "display_name": "MS COCO", | n | "display_name": "MS-COCO", |
| "id": "b8dcb1ca-8488-4b9b-9c1b-568b6f956b50", | | "id": "d4f2ee8f-d198-425a-aee5-b8fe8478c758", |
| "name": "MS COCO", | | "name": "MS-COCO", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "Multi-Label Classification", |
| | | "id": "65a87ec1-a7ee-4e32-bd56-df63df24a66a", |
| | | "name": "Multi-Label Classification", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "Multi-label", |
| | | "id": "314d8fc1-5e9e-4917-87fe-57fcc87231de", |
| | | "name": "Multi-label", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "Multi-label recognition", |
| | | "id": "3c14a70d-30f5-4069-a1c4-167d3cefbd9a", |
| | | "name": "Multi-label recognition", |
| "state": "active", | | "state": "active", |
| "vocabulary_id": null | | "vocabulary_id": null |
| }, | | }, |
| { | | { |
| "display_name": "Object Detection", | | "display_name": "Object Detection", |
| "id": "44adc011-570b-46cf-9a65-ab72ca690477", | | "id": "44adc011-570b-46cf-9a65-ab72ca690477", |
| "name": "Object Detection", | | "name": "Object Detection", |
| "state": "active", | | "state": "active", |
| "vocabulary_id": null | | "vocabulary_id": null |
| }, | | }, |
| { | | { |
| "display_name": "Object detection", | | "display_name": "Object detection", |
| "id": "84a57b7d-e522-4fc2-9f65-9aeb121659f1", | | "id": "84a57b7d-e522-4fc2-9f65-9aeb121659f1", |
| "name": "Object detection", | | "name": "Object detection", |
| "state": "active", | | "state": "active", |
| "vocabulary_id": null | | "vocabulary_id": null |
| }, | | }, |
| { | | { |
n | "display_name": "Panoptic Segmentation", | n | |
| "id": "62316d6b-da93-440f-b9fd-8fddeba46d6d", | | |
| "name": "Panoptic Segmentation", | | |
| "state": "active", | | |
| "vocabulary_id": null | | |
| }, | | |
| { | | |
| "display_name": "Query-based End-to-end Instance Segmentation", | | |
| "id": "db42449b-46c2-44a1-b9e3-9f2c7ce6a528", | | |
| "name": "Query-based End-to-end Instance Segmentation", | | |
| "state": "active", | | |
| "vocabulary_id": null | | |
| }, | | |
| { | | |
| "display_name": "Scene Understanding", | | |
| "id": "d066cee5-d8a2-4d28-ba93-a32fa6a30b26", | | |
| "name": "Scene Understanding", | | |
| "state": "active", | | |
| "vocabulary_id": null | | |
| }, | | |
| { | | |
| "display_name": "Segmentation", | | "display_name": "Semantic Compression", |
| "id": "afba543e-f91f-4800-834e-77535c9e8dac", | | "id": "18787ad9-9dfb-4697-b4dc-bf8870d9f5a1", |
| "name": "Segmentation", | | "name": "Semantic Compression", |
| "state": "active", | | "state": "active", |
| "vocabulary_id": null | | "vocabulary_id": null |
| }, | | }, |
| { | | { |
| "display_name": "Semantic Segmentation", | | "display_name": "Semantic Segmentation", |
| "id": "809ad6af-28cd-43bd-974d-055a5c0f2973", | | "id": "809ad6af-28cd-43bd-974d-055a5c0f2973", |
| "name": "Semantic Segmentation", | | "name": "Semantic Segmentation", |
| "state": "active", | | "state": "active", |
| "vocabulary_id": null | | "vocabulary_id": null |
| }, | | }, |
| { | | { |
n | "display_name": "Visual Object Detection", | n | |
| "id": "f903c46b-dcbe-4c0a-a0b4-048cf8dc235f", | | |
| "name": "Visual Object Detection", | | |
| "state": "active", | | |
| "vocabulary_id": null | | |
| }, | | |
| { | | |
| "display_name": "anchor-free detection", | | "display_name": "Semantic segmentation", |
| "id": "cf61c3ac-3379-4ebf-9490-dcf82e027f58", | | "id": "ca545ae5-2da2-4e71-98b7-3268890347d1", |
| "name": "anchor-free detection", | | "name": "Semantic segmentation", |
| "state": "active", | | "state": "active", |
| "vocabulary_id": null | | "vocabulary_id": null |
| }, | | }, |
| { | | { |
n | "display_name": "benchmark", | n | "display_name": "Text", |
| "id": "e3d4984e-822c-4023-a134-9cacabcfc36d", | | "id": "74f5b2bc-c290-4e26-a01d-cce9fdf6e957", |
| "name": "benchmark", | | "name": "Text", |
| "state": "active", | | "state": "active", |
| "vocabulary_id": null | | "vocabulary_id": null |
| }, | | }, |
| { | | { |
n | "display_name": "benchmark dataset", | n | "display_name": "Text-to-Image Diffusion Models", |
| "id": "8d55abf5-3c6a-42be-9dbe-7700f185ffc5", | | "id": "0bf9106e-0968-4133-a3fd-50e38577390f", |
| "name": "benchmark dataset", | | "name": "Text-to-Image Diffusion Models", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "User Attribution", |
| | | "id": "4fa164e9-c105-4fab-8c7f-bf8f8e152a7f", |
| | | "name": "User Attribution", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "Weakly-Supervised Learning", |
| | | "id": "38084c25-2469-40e2-91a1-0c4ea361e2e7", |
| | | "name": "Weakly-Supervised Learning", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "ambiguities", |
| | | "id": "4b8b52a1-0846-40dd-a940-36ff6ea61ee9", |
| | | "name": "ambiguities", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "artistic style transfer", |
| | | "id": "7d1cd76d-a8de-46c5-ad29-280a33655324", |
| | | "name": "artistic style transfer", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "bounding box", |
| | | "id": "4e5ef5e7-c2b0-4c6e-800a-acbabc002635", |
| | | "name": "bounding box", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "bounding box regression", |
| | | "id": "2e04dc67-88c2-4b46-ad6d-72b676e72ffe", |
| | | "name": "bounding box regression", |
| "state": "active", | | "state": "active", |
| "vocabulary_id": null | | "vocabulary_id": null |
| }, | | }, |
| { | | { |
| "display_name": "bounding boxes", | | "display_name": "bounding boxes", |
| "id": "54908a8b-6ff0-4302-bf30-6187778e8f6d", | | "id": "54908a8b-6ff0-4302-bf30-6187778e8f6d", |
| "name": "bounding boxes", | | "name": "bounding boxes", |
| "state": "active", | | "state": "active", |
| "vocabulary_id": null | | "vocabulary_id": null |
| }, | | }, |
| { | | { |
n | "display_name": "computer vision", | n | "display_name": "content images", |
| "id": "f650b4e3-9955-49b0-ba7b-2d302a990978", | | "id": "94315573-a2ad-4ef1-aaf5-b2dc04d1f144", |
| "name": "computer vision", | | "name": "content images", |
| "state": "active", | | "state": "active", |
| "vocabulary_id": null | | "vocabulary_id": null |
| }, | | }, |
| { | | { |
n | | n | "display_name": "cross-modal retrieval", |
| | | "id": "18e4db93-438b-4f7c-a4a6-548f772a7291", |
| | | "name": "cross-modal retrieval", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| "display_name": "dataset", | | "display_name": "diffusion models", |
| "id": "ce5ad030-ca3d-47e6-abd1-5c92a2806f1b", | | "id": "67686580-d41a-4e00-875a-494e99951342", |
| | | "name": "diffusion models", |
| "name": "dataset", | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "few-shot learning", |
| | | "id": "9ed062d2-8c21-45d4-a7ff-78bf9cf0b117", |
| | | "name": "few-shot learning", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "foreground object", |
| | | "id": "3ca13def-8d96-449e-b764-69dded7dd96c", |
| | | "name": "foreground object", |
| "state": "active", | | "state": "active", |
| "vocabulary_id": null | | "vocabulary_id": null |
| }, | | }, |
| { | | { |
| "display_name": "human pose estimation", | | "display_name": "human pose estimation", |
| "id": "2ba9bb7a-941e-4f02-8376-06b50691a7dd", | | "id": "2ba9bb7a-941e-4f02-8376-06b50691a7dd", |
| "name": "human pose estimation", | | "name": "human pose estimation", |
| "state": "active", | | "state": "active", |
| "vocabulary_id": null | | "vocabulary_id": null |
| }, | | }, |
| { | | { |
n | "display_name": "image annotation", | n | |
| "id": "6734bcb9-ad78-4289-8816-09b71832ab8e", | | |
| "name": "image annotation", | | |
| "state": "active", | | |
| "vocabulary_id": null | | |
| }, | | |
| { | | |
| "display_name": "image captioning", | | "display_name": "image captioning", |
| "id": "f1bbe827-a03a-4280-b9fa-0599ccfc0541", | | "id": "f1bbe827-a03a-4280-b9fa-0599ccfc0541", |
| "name": "image captioning", | | "name": "image captioning", |
| "state": "active", | | "state": "active", |
| "vocabulary_id": null | | "vocabulary_id": null |
| }, | | }, |
| { | | { |
| "display_name": "image classification", | | "display_name": "image classification", |
| "id": "34936550-ce1a-41b5-8c58-23081a6c673d", | | "id": "34936550-ce1a-41b5-8c58-23081a6c673d", |
| "name": "image classification", | | "name": "image classification", |
| "state": "active", | | "state": "active", |
| "vocabulary_id": null | | "vocabulary_id": null |
| }, | | }, |
| { | | { |
n | | n | "display_name": "image dataset", |
| | | "id": "d3acafab-ad07-46a1-88d5-540c2fd41466", |
| | | "name": "image dataset", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| "display_name": "image description", | | "display_name": "image generation", |
| "id": "99e3a7d7-7ee7-4f66-adf4-28ac19f60923", | | "id": "96df81b4-32fd-4826-a903-affb005a0a60", |
| "name": "image description", | | "name": "image generation", |
| "state": "active", | | "state": "active", |
| "vocabulary_id": null | | "vocabulary_id": null |
| }, | | }, |
| { | | { |
n | "display_name": "image recognition", | n | "display_name": "image retrieval", |
| "id": "5dbee310-ce23-4ee3-b86b-0ad4c203b2a6", | | "id": "93827714-41d5-4aac-a64a-f4390a0e80e1", |
| "name": "image recognition", | | "name": "image retrieval", |
| "state": "active", | | "state": "active", |
| "vocabulary_id": null | | "vocabulary_id": null |
| }, | | }, |
| { | | { |
| "display_name": "image segmentation", | | "display_name": "image segmentation", |
| "id": "7eaed78e-c73a-4929-a8c9-60265069f59a", | | "id": "7eaed78e-c73a-4929-a8c9-60265069f59a", |
| "name": "image segmentation", | | "name": "image segmentation", |
| "state": "active", | | "state": "active", |
| "vocabulary_id": null | | "vocabulary_id": null |
| }, | | }, |
| { | | { |
n | | n | "display_name": "image style transfer", |
| | | "id": "e1dd21b6-af66-4e38-b4d6-a6dbe6ed5219", |
| | | "name": "image style transfer", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| "display_name": "image understanding", | | "display_name": "image-text matching", |
| "id": "a209b790-086a-4345-b6af-b7b011b6e040", | | "id": "75c56b7d-ab6b-4dd8-88f8-67e92928dca0", |
| "name": "image understanding", | | "name": "image-text matching", |
| "state": "active", | | "state": "active", |
| "vocabulary_id": null | | "vocabulary_id": null |
| }, | | }, |
| { | | { |
n | "display_name": "image-text retrieval", | n | "display_name": "image-text pairs", |
| "id": "2ce62fa7-a31e-4be3-9312-92be69a8726b", | | "id": "07cb3691-65c6-4b58-b3bf-5290980a86e3", |
| "name": "image-text retrieval", | | "name": "image-text pairs", |
| "state": "active", | | "state": "active", |
| "vocabulary_id": null | | "vocabulary_id": null |
| }, | | }, |
| { | | { |
| "display_name": "images", | | "display_name": "images", |
| "id": "40152090-cbbf-4339-b7d3-f14b68cb7621", | | "id": "40152090-cbbf-4339-b7d3-f14b68cb7621", |
| "name": "images", | | "name": "images", |
| "state": "active", | | "state": "active", |
| "vocabulary_id": null | | "vocabulary_id": null |
| }, | | }, |
| { | | { |
| "display_name": "instance segmentation", | | "display_name": "instance segmentation", |
| "id": "e74e609d-6e81-4b83-b74e-fa3dd8f185f4", | | "id": "e74e609d-6e81-4b83-b74e-fa3dd8f185f4", |
| "name": "instance segmentation", | | "name": "instance segmentation", |
| "state": "active", | | "state": "active", |
| "vocabulary_id": null | | "vocabulary_id": null |
| }, | | }, |
| { | | { |
n | "display_name": "keypoints", | n | "display_name": "keypoint detection", |
| "id": "d8c2caaa-a318-4485-91a0-e9dc1826e52e", | | "id": "656a55a9-2bad-4a54-90fa-1b298d7fe6bf", |
| "name": "keypoints", | | "name": "keypoint detection", |
| "state": "active", | | "state": "active", |
| "vocabulary_id": null | | "vocabulary_id": null |
| }, | | }, |
| { | | { |
n | | n | "display_name": "large scale", |
| | | "id": "eb1c6e7f-f9b1-4844-a978-4a80ae7e0476", |
| | | "name": "large scale", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "large-scale benchmark", |
| | | "id": "d0b12015-10bd-4b97-9e34-1512b9f514ae", |
| | | "name": "large-scale benchmark", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| "display_name": "large dataset", | | "display_name": "large-scale dataset", |
| "id": "39deedcc-46cf-4eba-8ec8-41743e462923", | | "id": "a9c694bf-f591-4625-a20e-d53d3f90d489", |
| "name": "large dataset", | | "name": "large-scale dataset", |
| "state": "active", | | "state": "active", |
| "vocabulary_id": null | | "vocabulary_id": null |
| }, | | }, |
| { | | { |
n | | n | "display_name": "low-quality examples", |
| | | "id": "409d0d3d-2065-4842-b2d4-64930e049231", |
| | | "name": "low-quality examples", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "multi-label", |
| | | "id": "ee29530d-cfee-42e6-b05b-e9d914289227", |
| | | "name": "multi-label", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "multi-person pose estimation", |
| | | "id": "5eb1fbbf-53f3-4750-8d3c-b8d36cb6718a", |
| | | "name": "multi-person pose estimation", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| "display_name": "multiple object detection", | | "display_name": "multiple captions", |
| "id": "9d5c3f06-b2c1-462b-9abf-5c774e5ce105", | | "id": "15d57fa3-3639-4191-8495-a03fdd0c86ba", |
| "name": "multiple object detection", | | "name": "multiple captions", |
| "state": "active", | | |
| "vocabulary_id": null | | |
| }, | | |
| { | | |
| "display_name": "neural networks", | | |
| "id": "8ef5d32b-4073-4531-87bc-4b4676fd22b8", | | |
| "name": "neural networks", | | |
| "state": "active", | | "state": "active", |
| "vocabulary_id": null | | "vocabulary_id": null |
| }, | | }, |
| { | | { |
| "display_name": "object detection", | | "display_name": "object detection", |
| "id": "607283c7-9e12-4167-9101-7f8078fb6537", | | "id": "607283c7-9e12-4167-9101-7f8078fb6537", |
| "name": "object detection", | | "name": "object detection", |
| "state": "active", | | "state": "active", |
| "vocabulary_id": null | | "vocabulary_id": null |
| }, | | }, |
| { | | { |
n | "display_name": "object segmentation", | n | "display_name": "object-centric", |
| "id": "6a47ecb7-e3fb-43a9-b0a8-1434387d3ee4", | | "id": "ebb4fd2a-1234-4199-ba72-314c03346982", |
| "name": "object segmentation", | | "name": "object-centric", |
| "state": "active", | | "state": "active", |
| "vocabulary_id": null | | "vocabulary_id": null |
| }, | | }, |
| { | | { |
n | | n | "display_name": "photorealistic style transfer", |
| | | "id": "c3c24f7d-e28d-42bb-8c2a-7809bd365902", |
| | | "name": "photorealistic style transfer", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "sentence retrieval", |
| | | "id": "105d8c3e-8fb7-4da0-b82b-80a38468cdb1", |
| | | "name": "sentence retrieval", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "style images", |
| | | "id": "b3dee3dd-1cec-49a5-a593-a82047b55122", |
| | | "name": "style images", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "style transfer", |
| | | "id": "85201f92-7e39-4465-a7fa-95893969ecb2", |
| | | "name": "style transfer", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "text-to-3D", |
| | | "id": "f241a1fe-f740-4dea-92ab-ed0458ba05ce", |
| | | "name": "text-to-3D", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "text-to-image synthesis", |
| | | "id": "c37dcb7d-7577-4b8f-95ae-252797eb5cce", |
| | | "name": "text-to-image synthesis", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| "display_name": "semantic labeling", | | "display_name": "vision and language", |
| "id": "75c04c50-d8e4-4f25-91ab-8cdf91f69f96", | | "id": "3745ee63-01b9-4847-8aeb-4d8a32d5b9f7", |
| "name": "semantic labeling", | | "name": "vision and language", |
| "state": "active", | | "state": "active", |
| "vocabulary_id": null | | "vocabulary_id": null |
| }, | | }, |
| { | | { |
n | | n | "display_name": "vision-language", |
| | | "id": "81685daa-749b-408e-97dc-4ca793a0f68d", |
| | | "name": "vision-language", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "weakly supervised", |
| | | "id": "72956467-0404-428c-a719-92da4113456d", |
| | | "name": "weakly supervised", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| "display_name": "text understanding", | | "display_name": "zero-shot learning", |
| "id": "1769ec7b-a07a-4080-9866-ecc2cf5a5208", | | "id": "a5085ccf-44ae-4bee-a51e-3fc7c7d9ac69", |
| "name": "text understanding", | | "name": "zero-shot learning", |
| "state": "active", | | |
| "vocabulary_id": null | | |
| }, | | |
| { | | |
| "display_name": "visual question answering", | | |
| "id": "8be24887-e029-464f-b56c-1d0a460e2005", | | |
| "name": "visual question answering", | | |
| "state": "active", | | "state": "active", |
| "vocabulary_id": null | | "vocabulary_id": null |
| } | | } |
| ], | | ], |
t | "title": "MS COCO", | t | "title": "MS-COCO", |
| "type": "dataset", | | "type": "dataset", |
| "version": "" | | "version": "" |
| } | | } |