f | { | f | { |
| "access_rights": "", | | "access_rights": "", |
| "author": "Piyush Sharma", | | "author": "Piyush Sharma", |
| "author_email": "", | | "author_email": "", |
| "citation": [ | | "citation": [ |
n | | n | "https://doi.org/10.48550/arXiv.2306.15447", |
| "https://doi.org/10.48550/arXiv.1908.08530" | | "https://doi.org/10.48550/arXiv.2406.09305", |
| | | "https://doi.org/10.48550/arXiv.2106.13884", |
| | | "https://doi.org/10.48550/arXiv.2209.14667", |
| | | "https://doi.org/10.48550/arXiv.2303.12419", |
| | | "https://doi.org/10.48550/arXiv.2305.17718", |
| | | "https://doi.org/10.48550/arXiv.2208.04060", |
| | | "https://doi.org/10.48550/arXiv.2304.02828", |
| | | "https://doi.org/10.48550/arXiv.2007.08617", |
| | | "https://doi.org/10.48550/arXiv.2310.19654" |
| ], | | ], |
| "creator_user_id": "17755db4-395a-4b3b-ac09-e8e3484ca700", | | "creator_user_id": "17755db4-395a-4b3b-ac09-e8e3484ca700", |
n | "defined_in": "https://doi.org/10.48550/arXiv.1909.11059", | n | "defined_in": "https://doi.org/10.48550/arXiv.2312.04567", |
| "doi": "10.57702/6qvb3f54", | | "doi": "10.57702/6qvb3f54", |
| "doi_date_published": "2024-11-25", | | "doi_date_published": "2024-11-25", |
| "doi_publisher": "TIB", | | "doi_publisher": "TIB", |
| "doi_status": true, | | "doi_status": true, |
| "domain": "https://service.tib.eu/ldmservice", | | "domain": "https://service.tib.eu/ldmservice", |
| "extra_authors": [ | | "extra_authors": [ |
| { | | { |
| "extra_author": "Nan Ding", | | "extra_author": "Nan Ding", |
| "orcid": "" | | "orcid": "" |
| }, | | }, |
| { | | { |
| "extra_author": "Sebastian Goodman", | | "extra_author": "Sebastian Goodman", |
| "orcid": "" | | "orcid": "" |
| }, | | }, |
| { | | { |
| "extra_author": "Radu Soricut", | | "extra_author": "Radu Soricut", |
| "orcid": "" | | "orcid": "" |
| } | | } |
| ], | | ], |
n | "groups": [], | n | "groups": [ |
| | | { |
| | | "description": "", |
| | | "display_name": "Image Captioning", |
| | | "id": "7a76ce67-2607-4da9-a837-d2017dc33ec6", |
| | | "image_display_url": "", |
| | | "name": "image-captioning", |
| | | "title": "Image Captioning" |
| | | }, |
| | | { |
| | | "description": "", |
| | | "display_name": "Image-Text Retrieval", |
| | | "id": "28bbc5c8-e229-4df6-9cf1-d2040f80541a", |
| | | "image_display_url": "", |
| | | "name": "image-text-retrieval", |
| | | "title": "Image-Text Retrieval" |
| | | }, |
| | | { |
| | | "description": "", |
| | | "display_name": "Multimodal Learning", |
| | | "id": "a88cb918-103d-4226-a87d-9d9103c1f839", |
| | | "image_display_url": "", |
| | | "name": "multimodal-learning", |
| | | "title": "Multimodal Learning" |
| | | }, |
| | | { |
| | | "description": "", |
| | | "display_name": "Question Answering", |
| | | "id": "01e9bd6b-910d-421d-bb31-799604023211", |
| | | "image_display_url": "", |
| | | "name": "question-answering", |
| | | "title": "Question Answering" |
| | | }, |
| | | { |
| | | "description": "", |
| | | "display_name": "Vision-and-Language Models", |
| | | "id": "8859491a-95fd-495f-9e99-91165571544a", |
| | | "image_display_url": "", |
| | | "name": "vision-and-language-models", |
| | | "title": "Vision-and-Language Models" |
| | | }, |
| | | { |
| | | "description": "", |
| | | "display_name": "Visual Question Answering", |
| | | "id": "e15f82e8-481e-43a8-8a39-d6e0751ace6c", |
| | | "image_display_url": "", |
| | | "name": "visual-question-answering", |
| | | "title": "Visual Question Answering" |
| | | } |
| | | ], |
| "id": "9607542b-7580-4898-aab0-72dc1ec56289", | | "id": "9607542b-7580-4898-aab0-72dc1ec56289", |
| "isopen": false, | | "isopen": false, |
n | "landing_page": "", | n | "landing_page": |
| | | "https://github.com/soravit-changpinyo/Conceptual-Captions", |
| "license_title": null, | | "license_title": null, |
| "link_orkg": "", | | "link_orkg": "", |
| "metadata_created": "2024-11-25T14:19:56.278602", | | "metadata_created": "2024-11-25T14:19:56.278602", |
n | "metadata_modified": "2024-11-25T14:33:09.899762", | n | "metadata_modified": "2024-12-02T22:05:36.278874", |
| "name": "conceptual-captions", | | "name": "conceptual-captions", |
n | "notes": "Conceptual Captions is a large-scale real-world dataset | n | "notes": "The dataset used in the paper \"Scaling Laws of Synthetic |
| that contains approximately 3% to 20% mismatched image-text pairs, | | Images for Model Training\". The dataset is used for supervised image |
| comprising 3,334,173 images with a single caption each.", | | classification and zero-shot classification tasks.", |
| "num_resources": 1, | | "num_resources": 0, |
| "num_tags": 0, | | "num_tags": 18, |
| "organization": { | | "organization": { |
| "approval_status": "approved", | | "approval_status": "approved", |
| "created": "2024-11-25T12:11:38.292601", | | "created": "2024-11-25T12:11:38.292601", |
| "description": "", | | "description": "", |
| "id": "079d46db-32df-4b48-91f3-0a8bc8f69559", | | "id": "079d46db-32df-4b48-91f3-0a8bc8f69559", |
| "image_url": "", | | "image_url": "", |
| "is_organization": true, | | "is_organization": true, |
| "name": "no-organization", | | "name": "no-organization", |
| "state": "active", | | "state": "active", |
| "title": "No Organization", | | "title": "No Organization", |
| "type": "organization" | | "type": "organization" |
| }, | | }, |
| "owner_org": "079d46db-32df-4b48-91f3-0a8bc8f69559", | | "owner_org": "079d46db-32df-4b48-91f3-0a8bc8f69559", |
| "private": false, | | "private": false, |
| "relationships_as_object": [], | | "relationships_as_object": [], |
| "relationships_as_subject": [], | | "relationships_as_subject": [], |
n | "resources": [ | n | "resources": [], |
| { | | |
| "cache_last_updated": null, | | |
| "cache_url": null, | | |
| "created": "2024-11-25T15:30:26", | | |
| "data": [ | | |
| "dcterms:title", | | |
| "dcterms:accessRights", | | |
| "dcterms:creator", | | |
| "dcterms:description", | | |
| "dcterms:issued", | | |
| "dcterms:language", | | |
| "dcterms:identifier", | | |
| "dcat:theme", | | |
| "dcterms:type", | | |
| "dcat:keyword", | | |
| "dcat:landingPage", | | |
| "dcterms:hasVersion", | | |
| "dcterms:format", | | |
| "mls:task", | | |
| "datacite:isDescribedBy" | | |
| ], | | |
| "description": "The json representation of the dataset with its | | |
| distributions based on DCAT.", | | |
| "format": "JSON", | | |
| "hash": "", | | |
| "id": "86aeedcf-e77a-470a-b13f-c5325d70a86c", | | |
| "last_modified": "2024-11-25T14:33:09.891953", | | |
| "metadata_modified": "2024-11-25T14:33:09.903229", | | |
| "mimetype": "application/json", | | |
| "mimetype_inner": null, | | |
| "name": "Original Metadata", | | |
| "package_id": "9607542b-7580-4898-aab0-72dc1ec56289", | | |
| "position": 0, | | |
| "resource_type": null, | | |
| "size": 1052, | | |
| "state": "active", | | |
| "url": | | |
| resource/86aeedcf-e77a-470a-b13f-c5325d70a86c/download/metadata.json", | | |
| "url_type": "upload" | | |
| } | | |
| ], | | |
| "services_used_list": "", | | "services_used_list": "", |
| "state": "active", | | "state": "active", |
n | "tags": [], | n | "tags": [ |
| | | { |
| | | "display_name": "Conceptual Captions", |
| | | "id": "c0b7fb3a-fb3c-49f6-ad33-6907b0c8e7e7", |
| | | "name": "Conceptual Captions", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "Dataset", |
| | | "id": "81587eb2-9569-4a4b-83c8-0e2ac78e7e3b", |
| | | "name": "Dataset", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "Image Captioning", |
| | | "id": "c708cba4-0a1f-45c9-826f-898857783343", |
| | | "name": "Image Captioning", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "Multimodal Data", |
| | | "id": "fbeb6437-73ab-4d00-aaba-4fff5139add9", |
| | | "name": "Multimodal Data", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "Multimodal Learning", |
| | | "id": "41329983-d90e-4560-a97d-7fa2ba0a1f92", |
| | | "name": "Multimodal Learning", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "Question Answering", |
| | | "id": "90f0a19e-b0c2-47b9-9180-dd38182c8003", |
| | | "name": "Question Answering", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "conceptual captions", |
| | | "id": "0ecb2a3a-1e29-4dbe-8026-fc3e1bb4a1b0", |
| | | "name": "conceptual captions", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "dataset", |
| | | "id": "ce5ad030-ca3d-47e6-abd1-5c92a2806f1b", |
| | | "name": "dataset", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "image captioning", |
| | | "id": "f1bbe827-a03a-4280-b9fa-0599ccfc0541", |
| | | "name": "image captioning", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "image-text pairs", |
| | | "id": "07cb3691-65c6-4b58-b3bf-5290980a86e3", |
| | | "name": "image-text pairs", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "image-text retrieval", |
| | | "id": "2ce62fa7-a31e-4be3-9312-92be69a8726b", |
| | | "name": "image-text retrieval", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "large language models", |
| | | "id": "a8509b72-f238-4646-ab16-be50d0c7514c", |
| | | "name": "large language models", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "large-scale dataset", |
| | | "id": "a9c694bf-f591-4625-a20e-d53d3f90d489", |
| | | "name": "large-scale dataset", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "loosely correlated", |
| | | "id": "d6aa6150-1dd6-4474-ad4d-f37c8c893f42", |
| | | "name": "loosely correlated", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "multimodal learning", |
| | | "id": "0decb357-2292-4127-9886-35e2f72c9df2", |
| | | "name": "multimodal learning", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "vision and language", |
| | | "id": "3745ee63-01b9-4847-8aeb-4d8a32d5b9f7", |
| | | "name": "vision and language", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "vision-and-language models", |
| | | "id": "7645deef-42d9-4294-a894-9829f9c04122", |
| | | "name": "vision-and-language models", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | }, |
| | | { |
| | | "display_name": "visual question answering", |
| | | "id": "8be24887-e029-464f-b56c-1d0a460e2005", |
| | | "name": "visual question answering", |
| | | "state": "active", |
| | | "vocabulary_id": null |
| | | } |
| | | ], |
| "title": "Conceptual Captions", | | "title": "Conceptual Captions", |
| "type": "dataset", | | "type": "dataset", |
t | "version": "CC152K" | t | "version": "" |
| } | | } |