Changes
On December 21, 2024 at 1:03:06 PM UTC, Ahmad Sakor:
-
Added resource Evaluation Dataset to Pipeline for Arabic Legal Text Summarization Dataset
f | 1 | { | f | 1 | { |
2 | "access_rights": "", | 2 | "access_rights": "", | ||
3 | "accrualPeriodicity": "", | 3 | "accrualPeriodicity": "", | ||
4 | "author": "Ahmad Sakor", | 4 | "author": "Ahmad Sakor", | ||
5 | "author_email": "", | 5 | "author_email": "", | ||
6 | "citation": [], | 6 | "citation": [], | ||
7 | "conformsTo": "", | 7 | "conformsTo": "", | ||
8 | "creator_user_id": "0728da89-2020-4436-afb1-80580688ed61", | 8 | "creator_user_id": "0728da89-2020-4436-afb1-80580688ed61", | ||
9 | "defined_in": "", | 9 | "defined_in": "", | ||
10 | "doi": "10.57702/djfcf0oa", | 10 | "doi": "10.57702/djfcf0oa", | ||
11 | "doi_date_published": "2024-12-21", | 11 | "doi_date_published": "2024-12-21", | ||
12 | "doi_publisher": "TIB", | 12 | "doi_publisher": "TIB", | ||
13 | "doi_status": true, | 13 | "doi_status": true, | ||
14 | "domain": "https://service.tib.eu/ldmservice", | 14 | "domain": "https://service.tib.eu/ldmservice", | ||
15 | "end_date": "", | 15 | "end_date": "", | ||
16 | "extra_authors": [ | 16 | "extra_authors": [ | ||
17 | { | 17 | { | ||
18 | "extra_author": "", | 18 | "extra_author": "", | ||
19 | "orcid": "" | 19 | "orcid": "" | ||
20 | } | 20 | } | ||
21 | ], | 21 | ], | ||
22 | "extras": [ | 22 | "extras": [ | ||
23 | { | 23 | { | ||
24 | "__extras": { | 24 | "__extras": { | ||
25 | "id": "a8053c50-7de2-4367-a6a5-66b7c2a0a0d6", | 25 | "id": "a8053c50-7de2-4367-a6a5-66b7c2a0a0d6", | ||
26 | "package_id": "36f85159-319d-4244-abff-69dc9dbb393d", | 26 | "package_id": "36f85159-319d-4244-abff-69dc9dbb393d", | ||
27 | "state": "active" | 27 | "state": "active" | ||
28 | }, | 28 | }, | ||
29 | "key": "", | 29 | "key": "", | ||
30 | "value": "" | 30 | "value": "" | ||
31 | } | 31 | } | ||
32 | ], | 32 | ], | ||
33 | "groups": [], | 33 | "groups": [], | ||
34 | "id": "36f85159-319d-4244-abff-69dc9dbb393d", | 34 | "id": "36f85159-319d-4244-abff-69dc9dbb393d", | ||
35 | "isopen": false, | 35 | "isopen": false, | ||
36 | "landing_page": "", | 36 | "landing_page": "", | ||
37 | "language": "", | 37 | "language": "", | ||
38 | "license_id": "notspecified", | 38 | "license_id": "notspecified", | ||
39 | "license_title": "License not specified", | 39 | "license_title": "License not specified", | ||
40 | "link_orkg": "", | 40 | "link_orkg": "", | ||
41 | "maintainer": "", | 41 | "maintainer": "", | ||
42 | "maintainer_email": "", | 42 | "maintainer_email": "", | ||
43 | "metadata_created": "2024-12-21T12:50:03.115243", | 43 | "metadata_created": "2024-12-21T12:50:03.115243", | ||
n | 44 | "metadata_modified": "2024-12-21T13:02:19.866206", | n | 44 | "metadata_modified": "2024-12-21T13:03:05.633355", |
45 | "name": "pipeline-for-arabic-legal-text-summarization-dataset", | 45 | "name": "pipeline-for-arabic-legal-text-summarization-dataset", | ||
46 | "notes": "This dataset contains the data used for the Pipeline for | 46 | "notes": "This dataset contains the data used for the Pipeline for | ||
47 | Arabic Legal Text Summarization", | 47 | Arabic Legal Text Summarization", | ||
n | 48 | "num_resources": 5, | n | 48 | "num_resources": 6, |
49 | "num_tags": 0, | 49 | "num_tags": 0, | ||
50 | "orcid": "", | 50 | "orcid": "", | ||
51 | "organization": { | 51 | "organization": { | ||
52 | "approval_status": "approved", | 52 | "approval_status": "approved", | ||
53 | "created": "2017-11-23T17:30:37.757128", | 53 | "created": "2017-11-23T17:30:37.757128", | ||
54 | "description": "The German National Library of Science and | 54 | "description": "The German National Library of Science and | ||
55 | Technology, abbreviated TIB, is the national library of the Federal | 55 | Technology, abbreviated TIB, is the national library of the Federal | ||
56 | Republic of Germany for all fields of engineering, technology, and the | 56 | Republic of Germany for all fields of engineering, technology, and the | ||
57 | natural sciences.", | 57 | natural sciences.", | ||
58 | "id": "0c5362f5-b99e-41db-8256-3d0d7549bf4d", | 58 | "id": "0c5362f5-b99e-41db-8256-3d0d7549bf4d", | ||
59 | "image_url": | 59 | "image_url": | ||
60 | 3conf/ext/tib_tmpl_bootstrap/Resources/Public/images/TIB_Logo_en.png", | 60 | 3conf/ext/tib_tmpl_bootstrap/Resources/Public/images/TIB_Logo_en.png", | ||
61 | "is_organization": true, | 61 | "is_organization": true, | ||
62 | "name": "tib", | 62 | "name": "tib", | ||
63 | "state": "active", | 63 | "state": "active", | ||
64 | "title": "TIB", | 64 | "title": "TIB", | ||
65 | "type": "organization" | 65 | "type": "organization" | ||
66 | }, | 66 | }, | ||
67 | "owner_org": "0c5362f5-b99e-41db-8256-3d0d7549bf4d", | 67 | "owner_org": "0c5362f5-b99e-41db-8256-3d0d7549bf4d", | ||
68 | "page": "", | 68 | "page": "", | ||
69 | "private": false, | 69 | "private": false, | ||
70 | "relationships_as_object": [], | 70 | "relationships_as_object": [], | ||
71 | "relationships_as_subject": [], | 71 | "relationships_as_subject": [], | ||
72 | "resources": [ | 72 | "resources": [ | ||
73 | { | 73 | { | ||
74 | "auto_update_last_update": "", | 74 | "auto_update_last_update": "", | ||
75 | "cache_last_updated": null, | 75 | "cache_last_updated": null, | ||
76 | "cache_url": null, | 76 | "cache_url": null, | ||
77 | "created": "2024-12-21T12:52:05.522447", | 77 | "created": "2024-12-21T12:52:05.522447", | ||
78 | "description": "The gold standard built using GPT-4 in JSON | 78 | "description": "The gold standard built using GPT-4 in JSON | ||
79 | format.\r\nIt contains the summaries for the input legal cases text", | 79 | format.\r\nIt contains the summaries for the input legal cases text", | ||
80 | "format": "JSON", | 80 | "format": "JSON", | ||
81 | "hash": "", | 81 | "hash": "", | ||
82 | "id": "d2eb87ed-9f05-45a7-8196-d8b3aca86c97", | 82 | "id": "d2eb87ed-9f05-45a7-8196-d8b3aca86c97", | ||
83 | "language": "Arabic", | 83 | "language": "Arabic", | ||
84 | "last_modified": "2024-12-21T12:52:05.504552", | 84 | "last_modified": "2024-12-21T12:52:05.504552", | ||
85 | "media": "", | 85 | "media": "", | ||
86 | "metadata_modified": "2024-12-21T12:52:05.518962", | 86 | "metadata_modified": "2024-12-21T12:52:05.518962", | ||
87 | "mimetype": "application/zip", | 87 | "mimetype": "application/zip", | ||
88 | "mimetype_inner": null, | 88 | "mimetype_inner": null, | ||
89 | "name": "Gold Standard", | 89 | "name": "Gold Standard", | ||
90 | "package_id": "36f85159-319d-4244-abff-69dc9dbb393d", | 90 | "package_id": "36f85159-319d-4244-abff-69dc9dbb393d", | ||
91 | "position": 0, | 91 | "position": 0, | ||
92 | "resource_type": null, | 92 | "resource_type": null, | ||
93 | "rights": "", | 93 | "rights": "", | ||
94 | "size": 83404108, | 94 | "size": 83404108, | ||
95 | "state": "active", | 95 | "state": "active", | ||
96 | "url": | 96 | "url": | ||
97 | esource/d2eb87ed-9f05-45a7-8196-d8b3aca86c97/download/json_files.zip", | 97 | esource/d2eb87ed-9f05-45a7-8196-d8b3aca86c97/download/json_files.zip", | ||
98 | "url_type": "upload" | 98 | "url_type": "upload" | ||
99 | }, | 99 | }, | ||
100 | { | 100 | { | ||
101 | "auto_update_last_update": "", | 101 | "auto_update_last_update": "", | ||
102 | "cache_last_updated": null, | 102 | "cache_last_updated": null, | ||
103 | "cache_url": null, | 103 | "cache_url": null, | ||
104 | "created": "2024-12-21T12:55:38.720753", | 104 | "created": "2024-12-21T12:55:38.720753", | ||
105 | "description": "This file contains the extracted text from the | 105 | "description": "This file contains the extracted text from the | ||
106 | PDFs of the legal cases", | 106 | PDFs of the legal cases", | ||
107 | "format": "TXT", | 107 | "format": "TXT", | ||
108 | "hash": "", | 108 | "hash": "", | ||
109 | "id": "5ce92d8e-1be3-48e7-b1f4-7648e6cb4505", | 109 | "id": "5ce92d8e-1be3-48e7-b1f4-7648e6cb4505", | ||
110 | "language": "Arabic", | 110 | "language": "Arabic", | ||
111 | "last_modified": "2024-12-21T12:55:38.701633", | 111 | "last_modified": "2024-12-21T12:55:38.701633", | ||
112 | "media": "", | 112 | "media": "", | ||
113 | "metadata_modified": "2024-12-21T12:55:38.717076", | 113 | "metadata_modified": "2024-12-21T12:55:38.717076", | ||
114 | "mimetype": "application/zip", | 114 | "mimetype": "application/zip", | ||
115 | "mimetype_inner": null, | 115 | "mimetype_inner": null, | ||
116 | "name": "The extracted text of the cases", | 116 | "name": "The extracted text of the cases", | ||
117 | "package_id": "36f85159-319d-4244-abff-69dc9dbb393d", | 117 | "package_id": "36f85159-319d-4244-abff-69dc9dbb393d", | ||
118 | "position": 1, | 118 | "position": 1, | ||
119 | "resource_type": null, | 119 | "resource_type": null, | ||
120 | "rights": "", | 120 | "rights": "", | ||
121 | "size": 75326724, | 121 | "size": 75326724, | ||
122 | "state": "active", | 122 | "state": "active", | ||
123 | "url": | 123 | "url": | ||
124 | esource/5ce92d8e-1be3-48e7-b1f4-7648e6cb4505/download/text_files.zip", | 124 | esource/5ce92d8e-1be3-48e7-b1f4-7648e6cb4505/download/text_files.zip", | ||
125 | "url_type": "upload" | 125 | "url_type": "upload" | ||
126 | }, | 126 | }, | ||
127 | { | 127 | { | ||
128 | "auto_update_last_update": "", | 128 | "auto_update_last_update": "", | ||
129 | "cache_last_updated": null, | 129 | "cache_last_updated": null, | ||
130 | "cache_url": null, | 130 | "cache_url": null, | ||
131 | "created": "2024-12-21T12:58:13.131444", | 131 | "created": "2024-12-21T12:58:13.131444", | ||
132 | "description": "this files contains the generated output for the | 132 | "description": "this files contains the generated output for the | ||
133 | fine tuned model", | 133 | fine tuned model", | ||
134 | "format": "jsonl", | 134 | "format": "jsonl", | ||
135 | "hash": "", | 135 | "hash": "", | ||
136 | "id": "7e768106-75e8-490e-a906-8330349dbe6e", | 136 | "id": "7e768106-75e8-490e-a906-8330349dbe6e", | ||
137 | "language": "Arabic", | 137 | "language": "Arabic", | ||
138 | "last_modified": "2024-12-21T12:58:13.112030", | 138 | "last_modified": "2024-12-21T12:58:13.112030", | ||
139 | "media": "", | 139 | "media": "", | ||
140 | "metadata_modified": "2024-12-21T12:58:13.127965", | 140 | "metadata_modified": "2024-12-21T12:58:13.127965", | ||
141 | "mimetype": null, | 141 | "mimetype": null, | ||
142 | "mimetype_inner": null, | 142 | "mimetype_inner": null, | ||
143 | "name": "generated output of the fine tuned model", | 143 | "name": "generated output of the fine tuned model", | ||
144 | "package_id": "36f85159-319d-4244-abff-69dc9dbb393d", | 144 | "package_id": "36f85159-319d-4244-abff-69dc9dbb393d", | ||
145 | "position": 2, | 145 | "position": 2, | ||
146 | "resource_type": null, | 146 | "resource_type": null, | ||
147 | "rights": "", | 147 | "rights": "", | ||
148 | "size": 39440803, | 148 | "size": 39440803, | ||
149 | "state": "active", | 149 | "state": "active", | ||
150 | "url": | 150 | "url": | ||
151 | -a906-8330349dbe6e/download/generated_outputs_fine_tuned_model.jsonl", | 151 | -a906-8330349dbe6e/download/generated_outputs_fine_tuned_model.jsonl", | ||
152 | "url_type": "upload" | 152 | "url_type": "upload" | ||
153 | }, | 153 | }, | ||
154 | { | 154 | { | ||
155 | "auto_update_last_update": "", | 155 | "auto_update_last_update": "", | ||
156 | "cache_last_updated": null, | 156 | "cache_last_updated": null, | ||
157 | "cache_url": null, | 157 | "cache_url": null, | ||
158 | "created": "2024-12-21T12:59:10.386995", | 158 | "created": "2024-12-21T12:59:10.386995", | ||
159 | "description": "This file contains the generated output for the | 159 | "description": "This file contains the generated output for the | ||
160 | base model", | 160 | base model", | ||
161 | "format": "jsonl", | 161 | "format": "jsonl", | ||
162 | "hash": "", | 162 | "hash": "", | ||
163 | "id": "6e64ab34-faf1-4ac2-9afe-431293ca4cd1", | 163 | "id": "6e64ab34-faf1-4ac2-9afe-431293ca4cd1", | ||
164 | "language": "Arabic", | 164 | "language": "Arabic", | ||
165 | "last_modified": "2024-12-21T12:59:10.364168", | 165 | "last_modified": "2024-12-21T12:59:10.364168", | ||
166 | "media": "", | 166 | "media": "", | ||
167 | "metadata_modified": "2024-12-21T12:59:10.382996", | 167 | "metadata_modified": "2024-12-21T12:59:10.382996", | ||
168 | "mimetype": null, | 168 | "mimetype": null, | ||
169 | "mimetype_inner": null, | 169 | "mimetype_inner": null, | ||
170 | "name": "generated output of the base model", | 170 | "name": "generated output of the base model", | ||
171 | "package_id": "36f85159-319d-4244-abff-69dc9dbb393d", | 171 | "package_id": "36f85159-319d-4244-abff-69dc9dbb393d", | ||
172 | "position": 3, | 172 | "position": 3, | ||
173 | "resource_type": null, | 173 | "resource_type": null, | ||
174 | "rights": "", | 174 | "rights": "", | ||
175 | "size": 38719159, | 175 | "size": 38719159, | ||
176 | "state": "active", | 176 | "state": "active", | ||
177 | "url": | 177 | "url": | ||
178 | 1-4ac2-9afe-431293ca4cd1/download/generated_outputs_base_model.jsonl", | 178 | 1-4ac2-9afe-431293ca4cd1/download/generated_outputs_base_model.jsonl", | ||
179 | "url_type": "upload" | 179 | "url_type": "upload" | ||
180 | }, | 180 | }, | ||
181 | { | 181 | { | ||
182 | "auto_update_last_update": "", | 182 | "auto_update_last_update": "", | ||
183 | "cache_last_updated": null, | 183 | "cache_last_updated": null, | ||
184 | "cache_url": null, | 184 | "cache_url": null, | ||
185 | "created": "2024-12-21T13:02:19.874089", | 185 | "created": "2024-12-21T13:02:19.874089", | ||
186 | "description": "this file contains the training dataset used for | 186 | "description": "this file contains the training dataset used for | ||
187 | fine tuning the model", | 187 | fine tuning the model", | ||
188 | "format": "jsonl", | 188 | "format": "jsonl", | ||
189 | "hash": "", | 189 | "hash": "", | ||
190 | "id": "21ef5269-2693-4f07-98f6-8b0b58fcc3a2", | 190 | "id": "21ef5269-2693-4f07-98f6-8b0b58fcc3a2", | ||
191 | "language": "Arabic", | 191 | "language": "Arabic", | ||
192 | "last_modified": "2024-12-21T13:02:19.851653", | 192 | "last_modified": "2024-12-21T13:02:19.851653", | ||
193 | "media": "", | 193 | "media": "", | ||
194 | "metadata_modified": "2024-12-21T13:02:19.869911", | 194 | "metadata_modified": "2024-12-21T13:02:19.869911", | ||
195 | "mimetype": null, | 195 | "mimetype": null, | ||
196 | "mimetype_inner": null, | 196 | "mimetype_inner": null, | ||
197 | "name": "Training dataset", | 197 | "name": "Training dataset", | ||
198 | "package_id": "36f85159-319d-4244-abff-69dc9dbb393d", | 198 | "package_id": "36f85159-319d-4244-abff-69dc9dbb393d", | ||
199 | "position": 4, | 199 | "position": 4, | ||
200 | "resource_type": null, | 200 | "resource_type": null, | ||
201 | "rights": "", | 201 | "rights": "", | ||
202 | "size": 292869775, | 202 | "size": 292869775, | ||
203 | "state": "active", | 203 | "state": "active", | ||
204 | "url": | 204 | "url": | ||
205 | f5269-2693-4f07-98f6-8b0b58fcc3a2/download/train_dataset_final.jsonl", | 205 | f5269-2693-4f07-98f6-8b0b58fcc3a2/download/train_dataset_final.jsonl", | ||
206 | "url_type": "upload" | 206 | "url_type": "upload" | ||
t | t | 207 | }, | ||
208 | { | ||||
209 | "auto_update_last_update": "", | ||||
210 | "cache_last_updated": null, | ||||
211 | "cache_url": null, | ||||
212 | "created": "2024-12-21T13:03:05.641426", | ||||
213 | "description": "This file contains the evaluation dataset used | ||||
214 | in the experiments ", | ||||
215 | "format": "jsonl", | ||||
216 | "hash": "", | ||||
217 | "id": "29bce7e4-0d2d-4b4a-b1d5-136f13143a40", | ||||
218 | "language": "Arabic", | ||||
219 | "last_modified": "2024-12-21T13:03:05.618157", | ||||
220 | "media": "", | ||||
221 | "metadata_modified": "2024-12-21T13:03:05.637027", | ||||
222 | "mimetype": null, | ||||
223 | "mimetype_inner": null, | ||||
224 | "name": "Evaluation Dataset", | ||||
225 | "package_id": "36f85159-319d-4244-abff-69dc9dbb393d", | ||||
226 | "position": 5, | ||||
227 | "resource_type": null, | ||||
228 | "rights": "", | ||||
229 | "size": 32592981, | ||||
230 | "state": "active", | ||||
231 | "url": | ||||
232 | bce7e4-0d2d-4b4a-b1d5-136f13143a40/download/eval_dataset_final.jsonl", | ||||
233 | "url_type": "upload" | ||||
207 | } | 234 | } | ||
208 | ], | 235 | ], | ||
209 | "services_used_list": "", | 236 | "services_used_list": "", | ||
210 | "spatial": "", | 237 | "spatial": "", | ||
211 | "spatial_resolution": "", | 238 | "spatial_resolution": "", | ||
212 | "start_date": "", | 239 | "start_date": "", | ||
213 | "state": "active", | 240 | "state": "active", | ||
214 | "tags": [], | 241 | "tags": [], | ||
215 | "temporal_resolution": "", | 242 | "temporal_resolution": "", | ||
216 | "title": "Pipeline for Arabic Legal Text Summarization Dataset", | 243 | "title": "Pipeline for Arabic Legal Text Summarization Dataset", | ||
217 | "type": "dataset", | 244 | "type": "dataset", | ||
218 | "url": "", | 245 | "url": "", | ||
219 | "version": "", | 246 | "version": "", | ||
220 | "version_note": "" | 247 | "version_note": "" | ||
221 | } | 248 | } |