Cambios
En el instante 30 de mayo de 2024, 16:05:15 UTC, Administrador CKAN:
-
Modificado el valor del campo
multilingual_tags
a{'en': ['Biomedical natural language processing', 'Parallel sentences', 'Medical text simplification']}
en CLARA-MeD simplified sentences
f | 1 | { | f | 1 | { |
2 | "author": null, | 2 | "author": null, | ||
3 | "author_email": null, | 3 | "author_email": null, | ||
4 | "conforms_to": [], | 4 | "conforms_to": [], | ||
5 | "coverage_new": {}, | 5 | "coverage_new": {}, | ||
6 | "creator_user_id": "196556b3-e0c4-4c51-a9e6-f51cc752bc37", | 6 | "creator_user_id": "196556b3-e0c4-4c51-a9e6-f51cc752bc37", | ||
7 | "description": { | 7 | "description": { | ||
8 | "en": "This dataset contains 1200 manually simplified sentences | 8 | "en": "This dataset contains 1200 manually simplified sentences | ||
9 | (144 019 tokens) from clinical trials in Spanish. A total of 1040 | 9 | (144 019 tokens) from clinical trials in Spanish. A total of 1040 | ||
10 | announcements from the European Clinical Trials Register (EudraCT) | 10 | announcements from the European Clinical Trials Register (EudraCT) | ||
11 | were analyzed to select sentences with ambiguities or exceeding 25 | 11 | were analyzed to select sentences with ambiguities or exceeding 25 | ||
12 | words. Simplification criteria were devised in an annotation | 12 | words. Simplification criteria were devised in an annotation | ||
13 | guideline, which is released publicly along the dataset.\r\n\r\nThis | 13 | guideline, which is released publicly along the dataset.\r\n\r\nThis | ||
14 | resource was collected in the CLARA-MeD project, with the goal of | 14 | resource was collected in the CLARA-MeD project, with the goal of | ||
15 | simplifying medical texts in the Spanish language and reduce the | 15 | simplifying medical texts in the Spanish language and reduce the | ||
16 | language barrier to patient's informed decision making. In particular, | 16 | language barrier to patient's informed decision making. In particular, | ||
17 | the project aims at developing linguistic resources for automatic | 17 | the project aims at developing linguistic resources for automatic | ||
18 | medical term simplification in Spanish; and conducting experiments in | 18 | medical term simplification in Spanish; and conducting experiments in | ||
19 | automatic text simplification.", | 19 | automatic text simplification.", | ||
20 | "es": "This dataset contains 1200 manually simplified sentences | 20 | "es": "This dataset contains 1200 manually simplified sentences | ||
21 | (144 019 tokens) from clinical trials in Spanish. A total of 1040 | 21 | (144 019 tokens) from clinical trials in Spanish. A total of 1040 | ||
22 | announcements from the European Clinical Trials Register (EudraCT) | 22 | announcements from the European Clinical Trials Register (EudraCT) | ||
23 | were analyzed to select sentences with ambiguities or exceeding 25 | 23 | were analyzed to select sentences with ambiguities or exceeding 25 | ||
24 | words. Simplification criteria were devised in an annotation | 24 | words. Simplification criteria were devised in an annotation | ||
25 | guideline, which is released publicly along the dataset.\r\n\r\nThis | 25 | guideline, which is released publicly along the dataset.\r\n\r\nThis | ||
26 | resource was collected in the CLARA-MeD project, with the goal of | 26 | resource was collected in the CLARA-MeD project, with the goal of | ||
27 | simplifying medical texts in the Spanish language and reduce the | 27 | simplifying medical texts in the Spanish language and reduce the | ||
28 | language barrier to patient's informed decision making. In particular, | 28 | language barrier to patient's informed decision making. In particular, | ||
29 | the project aims at developing linguistic resources for automatic | 29 | the project aims at developing linguistic resources for automatic | ||
30 | medical term simplification in Spanish; and conducting experiments in | 30 | medical term simplification in Spanish; and conducting experiments in | ||
31 | automatic text simplification." | 31 | automatic text simplification." | ||
32 | }, | 32 | }, | ||
33 | "groups": [], | 33 | "groups": [], | ||
34 | "id": "73cc4b2b-f43c-4efd-9d6d-113bc923cd77", | 34 | "id": "73cc4b2b-f43c-4efd-9d6d-113bc923cd77", | ||
35 | "identifier": "https://doi.org/10.20350/digitalCSIC/16110", | 35 | "identifier": "https://doi.org/10.20350/digitalCSIC/16110", | ||
36 | "isopen": false, | 36 | "isopen": false, | ||
37 | "issued_date": "2024-02-09T00:00:00", | 37 | "issued_date": "2024-02-09T00:00:00", | ||
38 | "language": [ | 38 | "language": [ | ||
39 | "es", | 39 | "es", | ||
40 | "en" | 40 | "en" | ||
41 | ], | 41 | ], | ||
42 | "license_id": | 42 | "license_id": | ||
43 | "https://digital.csic.es/handle/10261/346579?mode=full", | 43 | "https://digital.csic.es/handle/10261/346579?mode=full", | ||
44 | "license_title": | 44 | "license_title": | ||
45 | "https://digital.csic.es/handle/10261/346579?mode=full", | 45 | "https://digital.csic.es/handle/10261/346579?mode=full", | ||
46 | "maintainer": null, | 46 | "maintainer": null, | ||
47 | "maintainer_email": null, | 47 | "maintainer_email": null, | ||
48 | "metadata_created": "2024-05-30T15:57:14.431217", | 48 | "metadata_created": "2024-05-30T15:57:14.431217", | ||
n | 49 | "metadata_modified": "2024-05-30T15:59:40.959695", | n | 49 | "metadata_modified": "2024-05-30T16:05:15.774184", |
50 | "multilingual_tags": { | 50 | "multilingual_tags": { | ||
51 | "en": [ | 51 | "en": [ | ||
t | 52 | "Biomedical natural language processing", | t | ||
53 | "Parallel sentences", | ||||
54 | "Medical text simplification" | ||||
55 | ], | ||||
56 | "es": [ | ||||
57 | "Biomedical natural language processing", | 52 | "Biomedical natural language processing", | ||
58 | "Parallel sentences", | 53 | "Parallel sentences", | ||
59 | "Medical text simplification" | 54 | "Medical text simplification" | ||
60 | ] | 55 | ] | ||
61 | }, | 56 | }, | ||
62 | "name": "clara-med-simplified-sentences", | 57 | "name": "clara-med-simplified-sentences", | ||
63 | "notes": null, | 58 | "notes": null, | ||
64 | "num_resources": 3, | 59 | "num_resources": 3, | ||
65 | "num_tags": 0, | 60 | "num_tags": 0, | ||
66 | "organization": { | 61 | "organization": { | ||
67 | "approval_status": "approved", | 62 | "approval_status": "approved", | ||
68 | "created": "2023-09-25T12:13:42.172869", | 63 | "created": "2023-09-25T12:13:42.172869", | ||
69 | "description": "El Instituto de Lengua, Literatura y | 64 | "description": "El Instituto de Lengua, Literatura y | ||
70 | Antropolog\u00eda, ILLA (CSIC) tiene como objetivo primordial la | 65 | Antropolog\u00eda, ILLA (CSIC) tiene como objetivo primordial la | ||
71 | investigaci\u00f3n del patrimonio cultural hisp\u00e1nico en su triple | 66 | investigaci\u00f3n del patrimonio cultural hisp\u00e1nico en su triple | ||
72 | dimensi\u00f3n antropol\u00f3gica, ling\u00fc\u00edstica y | 67 | dimensi\u00f3n antropol\u00f3gica, ling\u00fc\u00edstica y | ||
73 | literaria.", | 68 | literaria.", | ||
74 | "id": "fc47e531-a165-4eac-8fc7-34342a3a38ff", | 69 | "id": "fc47e531-a165-4eac-8fc7-34342a3a38ff", | ||
75 | "image_url": "2023-09-25-101342.167134illa0.png", | 70 | "image_url": "2023-09-25-101342.167134illa0.png", | ||
76 | "is_organization": true, | 71 | "is_organization": true, | ||
77 | "name": "instituto-de-lengua-literatura-y-antropologia-illa-csic", | 72 | "name": "instituto-de-lengua-literatura-y-antropologia-illa-csic", | ||
78 | "state": "active", | 73 | "state": "active", | ||
79 | "title": "Instituto de Lengua, Literatura y Antropolog\u00eda | 74 | "title": "Instituto de Lengua, Literatura y Antropolog\u00eda | ||
80 | (ILLA), CSIC", | 75 | (ILLA), CSIC", | ||
81 | "type": "organization" | 76 | "type": "organization" | ||
82 | }, | 77 | }, | ||
83 | "owner_org": "fc47e531-a165-4eac-8fc7-34342a3a38ff", | 78 | "owner_org": "fc47e531-a165-4eac-8fc7-34342a3a38ff", | ||
84 | "private": false, | 79 | "private": false, | ||
85 | "publisher": "fc47e531-a165-4eac-8fc7-34342a3a38ff", | 80 | "publisher": "fc47e531-a165-4eac-8fc7-34342a3a38ff", | ||
86 | "reference": [], | 81 | "reference": [], | ||
87 | "relationships_as_object": [], | 82 | "relationships_as_object": [], | ||
88 | "relationships_as_subject": [], | 83 | "relationships_as_subject": [], | ||
89 | "resources": [ | 84 | "resources": [ | ||
90 | { | 85 | { | ||
91 | "byte_size": "981,11 kB", | 86 | "byte_size": "981,11 kB", | ||
92 | "cache_last_updated": null, | 87 | "cache_last_updated": null, | ||
93 | "cache_url": null, | 88 | "cache_url": null, | ||
94 | "created": "2024-05-30T15:57:45.357301", | 89 | "created": "2024-05-30T15:57:45.357301", | ||
95 | "datastore_active": false, | 90 | "datastore_active": false, | ||
96 | "description": null, | 91 | "description": null, | ||
97 | "format": "tsv", | 92 | "format": "tsv", | ||
98 | "hash": "", | 93 | "hash": "", | ||
99 | "id": "a05fd101-9c06-4312-bb30-13f6ea008d46", | 94 | "id": "a05fd101-9c06-4312-bb30-13f6ea008d46", | ||
100 | "last_modified": null, | 95 | "last_modified": null, | ||
101 | "metadata_modified": "2024-05-30T15:58:24.247167", | 96 | "metadata_modified": "2024-05-30T15:58:24.247167", | ||
102 | "mimetype": "text/tab-separated-values", | 97 | "mimetype": "text/tab-separated-values", | ||
103 | "mimetype_inner": null, | 98 | "mimetype_inner": null, | ||
104 | "name": "Dataset | 99 | "name": "Dataset | ||
105 | ital.csic.es/bitstream/10261/346579/1/claramed_synt_simp_aligned.tsv", | 100 | ital.csic.es/bitstream/10261/346579/1/claramed_synt_simp_aligned.tsv", | ||
106 | "name_translated": { | 101 | "name_translated": { | ||
107 | "en": "Dataset | 102 | "en": "Dataset | ||
108 | ital.csic.es/bitstream/10261/346579/1/claramed_synt_simp_aligned.tsv", | 103 | ital.csic.es/bitstream/10261/346579/1/claramed_synt_simp_aligned.tsv", | ||
109 | "es": "Dataset | 104 | "es": "Dataset | ||
110 | gital.csic.es/bitstream/10261/346579/1/claramed_synt_simp_aligned.tsv" | 105 | gital.csic.es/bitstream/10261/346579/1/claramed_synt_simp_aligned.tsv" | ||
111 | }, | 106 | }, | ||
112 | "package_id": "73cc4b2b-f43c-4efd-9d6d-113bc923cd77", | 107 | "package_id": "73cc4b2b-f43c-4efd-9d6d-113bc923cd77", | ||
113 | "position": 0, | 108 | "position": 0, | ||
114 | "resource_identifier": "", | 109 | "resource_identifier": "", | ||
115 | "resource_relation": [], | 110 | "resource_relation": [], | ||
116 | "resource_relation-1": "", | 111 | "resource_relation-1": "", | ||
117 | "resource_type": null, | 112 | "resource_type": null, | ||
118 | "size": null, | 113 | "size": null, | ||
119 | "state": "active", | 114 | "state": "active", | ||
120 | "url": | 115 | "url": | ||
121 | ital.csic.es/bitstream/10261/346579/1/claramed_synt_simp_aligned.tsv", | 116 | ital.csic.es/bitstream/10261/346579/1/claramed_synt_simp_aligned.tsv", | ||
122 | "url_type": null | 117 | "url_type": null | ||
123 | }, | 118 | }, | ||
124 | { | 119 | { | ||
125 | "byte_size": "757,92 kB", | 120 | "byte_size": "757,92 kB", | ||
126 | "cache_last_updated": null, | 121 | "cache_last_updated": null, | ||
127 | "cache_url": null, | 122 | "cache_url": null, | ||
128 | "created": "2024-05-30T15:59:20.596413", | 123 | "created": "2024-05-30T15:59:20.596413", | ||
129 | "datastore_active": false, | 124 | "datastore_active": false, | ||
130 | "description": null, | 125 | "description": null, | ||
131 | "format": "pdf", | 126 | "format": "pdf", | ||
132 | "hash": "", | 127 | "hash": "", | ||
133 | "id": "a1f5a665-35a0-4513-8123-8e3feed8c66b", | 128 | "id": "a1f5a665-35a0-4513-8123-8e3feed8c66b", | ||
134 | "last_modified": null, | 129 | "last_modified": null, | ||
135 | "metadata_modified": "2024-05-30T15:59:40.961858", | 130 | "metadata_modified": "2024-05-30T15:59:40.961858", | ||
136 | "mimetype": "application/pdf", | 131 | "mimetype": "application/pdf", | ||
137 | "mimetype_inner": null, | 132 | "mimetype_inner": null, | ||
138 | "name": "Guideline CLARA-MeD_simplif_guideline.pdf", | 133 | "name": "Guideline CLARA-MeD_simplif_guideline.pdf", | ||
139 | "name_translated": { | 134 | "name_translated": { | ||
140 | "en": "Guideline CLARA-MeD_simplif_guideline.pdf", | 135 | "en": "Guideline CLARA-MeD_simplif_guideline.pdf", | ||
141 | "es": "Guideline CLARA-MeD_simplif_guideline.pdf" | 136 | "es": "Guideline CLARA-MeD_simplif_guideline.pdf" | ||
142 | }, | 137 | }, | ||
143 | "package_id": "73cc4b2b-f43c-4efd-9d6d-113bc923cd77", | 138 | "package_id": "73cc4b2b-f43c-4efd-9d6d-113bc923cd77", | ||
144 | "position": 1, | 139 | "position": 1, | ||
145 | "resource_identifier": "", | 140 | "resource_identifier": "", | ||
146 | "resource_relation": [], | 141 | "resource_relation": [], | ||
147 | "resource_relation-1": "", | 142 | "resource_relation-1": "", | ||
148 | "resource_type": null, | 143 | "resource_type": null, | ||
149 | "size": null, | 144 | "size": null, | ||
150 | "state": "active", | 145 | "state": "active", | ||
151 | "url": | 146 | "url": | ||
152 | tal.csic.es/bitstream/10261/346579/2/CLARA-MeD_simplif_guideline.pdf", | 147 | tal.csic.es/bitstream/10261/346579/2/CLARA-MeD_simplif_guideline.pdf", | ||
153 | "url_type": null | 148 | "url_type": null | ||
154 | }, | 149 | }, | ||
155 | { | 150 | { | ||
156 | "byte_size": "7,32 kB", | 151 | "byte_size": "7,32 kB", | ||
157 | "cache_last_updated": null, | 152 | "cache_last_updated": null, | ||
158 | "cache_url": null, | 153 | "cache_url": null, | ||
159 | "created": "2024-05-30T15:58:24.249419", | 154 | "created": "2024-05-30T15:58:24.249419", | ||
160 | "datastore_active": false, | 155 | "datastore_active": false, | ||
161 | "description": null, | 156 | "description": null, | ||
162 | "format": "txt", | 157 | "format": "txt", | ||
163 | "hash": "", | 158 | "hash": "", | ||
164 | "id": "30dfbb45-e41a-4c6e-bcdc-a4af2f040715", | 159 | "id": "30dfbb45-e41a-4c6e-bcdc-a4af2f040715", | ||
165 | "last_modified": null, | 160 | "last_modified": null, | ||
166 | "metadata_modified": "2024-05-30T15:58:24.421759", | 161 | "metadata_modified": "2024-05-30T15:58:24.421759", | ||
167 | "mimetype": "text/plain", | 162 | "mimetype": "text/plain", | ||
168 | "mimetype_inner": null, | 163 | "mimetype_inner": null, | ||
169 | "name": "README_CLARAMED_sentences.txt\t", | 164 | "name": "README_CLARAMED_sentences.txt\t", | ||
170 | "name_translated": { | 165 | "name_translated": { | ||
171 | "en": "README_CLARAMED_sentences.txt\t", | 166 | "en": "README_CLARAMED_sentences.txt\t", | ||
172 | "es": "README_CLARAMED_sentences.txt\t" | 167 | "es": "README_CLARAMED_sentences.txt\t" | ||
173 | }, | 168 | }, | ||
174 | "package_id": "73cc4b2b-f43c-4efd-9d6d-113bc923cd77", | 169 | "package_id": "73cc4b2b-f43c-4efd-9d6d-113bc923cd77", | ||
175 | "position": 2, | 170 | "position": 2, | ||
176 | "resource_identifier": "", | 171 | "resource_identifier": "", | ||
177 | "resource_relation": [], | 172 | "resource_relation": [], | ||
178 | "resource_relation-1": "", | 173 | "resource_relation-1": "", | ||
179 | "resource_type": null, | 174 | "resource_type": null, | ||
180 | "size": null, | 175 | "size": null, | ||
181 | "state": "active", | 176 | "state": "active", | ||
182 | "url": | 177 | "url": | ||
183 | gital.csic.es/bitstream/10261/346579/6/README_CLARAMED_sentences.txt", | 178 | gital.csic.es/bitstream/10261/346579/6/README_CLARAMED_sentences.txt", | ||
184 | "url_type": null | 179 | "url_type": null | ||
185 | } | 180 | } | ||
186 | ], | 181 | ], | ||
187 | "spatial": [], | 182 | "spatial": [], | ||
188 | "state": "active", | 183 | "state": "active", | ||
189 | "tags": [], | 184 | "tags": [], | ||
190 | "theme": [ | 185 | "theme": [ | ||
191 | 186 | ||||
192 | "http://datos.gob.es/kos/sector-publico/sector/ciencia-tecnologia", | 187 | "http://datos.gob.es/kos/sector-publico/sector/ciencia-tecnologia", | ||
193 | "http://datos.gob.es/kos/sector-publico/sector/cultura-ocio", | 188 | "http://datos.gob.es/kos/sector-publico/sector/cultura-ocio", | ||
194 | "http://datos.gob.es/kos/sector-publico/sector/educacion", | 189 | "http://datos.gob.es/kos/sector-publico/sector/educacion", | ||
195 | "http://datos.gob.es/kos/sector-publico/sector/salud", | 190 | "http://datos.gob.es/kos/sector-publico/sector/salud", | ||
196 | "http://datos.gob.es/kos/sector-publico/sector/sector-publico" | 191 | "http://datos.gob.es/kos/sector-publico/sector/sector-publico" | ||
197 | ], | 192 | ], | ||
198 | "title": "CLARA-MeD simplified sentences", | 193 | "title": "CLARA-MeD simplified sentences", | ||
199 | "title_translated": { | 194 | "title_translated": { | ||
200 | "en": "CLARA-MeD simplified sentences", | 195 | "en": "CLARA-MeD simplified sentences", | ||
201 | "es": "CLARA-MeD simplified sentences" | 196 | "es": "CLARA-MeD simplified sentences" | ||
202 | }, | 197 | }, | ||
203 | "type": "dataset", | 198 | "type": "dataset", | ||
204 | "url": null, | 199 | "url": null, | ||
205 | "version": null | 200 | "version": null | ||
206 | } | 201 | } |