Changes
On March 4, 2025 at 12:51:05 PM UTC,
-
Changed the license of CLARA-MeD simplified sentences to https://creativecommons.org/licenses/by-nc-sa/4.0/ (previously https://digital.csic.es/handle/10261/346579?mode=full)
-
Changed value of field autor to {'en': ['Leonardo Campillos-Llanos'], 'es': ['Leonardo Campillos-Llanos']} in CLARA-MeD simplified sentences
-
Changed value of field proyecto to {'es': ['PID2020-116001RA-C33']} in CLARA-MeD simplified sentences
| f | 1 | { | f | 1 | { |
| 2 | "Observaciones": { | 2 | "Observaciones": { | ||
| 3 | "en": "", | 3 | "en": "", | ||
| 4 | "es": "" | 4 | "es": "" | ||
| 5 | }, | 5 | }, | ||
| 6 | "author": null, | 6 | "author": null, | ||
| 7 | "author_email": null, | 7 | "author_email": null, | ||
| n | 8 | "autor": {}, | n | 8 | "autor": { |
| 9 | "en": [ | ||||
| 10 | "Leonardo Campillos-Llanos" | ||||
| 11 | ], | ||||
| 12 | "es": [ | ||||
| 13 | "Leonardo Campillos-Llanos" | ||||
| 14 | ] | ||||
| 15 | }, | ||||
| 9 | "conforms_to": [], | 16 | "conforms_to": [], | ||
| 10 | "coverage_new": {}, | 17 | "coverage_new": {}, | ||
| 11 | "creator_user_id": "196556b3-e0c4-4c51-a9e6-f51cc752bc37", | 18 | "creator_user_id": "196556b3-e0c4-4c51-a9e6-f51cc752bc37", | ||
| 12 | "description": { | 19 | "description": { | ||
| 13 | "en": "This dataset contains 1200 manually simplified sentences | 20 | "en": "This dataset contains 1200 manually simplified sentences | ||
| 14 | (144 019 tokens) from clinical trials in Spanish. A total of 1040 | 21 | (144 019 tokens) from clinical trials in Spanish. A total of 1040 | ||
| 15 | announcements from the European Clinical Trials Register (EudraCT) | 22 | announcements from the European Clinical Trials Register (EudraCT) | ||
| 16 | were analyzed to select sentences with ambiguities or exceeding 25 | 23 | were analyzed to select sentences with ambiguities or exceeding 25 | ||
| 17 | words. Simplification criteria were devised in an annotation | 24 | words. Simplification criteria were devised in an annotation | ||
| 18 | guideline, which is released publicly along the dataset.\r\n\r\nThis | 25 | guideline, which is released publicly along the dataset.\r\n\r\nThis | ||
| 19 | resource was collected in the CLARA-MeD project, with the goal of | 26 | resource was collected in the CLARA-MeD project, with the goal of | ||
| 20 | simplifying medical texts in the Spanish language and reduce the | 27 | simplifying medical texts in the Spanish language and reduce the | ||
| 21 | language barrier to patient's informed decision making. In particular, | 28 | language barrier to patient's informed decision making. In particular, | ||
| 22 | the project aims at developing linguistic resources for automatic | 29 | the project aims at developing linguistic resources for automatic | ||
| 23 | medical term simplification in Spanish; and conducting experiments in | 30 | medical term simplification in Spanish; and conducting experiments in | ||
| 24 | automatic text simplification.", | 31 | automatic text simplification.", | ||
| 25 | "es": "This dataset contains 1200 manually simplified sentences | 32 | "es": "This dataset contains 1200 manually simplified sentences | ||
| 26 | (144 019 tokens) from clinical trials in Spanish. A total of 1040 | 33 | (144 019 tokens) from clinical trials in Spanish. A total of 1040 | ||
| 27 | announcements from the European Clinical Trials Register (EudraCT) | 34 | announcements from the European Clinical Trials Register (EudraCT) | ||
| 28 | were analyzed to select sentences with ambiguities or exceeding 25 | 35 | were analyzed to select sentences with ambiguities or exceeding 25 | ||
| 29 | words. Simplification criteria were devised in an annotation | 36 | words. Simplification criteria were devised in an annotation | ||
| 30 | guideline, which is released publicly along the dataset.\r\n\r\nThis | 37 | guideline, which is released publicly along the dataset.\r\n\r\nThis | ||
| 31 | resource was collected in the CLARA-MeD project, with the goal of | 38 | resource was collected in the CLARA-MeD project, with the goal of | ||
| 32 | simplifying medical texts in the Spanish language and reduce the | 39 | simplifying medical texts in the Spanish language and reduce the | ||
| 33 | language barrier to patient's informed decision making. In particular, | 40 | language barrier to patient's informed decision making. In particular, | ||
| 34 | the project aims at developing linguistic resources for automatic | 41 | the project aims at developing linguistic resources for automatic | ||
| 35 | medical term simplification in Spanish; and conducting experiments in | 42 | medical term simplification in Spanish; and conducting experiments in | ||
| 36 | automatic text simplification." | 43 | automatic text simplification." | ||
| 37 | }, | 44 | }, | ||
| 38 | "groups": [ | 45 | "groups": [ | ||
| 39 | { | 46 | { | ||
| 40 | "description": "", | 47 | "description": "", | ||
| 41 | "display_name": "Terminolog\u00eda", | 48 | "display_name": "Terminolog\u00eda", | ||
| 42 | "id": "f21d51d4-df60-44f9-ad1f-60f1d5ca24d2", | 49 | "id": "f21d51d4-df60-44f9-ad1f-60f1d5ca24d2", | ||
| 43 | "image_display_url": | 50 | "image_display_url": | ||
| 44 | .cchs.csic.es/uploads/group/2024-09-27-062713.009717Terminologia.png", | 51 | .cchs.csic.es/uploads/group/2024-09-27-062713.009717Terminologia.png", | ||
| 45 | "name": "terminologia", | 52 | "name": "terminologia", | ||
| 46 | "title": "Terminolog\u00eda" | 53 | "title": "Terminolog\u00eda" | ||
| 47 | } | 54 | } | ||
| 48 | ], | 55 | ], | ||
| 49 | "id": "73cc4b2b-f43c-4efd-9d6d-113bc923cd77", | 56 | "id": "73cc4b2b-f43c-4efd-9d6d-113bc923cd77", | ||
| 50 | "identifier": "https://doi.org/10.20350/digitalCSIC/16110", | 57 | "identifier": "https://doi.org/10.20350/digitalCSIC/16110", | ||
| 51 | "international_spatial_translated": { | 58 | "international_spatial_translated": { | ||
| 52 | "en": "", | 59 | "en": "", | ||
| 53 | "es": "" | 60 | "es": "" | ||
| 54 | }, | 61 | }, | ||
| 55 | "isopen": false, | 62 | "isopen": false, | ||
| 56 | "issued_date": "2024-02-09T00:00:00", | 63 | "issued_date": "2024-02-09T00:00:00", | ||
| 57 | "language": [ | 64 | "language": [ | ||
| 58 | "es", | 65 | "es", | ||
| 59 | "en" | 66 | "en" | ||
| 60 | ], | 67 | ], | ||
| n | 61 | "license_id": | n | 68 | "license_id": "https://creativecommons.org/licenses/by-nc-sa/4.0/", |
| 62 | "https://digital.csic.es/handle/10261/346579?mode=full", | ||||
| 63 | "license_title": | 69 | "license_title": | ||
| n | 64 | "https://digital.csic.es/handle/10261/346579?mode=full", | n | 70 | "https://creativecommons.org/licenses/by-nc-sa/4.0/", |
| 65 | "maintainer": null, | 71 | "maintainer": null, | ||
| 66 | "maintainer_email": null, | 72 | "maintainer_email": null, | ||
| 67 | "metadata_created": "2024-05-30T15:57:14.431217", | 73 | "metadata_created": "2024-05-30T15:57:14.431217", | ||
| n | 68 | "metadata_modified": "2025-03-03T16:20:42.026335", | n | 74 | "metadata_modified": "2025-03-04T12:51:05.028495", |
| 69 | "multilingual_tags": { | 75 | "multilingual_tags": { | ||
| 70 | "en": [ | 76 | "en": [ | ||
| 71 | "Biomedical natural language processing", | 77 | "Biomedical natural language processing", | ||
| 72 | "Parallel sentences", | 78 | "Parallel sentences", | ||
| 73 | "Medical text simplification" | 79 | "Medical text simplification" | ||
| 74 | ] | 80 | ] | ||
| 75 | }, | 81 | }, | ||
| 76 | "name": "clara-med-simplified-sentences", | 82 | "name": "clara-med-simplified-sentences", | ||
| 77 | "notes": null, | 83 | "notes": null, | ||
| 78 | "num_resources": 3, | 84 | "num_resources": 3, | ||
| 79 | "num_tags": 0, | 85 | "num_tags": 0, | ||
| 80 | "organization": { | 86 | "organization": { | ||
| 81 | "approval_status": "approved", | 87 | "approval_status": "approved", | ||
| 82 | "created": "2023-09-25T12:13:42.172869", | 88 | "created": "2023-09-25T12:13:42.172869", | ||
| 83 | "description": "El Instituto de Lengua, Literatura y | 89 | "description": "El Instituto de Lengua, Literatura y | ||
| 84 | Antropolog\u00eda, ILLA (CSIC) tiene como objetivo primordial la | 90 | Antropolog\u00eda, ILLA (CSIC) tiene como objetivo primordial la | ||
| 85 | investigaci\u00f3n del patrimonio cultural hisp\u00e1nico en su triple | 91 | investigaci\u00f3n del patrimonio cultural hisp\u00e1nico en su triple | ||
| 86 | dimensi\u00f3n antropol\u00f3gica, ling\u00fc\u00edstica y | 92 | dimensi\u00f3n antropol\u00f3gica, ling\u00fc\u00edstica y | ||
| 87 | literaria.", | 93 | literaria.", | ||
| 88 | "id": "fc47e531-a165-4eac-8fc7-34342a3a38ff", | 94 | "id": "fc47e531-a165-4eac-8fc7-34342a3a38ff", | ||
| 89 | "image_url": "2023-09-25-101342.167134illa0.png", | 95 | "image_url": "2023-09-25-101342.167134illa0.png", | ||
| 90 | "is_organization": true, | 96 | "is_organization": true, | ||
| 91 | "name": "instituto-de-lengua-literatura-y-antropologia-illa-csic", | 97 | "name": "instituto-de-lengua-literatura-y-antropologia-illa-csic", | ||
| 92 | "state": "active", | 98 | "state": "active", | ||
| 93 | "title": "Instituto de Lengua, Literatura y Antropolog\u00eda | 99 | "title": "Instituto de Lengua, Literatura y Antropolog\u00eda | ||
| 94 | (ILLA), CSIC", | 100 | (ILLA), CSIC", | ||
| 95 | "type": "organization" | 101 | "type": "organization" | ||
| 96 | }, | 102 | }, | ||
| 97 | "owner_org": "fc47e531-a165-4eac-8fc7-34342a3a38ff", | 103 | "owner_org": "fc47e531-a165-4eac-8fc7-34342a3a38ff", | ||
| 98 | "private": false, | 104 | "private": false, | ||
| t | 99 | "proyecto": {}, | t | 105 | "proyecto": { |
| 106 | "es": [ | ||||
| 107 | "PID2020-116001RA-C33" | ||||
| 108 | ] | ||||
| 109 | }, | ||||
| 100 | "publisher": "b627d71d-2315-4e75-afc9-897da84459f0", | 110 | "publisher": "b627d71d-2315-4e75-afc9-897da84459f0", | ||
| 101 | "reference": [], | 111 | "reference": [], | ||
| 102 | "relationships_as_object": [], | 112 | "relationships_as_object": [], | ||
| 103 | "relationships_as_subject": [], | 113 | "relationships_as_subject": [], | ||
| 104 | "resources": [ | 114 | "resources": [ | ||
| 105 | { | 115 | { | ||
| 106 | "byte_size": "7,32 kB", | 116 | "byte_size": "7,32 kB", | ||
| 107 | "cache_last_updated": null, | 117 | "cache_last_updated": null, | ||
| 108 | "cache_url": null, | 118 | "cache_url": null, | ||
| 109 | "created": "2024-05-30T15:58:24.249419", | 119 | "created": "2024-05-30T15:58:24.249419", | ||
| 110 | "datastore_active": false, | 120 | "datastore_active": false, | ||
| 111 | "description": null, | 121 | "description": null, | ||
| 112 | "format": "txt", | 122 | "format": "txt", | ||
| 113 | "hash": "", | 123 | "hash": "", | ||
| 114 | "id": "30dfbb45-e41a-4c6e-bcdc-a4af2f040715", | 124 | "id": "30dfbb45-e41a-4c6e-bcdc-a4af2f040715", | ||
| 115 | "last_modified": null, | 125 | "last_modified": null, | ||
| 116 | "metadata_modified": "2024-05-30T15:58:24.421759", | 126 | "metadata_modified": "2024-05-30T15:58:24.421759", | ||
| 117 | "mimetype": "text/plain", | 127 | "mimetype": "text/plain", | ||
| 118 | "mimetype_inner": null, | 128 | "mimetype_inner": null, | ||
| 119 | "name": "README_CLARAMED_sentences.txt\t", | 129 | "name": "README_CLARAMED_sentences.txt\t", | ||
| 120 | "name_translated": { | 130 | "name_translated": { | ||
| 121 | "en": "README_CLARAMED_sentences.txt\t", | 131 | "en": "README_CLARAMED_sentences.txt\t", | ||
| 122 | "es": "README_CLARAMED_sentences.txt\t" | 132 | "es": "README_CLARAMED_sentences.txt\t" | ||
| 123 | }, | 133 | }, | ||
| 124 | "package_id": "73cc4b2b-f43c-4efd-9d6d-113bc923cd77", | 134 | "package_id": "73cc4b2b-f43c-4efd-9d6d-113bc923cd77", | ||
| 125 | "position": 0, | 135 | "position": 0, | ||
| 126 | "resource_identifier": "", | 136 | "resource_identifier": "", | ||
| 127 | "resource_relation": [], | 137 | "resource_relation": [], | ||
| 128 | "resource_relation-1": "", | 138 | "resource_relation-1": "", | ||
| 129 | "resource_type": null, | 139 | "resource_type": null, | ||
| 130 | "size": null, | 140 | "size": null, | ||
| 131 | "state": "active", | 141 | "state": "active", | ||
| 132 | "url": | 142 | "url": | ||
| 133 | gital.csic.es/bitstream/10261/346579/6/README_CLARAMED_sentences.txt", | 143 | gital.csic.es/bitstream/10261/346579/6/README_CLARAMED_sentences.txt", | ||
| 134 | "url_type": null | 144 | "url_type": null | ||
| 135 | }, | 145 | }, | ||
| 136 | { | 146 | { | ||
| 137 | "byte_size": "981,11 kB", | 147 | "byte_size": "981,11 kB", | ||
| 138 | "cache_last_updated": null, | 148 | "cache_last_updated": null, | ||
| 139 | "cache_url": null, | 149 | "cache_url": null, | ||
| 140 | "created": "2024-05-30T15:57:45.357301", | 150 | "created": "2024-05-30T15:57:45.357301", | ||
| 141 | "datastore_active": false, | 151 | "datastore_active": false, | ||
| 142 | "description": null, | 152 | "description": null, | ||
| 143 | "format": "tsv", | 153 | "format": "tsv", | ||
| 144 | "hash": "", | 154 | "hash": "", | ||
| 145 | "id": "a05fd101-9c06-4312-bb30-13f6ea008d46", | 155 | "id": "a05fd101-9c06-4312-bb30-13f6ea008d46", | ||
| 146 | "last_modified": null, | 156 | "last_modified": null, | ||
| 147 | "metadata_modified": "2024-05-30T15:58:24.247167", | 157 | "metadata_modified": "2024-05-30T15:58:24.247167", | ||
| 148 | "mimetype": "text/tab-separated-values", | 158 | "mimetype": "text/tab-separated-values", | ||
| 149 | "mimetype_inner": null, | 159 | "mimetype_inner": null, | ||
| 150 | "name": "Dataset | 160 | "name": "Dataset | ||
| 151 | ital.csic.es/bitstream/10261/346579/1/claramed_synt_simp_aligned.tsv", | 161 | ital.csic.es/bitstream/10261/346579/1/claramed_synt_simp_aligned.tsv", | ||
| 152 | "name_translated": { | 162 | "name_translated": { | ||
| 153 | "en": "Dataset | 163 | "en": "Dataset | ||
| 154 | ital.csic.es/bitstream/10261/346579/1/claramed_synt_simp_aligned.tsv", | 164 | ital.csic.es/bitstream/10261/346579/1/claramed_synt_simp_aligned.tsv", | ||
| 155 | "es": "Dataset | 165 | "es": "Dataset | ||
| 156 | gital.csic.es/bitstream/10261/346579/1/claramed_synt_simp_aligned.tsv" | 166 | gital.csic.es/bitstream/10261/346579/1/claramed_synt_simp_aligned.tsv" | ||
| 157 | }, | 167 | }, | ||
| 158 | "package_id": "73cc4b2b-f43c-4efd-9d6d-113bc923cd77", | 168 | "package_id": "73cc4b2b-f43c-4efd-9d6d-113bc923cd77", | ||
| 159 | "position": 1, | 169 | "position": 1, | ||
| 160 | "resource_identifier": "", | 170 | "resource_identifier": "", | ||
| 161 | "resource_relation": [], | 171 | "resource_relation": [], | ||
| 162 | "resource_relation-1": "", | 172 | "resource_relation-1": "", | ||
| 163 | "resource_type": null, | 173 | "resource_type": null, | ||
| 164 | "size": null, | 174 | "size": null, | ||
| 165 | "state": "active", | 175 | "state": "active", | ||
| 166 | "url": | 176 | "url": | ||
| 167 | ital.csic.es/bitstream/10261/346579/1/claramed_synt_simp_aligned.tsv", | 177 | ital.csic.es/bitstream/10261/346579/1/claramed_synt_simp_aligned.tsv", | ||
| 168 | "url_type": null | 178 | "url_type": null | ||
| 169 | }, | 179 | }, | ||
| 170 | { | 180 | { | ||
| 171 | "byte_size": "757,92 kB", | 181 | "byte_size": "757,92 kB", | ||
| 172 | "cache_last_updated": null, | 182 | "cache_last_updated": null, | ||
| 173 | "cache_url": null, | 183 | "cache_url": null, | ||
| 174 | "created": "2024-05-30T15:59:20.596413", | 184 | "created": "2024-05-30T15:59:20.596413", | ||
| 175 | "datastore_active": false, | 185 | "datastore_active": false, | ||
| 176 | "description": null, | 186 | "description": null, | ||
| 177 | "format": "pdf", | 187 | "format": "pdf", | ||
| 178 | "hash": "", | 188 | "hash": "", | ||
| 179 | "id": "a1f5a665-35a0-4513-8123-8e3feed8c66b", | 189 | "id": "a1f5a665-35a0-4513-8123-8e3feed8c66b", | ||
| 180 | "last_modified": null, | 190 | "last_modified": null, | ||
| 181 | "metadata_modified": "2024-05-30T15:59:40.961858", | 191 | "metadata_modified": "2024-05-30T15:59:40.961858", | ||
| 182 | "mimetype": "application/pdf", | 192 | "mimetype": "application/pdf", | ||
| 183 | "mimetype_inner": null, | 193 | "mimetype_inner": null, | ||
| 184 | "name": "Guideline CLARA-MeD_simplif_guideline.pdf", | 194 | "name": "Guideline CLARA-MeD_simplif_guideline.pdf", | ||
| 185 | "name_translated": { | 195 | "name_translated": { | ||
| 186 | "en": "Guideline CLARA-MeD_simplif_guideline.pdf", | 196 | "en": "Guideline CLARA-MeD_simplif_guideline.pdf", | ||
| 187 | "es": "Guideline CLARA-MeD_simplif_guideline.pdf" | 197 | "es": "Guideline CLARA-MeD_simplif_guideline.pdf" | ||
| 188 | }, | 198 | }, | ||
| 189 | "package_id": "73cc4b2b-f43c-4efd-9d6d-113bc923cd77", | 199 | "package_id": "73cc4b2b-f43c-4efd-9d6d-113bc923cd77", | ||
| 190 | "position": 2, | 200 | "position": 2, | ||
| 191 | "resource_identifier": "", | 201 | "resource_identifier": "", | ||
| 192 | "resource_relation": [], | 202 | "resource_relation": [], | ||
| 193 | "resource_relation-1": "", | 203 | "resource_relation-1": "", | ||
| 194 | "resource_type": null, | 204 | "resource_type": null, | ||
| 195 | "size": null, | 205 | "size": null, | ||
| 196 | "state": "active", | 206 | "state": "active", | ||
| 197 | "url": | 207 | "url": | ||
| 198 | tal.csic.es/bitstream/10261/346579/2/CLARA-MeD_simplif_guideline.pdf", | 208 | tal.csic.es/bitstream/10261/346579/2/CLARA-MeD_simplif_guideline.pdf", | ||
| 199 | "url_type": null | 209 | "url_type": null | ||
| 200 | } | 210 | } | ||
| 201 | ], | 211 | ], | ||
| 202 | "spatial": [], | 212 | "spatial": [], | ||
| 203 | "state": "active", | 213 | "state": "active", | ||
| 204 | "tags": [], | 214 | "tags": [], | ||
| 205 | "theme": [ | 215 | "theme": [ | ||
| 206 | 216 | ||||
| 207 | "http://datos.gob.es/kos/sector-publico/sector/ciencia-tecnologia", | 217 | "http://datos.gob.es/kos/sector-publico/sector/ciencia-tecnologia", | ||
| 208 | "http://datos.gob.es/kos/sector-publico/sector/salud", | 218 | "http://datos.gob.es/kos/sector-publico/sector/salud", | ||
| 209 | "http://datos.gob.es/kos/sector-publico/sector/sector-publico" | 219 | "http://datos.gob.es/kos/sector-publico/sector/sector-publico" | ||
| 210 | ], | 220 | ], | ||
| 211 | "title": "CLARA-MeD simplified sentences", | 221 | "title": "CLARA-MeD simplified sentences", | ||
| 212 | "title_translated": { | 222 | "title_translated": { | ||
| 213 | "en": "CLARA-MeD simplified sentences", | 223 | "en": "CLARA-MeD simplified sentences", | ||
| 214 | "es": "CLARA-MeD simplified sentences" | 224 | "es": "CLARA-MeD simplified sentences" | ||
| 215 | }, | 225 | }, | ||
| 216 | "type": "dataset", | 226 | "type": "dataset", | ||
| 217 | "url": null, | 227 | "url": null, | ||
| 218 | "version": null | 228 | "version": null | ||
| 219 | } | 229 | } |
