ctrlnum 0.17632-fwc7jrc5jr.1
fullrecord <?xml version="1.0"?> <dc><creator>Moreno, Isabel</creator><title>DrugSemantics Gold Standard</title><publisher>Mendeley</publisher><description>DrugSemantics gold standard consists of 5 Summaries of Product Characteristics (SPC) written in Spanish. SPCs were retrieved from Medicines Online Information Center - CIMA - that belongs to the Spanish Agency for Medicines and Health Products - AEMPS. This corpus is annotated with 10 Named Entities (NE) related to pharmacotherapeutic care, namely: Chemical Composition, Disease, Drug, Excipient, Food, Medicament, Pharmaceutical Form, Route, Therapeutic Action and Unit of Measurement. It contains 2241 NEs, 780 sentences and 226,729 tokens. The zip file is organized as follows: Each SPC is in a separate folder containing one xml file that contains the annotated documents in Gate Standoff format. DrugSemantics was designed to be used for developing and testing Spanish NE recognition tools in the pharmacotherapeutic domain. </description><subject>Drugs</subject><subject>Disease</subject><subject>Annotation</subject><subject>Natural Language Processing</subject><subject>Information Extraction</subject><subject>Chemical Compound</subject><subject>Spanish Language</subject><subject>Human Language Resources</subject><subject>Excipient</subject><subject>Medication</subject><contributor>Boldrini, Ester</contributor><contributor>Moreda, Paloma</contributor><contributor>Rom&#xE1;-Ferri, M. Teresa</contributor><type>Other:Dataset</type><identifier>10.17632/fwc7jrc5jr.1</identifier><rights>Attribution-NonCommercial 3.0 Unported</rights><rights>https://creativecommons.org/licenses/by-nc/3.0</rights><relation>https://data.mendeley.com/datasets/fwc7jrc5jr</relation><date>2017-06-16T20:31:11Z</date><recordID>0.17632-fwc7jrc5jr.1</recordID></dc>
format Other:Dataset
Other
author Moreno, Isabel
author2 Boldrini, Ester
Moreda, Paloma
Romá-Ferri, M. Teresa
title DrugSemantics Gold Standard
publisher Mendeley
publishDate 2017
topic Drugs
Disease
Annotation
Natural Language Processing
Information Extraction
Chemical Compound
Spanish Language
Human Language Resources
Excipient
Medication
url https://data.mendeley.com/datasets/fwc7jrc5jr
contents DrugSemantics gold standard consists of 5 Summaries of Product Characteristics (SPC) written in Spanish. SPCs were retrieved from Medicines Online Information Center - CIMA - that belongs to the Spanish Agency for Medicines and Health Products - AEMPS. This corpus is annotated with 10 Named Entities (NE) related to pharmacotherapeutic care, namely: Chemical Composition, Disease, Drug, Excipient, Food, Medicament, Pharmaceutical Form, Route, Therapeutic Action and Unit of Measurement. It contains 2241 NEs, 780 sentences and 226,729 tokens. The zip file is organized as follows: Each SPC is in a separate folder containing one xml file that contains the annotated documents in Gate Standoff format. DrugSemantics was designed to be used for developing and testing Spanish NE recognition tools in the pharmacotherapeutic domain.
id IOS7969.0.17632-fwc7jrc5jr.1
institution Universitas Islam Indragiri
affiliation onesearch.perpusnas.go.id
institution_id 804
institution_type library:university
library
library Teknologi Pangan UNISI
library_id 2816
collection Artikel mulono
repository_id 7969
city INDRAGIRI HILIR
province RIAU
shared_to_ipusnas_str 1
repoId IOS7969
first_indexed 2020-04-08T08:27:50Z
last_indexed 2020-04-08T08:27:50Z
recordtype dc
_version_ 1686587742307221504
score 17.538404