<?xml version="1.0" encoding="UTF-8"?>
<TEI xml:space="preserve" xmlns="http://www.tei-c.org/ns/1.0" 
xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" 
xsi:schemaLocation="http://www.tei-c.org/ns/1.0 https://raw.githubusercontent.com/kermitt2/grobid/master/grobid-home/schemas/xsd/Grobid.xsd"
 xmlns:xlink="http://www.w3.org/1999/xlink">
	<teiHeader xml:lang="en">
		<fileDesc>
			<titleStmt>
				<title level="a" type="main">Overview of the eHealth Knowledge Discovery Challenge at IberLEF 2020</title>
			</titleStmt>
			<publicationStmt>
				<publisher/>
				<availability status="unknown"><licence/></availability>
			</publicationStmt>
			<sourceDesc>
				<biblStruct>
					<analytic>
						<author>
							<persName><forename type="first">Alejandro</forename><surname>Piad-Morffis</surname></persName>
							<affiliation key="aff0">
								<orgName type="department">School of Math and Computer Science</orgName>
								<orgName type="institution">University of Havana</orgName>
								<address>
									<addrLine>La Habana</addrLine>
									<postCode>10400</postCode>
									<country key="CU">Cuba</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Yoan</forename><surname>Gutiérrez</surname></persName>
							<affiliation key="aff1">
								<orgName type="department">Department of Language and Computing Systems</orgName>
								<orgName type="institution">University of Alicante</orgName>
								<address>
									<postCode>03690</postCode>
									<settlement>Alicante</settlement>
									<country key="ES">Spain</country>
								</address>
							</affiliation>
							<affiliation key="aff2">
								<orgName type="institution" key="instit1">University Institute for Computing Research</orgName>
								<orgName type="institution" key="instit2">University of Alicante</orgName>
								<address>
									<postCode>03690</postCode>
									<settlement>Alicante</settlement>
									<country key="ES">Spain</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Hian</forename><surname>Cañizares-Diaz</surname></persName>
							<affiliation key="aff0">
								<orgName type="department">School of Math and Computer Science</orgName>
								<orgName type="institution">University of Havana</orgName>
								<address>
									<addrLine>La Habana</addrLine>
									<postCode>10400</postCode>
									<country key="CU">Cuba</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Suilan</forename><surname>Estévez-Velarde</surname></persName>
							<affiliation key="aff0">
								<orgName type="department">School of Math and Computer Science</orgName>
								<orgName type="institution">University of Havana</orgName>
								<address>
									<addrLine>La Habana</addrLine>
									<postCode>10400</postCode>
									<country key="CU">Cuba</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Rafael</forename><surname>Muñoz</surname></persName>
							<affiliation key="aff1">
								<orgName type="department">Department of Language and Computing Systems</orgName>
								<orgName type="institution">University of Alicante</orgName>
								<address>
									<postCode>03690</postCode>
									<settlement>Alicante</settlement>
									<country key="ES">Spain</country>
								</address>
							</affiliation>
							<affiliation key="aff2">
								<orgName type="institution" key="instit1">University Institute for Computing Research</orgName>
								<orgName type="institution" key="instit2">University of Alicante</orgName>
								<address>
									<postCode>03690</postCode>
									<settlement>Alicante</settlement>
									<country key="ES">Spain</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Andrés</forename><surname>Montoyo</surname></persName>
							<affiliation key="aff1">
								<orgName type="department">Department of Language and Computing Systems</orgName>
								<orgName type="institution">University of Alicante</orgName>
								<address>
									<postCode>03690</postCode>
									<settlement>Alicante</settlement>
									<country key="ES">Spain</country>
								</address>
							</affiliation>
							<affiliation key="aff2">
								<orgName type="institution" key="instit1">University Institute for Computing Research</orgName>
								<orgName type="institution" key="instit2">University of Alicante</orgName>
								<address>
									<postCode>03690</postCode>
									<settlement>Alicante</settlement>
									<country key="ES">Spain</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Yudivian</forename><surname>Almeida-Cruz</surname></persName>
							<affiliation key="aff0">
								<orgName type="department">School of Math and Computer Science</orgName>
								<orgName type="institution">University of Havana</orgName>
								<address>
									<addrLine>La Habana</addrLine>
									<postCode>10400</postCode>
									<country key="CU">Cuba</country>
								</address>
							</affiliation>
						</author>
						<title level="a" type="main">Overview of the eHealth Knowledge Discovery Challenge at IberLEF 2020</title>
					</analytic>
					<monogr>
						<idno type="ISSN">1613-0073</idno>
					</monogr>
					<idno type="MD5">325C3EB21B14A37CCE19C1520E86DD04</idno>
				</biblStruct>
			</sourceDesc>
		</fileDesc>
		<encodingDesc>
			<appInfo>
				<application version="0.7.2" ident="GROBID" when="2023-03-24T04:20+0000">
					<desc>GROBID - A machine learning software for extracting information from scholarly documents</desc>
					<ref target="https://github.com/kermitt2/grobid"/>
				</application>
			</appInfo>
		</encodingDesc>
		<profileDesc>
			<textClass>
				<keywords>
					<term>eHealth</term>
					<term>Knowledge Discovery</term>
					<term>Natural Language Processing</term>
					<term>Machine Learning</term>
				</keywords>
			</textClass>
			<abstract>
<div xmlns="http://www.tei-c.org/ns/1.0"><p>This paper summarises the results of the third edition of the eHealth Knowledge Discovery (KD) challenge, hosted at the Iberian Language Evaluation Forum 2020. The eHealth-KD challenge proposes two computational tasks involving the identification of semantic entities and relations in natural language text, focusing on Spanish language health documents. In this edition, besides text extracted from medical sources, Wikipedia content was introduced into the corpus, and a novel transfer-learning evaluation scenario was designed that challenges participants to create systems that provide cross-domain generalisation. A total of eight teams participated with a variety of approaches including deep learning end-to-end systems as well as rule-based and knowledge-driven techniques. This paper analyses the most successful approaches and highlights the most interesting challenges for future research in this field.</p></div>
			</abstract>
		</profileDesc>
	</teiHeader>
	<text xml:lang="en">
		<body>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="1.">Introduction</head><p>The vast amount of clinical text available online has motivated the development of automatic knowledge discovery systems that can analyse this data and discover relevant facts. These discoveries can be the base for novel treatments, understanding disease and drug interactions. Computational systems designed for this task are often trained on manually annotated corpora. To foster research in this area, the community has organised competitive challenges to identify, classify, extract, and link knowledge, such as in SEMEVAL <ref type="foot" target="#foot_0">1</ref> and CLEF campaigns <ref type="foot" target="#foot_1">2</ref> .</p><p>Proceedings of the Iberian Languages Evaluation Forum (IberLEF 2020) email: apiad@matcom.uh.cu (A. Piad-Morffis); ygutierrez@dlsi.ua.es (Y. Gutiérrez); hian.canizares@matcom.uh.cu (H. Cañizares-Diaz); sestevez@matcom.uh.cu (S. Estévez-Velarde); rafael@dlsi.ua.es (R. Muñoz); montoyo@dlsi.ua.es (A. Montoyo); yudy@matcom.uh.cu (Y. Almeida-Cruz) orcid: 0000-0001-9522-3239 (A. Piad-Morffis); 0000-0002-4052-7427 (Y. Gutiérrez); 0000-0002-5334-7468 (H. Cañizares-Diaz); 0000-0001-6707-1442 (S. Estévez-Velarde); 0000-0001-8127-9012 (R. Muñoz); 0000-0002-3076-0890 (A. Montoyo); 0000-0002-2345-1387 (Y. Almeida-Cruz)</p><p>The eHealth Knowledge Discovery (eHealth-KD) challenge, in its third edition, leverages a semantic model of human language that encodes the most common expressions of factual knowledge, via a set of four general-purpose entity types and thirteen semantic relations among them. The challenge proposes the design of systems that can automatically annotate entities and relations in clinical text in the Spanish language. 
In this new edition, an alternative evaluation scenario (not related to the health domain) is also considered, which challenges participants to design systems that can successfully transfer their internal semantic representations from the health domain to an arbitrary new domain with considerably reduced training data. The challenge has been hosted at the Iberian Languages Evaluation Forum 2020, and included the participation of eight teams of researchers from different institutions.</p><p>This paper presents the design of the challenge as well as the data and tools provided to participants, and analyses the results obtained by each team. The remainder of the paper is organised as follows: Section 2 provides a detailed description of the tasks defined in the eHealth-KD challenge and the data provided for training and evaluation of knowledge discovery system, as well as all relevant evaluation metrics. Section 3 briefly describes all the solutions that were submitted to the challenge and introduces a set of characteristics that allow a qualitative comparison among them. Section 4 presents the main results of the challenge, divided into four evaluation scenarios, and analyses the most successful and promising approaches deployed by each team. Finally, Section 5 presents the conclusions of the research and recommendations for future editions.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="2.">Challenge description</head><p>The eHealth-KD challenge involves the identification of semantic entities and relations in natural language text. Although the focus has been on the health domain in past editions, the nature of the entities and relations extracted are general and can be applied to any domain. Figure <ref type="figure">1</ref> shows an example of three sentences with the relevant entities and relations annotated. An in-depth explanation of the annotation model is provided in Piad-Morffis et al. <ref type="bibr" target="#b0">[1]</ref>.</p><p>The evaluation of the challenge consists of submitting a set of natural language sentences with annotations automatically produced by a knowledge discovery system. Participants are provided with a set of manually annotated sentences (training and development corpus) that can be used for training and/or fine-tuning system as well as raw sentences that are used for evaluation (test corpus). The training and development corpus was provided two months in advance, but the test corpus was released only two weeks prior to the evaluation date, to discourage any fine-tuning on the test data. Although the actual source code of the system is not required, participants are encouraged to upload their code to open source code sharing services like Github.</p><p>To simplify the evaluation and provide more fine-grained comparisons the task is divided into two subtasks: one concerned with the identification and classification of entities, and the other concerned with the extraction of the semantic relations between these entities. </p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="2.1.">Subtask A: Entity Recognition</head><p>Given a list of eHealth documents written in Spanish, the goal of this subtask is to identify all the entities per document and their types. These entities are all the relevant terms (single word or multiple words) that represent semantically important elements in a sentence. The following figure shows the relevant entities that appear in a set of example sentences. Some entities ("vías respiratorias" and "60 años") span more than one word. Entities will always consist of one or more complete words (i.e., not a prefix or a suffix of a word), and will never include any surrounding punctuation symbols, parentheses, etc. There are four types for entities:</p><p>Concept: identifies a relevant term, concept, idea, in the knowledge domain of the sentence.</p><p>Action: identifies a process or modification of other entities. It can be indicated by a verb or verbal construction, such as "afecta" (affects), but also by nouns, such as "exposición" (exposition), where it denotes the act of being exposed to the Sun, and "daños" (damages), where it denotes the act of damaging the skin. It can also be used to indicate non-verbal functional relations, such as "padre" (parent), etc.</p><p>Predicate: identifies a function or filter of another set of elements, which has a semantic label in the text, such as "mayores" (older), and is applied to an entity, such as "personas" (people) with some additional arguments such as "60 años" (60 years).</p><p>Reference: identifies a textual element that refers to an entity -of the same sentence or of a different one-, which can be indicated by textual clues such as "esta", "aquel", etc.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="2.2.">Subtask B: Relation Extraction</head><p>Subtask B continues from the output of Subtask A, by linking the entities detected and labelled in the input document. The purpose of this subtask is to recognise all relevant semantic relationships between the entities recognised. Eight of the thirteen semantic relations defined for this challenge can be identified in Figure <ref type="figure">1</ref>. The semantic relations are divided into the following categories:</p><p>General relations (6): general-purpose relations between two concepts (it involves Concept, Action, Predicate, and Reference) that have a specific semantic. When any of these relations apply, it is preferred over a domain relation -tagging a key phrase as a link between two information units-, since their semantic is independent of any textual label:</p><p>is-a: indicates that one entity is a sub-type, instance, or member of the class identified by the other.</p><p>same-as: indicates that two entities are semantically the same.</p><p>has-property: indicates that one entity has a given property or characteristic.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>part-of:</head><p>indicates that an entity is a constituent part of another.</p><p>causes: indicates that one entity provokes the existence or occurrence of another.</p><p>entails: indicates that the existence of one entity implies the existence or occurrence of another.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>Contextual relations (3):</head><p>enable an entity to be refined (it involves Concept, Action, Predicate, and Reference) by attaching modifiers. These are:</p><p>in-time: to indicate that something exists, occurs or is confined to a time-frame, such as in "exposición" in-time "verano".</p><p>in-place: to indicate that something exists, occurs or is confined to a place or location.</p><p>in-context: to indicate a general context in which something happens, like a mode, manner, or state, such as "exposición" in-context "prolongada".</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>Action roles (2): indicate what role the entities play related to an Action:</head><p>subject: indicates who performs the action, such as in "[el] asma afecta […]".</p><p>target: indicates who receives the effect of the action, such as in "[…] afecta [las] vías respiratorias". Actions can have several subjects and targets, in which case the semantic interpreted is that the union of the subjects performs the action over each of the targets.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>Predicate roles (2): indicate what role the entities play related to a Predicate:</head><p>domain: indicates the main entity on which the predicate applies.</p><p>arg: indicates an additional entity that specifies a value for the predicate to make sense. The exact semantic of this argument depends on the semantic of the predicate label, such as in "mayores [de] 60 años", where the predicate label "mayores" indicates that "60 años" is a quantity, that restricts the minimum age for the predicate to be true.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="2.3.">Evaluation Scenarios</head><p>The eHealth-KD 2020 Challenge proposes four evaluation scenarios to measure different characteristics of the participant systems. We propose using a micro-averaged $F_1$ that weights all individual annotations equally, both entities and relations. Scenario 1 evaluates the solution to both tasks simultaneously, while Scenario 2 and 3 evaluate each task independently. Finally, Scenario 4 challenges systems to a novel domain with significantly less training data. This allows a more fine-grained comparison among systems with respect to specific capacities.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="2.3.1.">Main Evaluation (Scenario 1)</head><p>This scenario evaluates both subtasks together as a pipeline. The input consists only of a plain text, and the expected output is a BRAT .ann file with all the corresponding entities and relations found. The measures will be precision, recall and F1 as follows:</p><formula xml:id="formula_0">$$\mathit{Rec}_{AB} = \frac{C_A + C_B + \frac{1}{2} P_A}{C_A + I_A + C_B + P_A + M_A + M_B} \qquad \mathit{Prec}_{AB} = \frac{C_A + C_B + \frac{1}{2} P_A}{C_A + I_A + C_B + P_A + S_A + S_B} \qquad F_{1AB} = 2 \cdot \frac{\mathit{Prec}_{AB} \cdot \mathit{Rec}_{AB}}{\mathit{Prec}_{AB} + \mathit{Rec}_{AB}}$$</formula><p>The exact definition of Correct(C), Missing(M), Spurious(S), Partial(P) and Incorrect(I) is presented in the following sections for each subtask.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="2.3.2.">Optional Subtask A (Scenario 2)</head><p>This scenario only evaluates Subtask A. The input is a plain text with several sentences and the output is a BRAT .ann file with only entity annotations in it (relation annotations are ignored if present).</p><p>To compute the scores we define correct, partial, missing, incorrect and spurious matches. The expected and actual output files do not need to agree on the ID for each entity, nor on their order. The evaluation matches are based on the start and end of text spans and the corresponding type. A brief description about the metrics follows:</p><p>Correct matches are reported when a text in the development file -DEV-matches exactly with a corresponding text span in the gold file for START and END values, and also the entity type. Only one correct match per entry in the gold file can be matched. Hence, duplicated entries will count as Spurious.</p><p>Incorrect matches are reported when START and END values match, but not the type.</p><p>Partial matches are reported when two intervals [START, END] have a non-empty intersection, such as the case of "vías respiratorias" and "respiratorias" in the previous example (and matching LABEL). Notice that a partial phrase will only be matched against a single correct phrase. For example, "tipo de cáncer" could be a partial match for both "tipo" and "cáncer", but it is only counted once as a partial match with the word "tipo". The word "cáncer" is counted then as Missing. 
This aims to discourage a few large text spans that cover most of the document from getting a very high score.</p><p>Missing matches are those that appear in the GOLD file but not in the DEV file.</p><p>Spurious matches are those that appear in the DEV file but not in the gold file.</p><p>From these definitions, we compute precision, recall, and a standard F1 measure as follows:</p><formula xml:id="formula_1">$$\mathit{Rec}_{A} = \frac{C_A + \frac{1}{2} P_A}{C_A + I_A + P_A + M_A} \qquad \mathit{Prec}_{A} = \frac{C_A + \frac{1}{2} P_A}{C_A + I_A + P_A + S_A} \qquad F_{1A} = 2 \cdot \frac{\mathit{Prec}_{A} \cdot \mathit{Rec}_{A}}{\mathit{Prec}_{A} + \mathit{Rec}_{A}}$$</formula></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="2.3.3.">Optional Subtask B (Scenario 3)</head><p>This scenario only evaluates Subtask B. The input is plain text and a corresponding .ann file with the correct entities annotated. The expected output is a .ann file with both entities and relations. For this to happen, the entity annotations from the provided .ann file can be copied with the relation annotations appended.</p><p>To compute the scores we define correct, missing, and spurious matches. The expected and actual output files do not need to agree on the ID for each relation (which is ignored) nor on their order. The evaluation matches are based on the start and end of text spans and the corresponding type. A brief description about the metrics follows:</p><p>Correct: relationships that matched the GOLD file exactly, including the type and the corresponding IDs for each of the participants.</p><p>Missing: relationships that are in the GOLD file but not in the DEV file, either because the type is wrong, or because one of the IDs did not match.</p><p>Spurious: relationships that are in the DEV file but not in the gold file, either because the type is wrong, or because one of the IDs did not match.</p><p>We define standard precision, recall and F1 metrics as follows:</p><formula xml:id="formula_2">$$\mathit{Rec}_{B} = \frac{C_B}{C_B + M_B} \qquad \mathit{Prec}_{B} = \frac{C_B}{C_B + S_B} \qquad F_{1B} = 2 \cdot \frac{\mathit{Prec}_{B} \cdot \mathit{Rec}_{B}}{\mathit{Prec}_{B} + \mathit{Rec}_{B}}$$</formula></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="2.3.4.">Optional Alternative Domain Evaluation (Scenario 4)</head><p>This scenario evaluates a set of 100 sentences from an alternative domain (not health related), to experiment with transfer learning techniques. A small development dataset with 100 sentences and their corresponding annotations will be provided when the general test set is released. Participants will need to train their systems in the full eHealth-KD 2020 corpus, and then apply some fine-tuning techniques in the additional 100 sentences from the alternative domain in order to successfully approach this scenario. The input and output format, and evaluation metrics are the same as for Scenario 1.</p><p>The purpose of this scenario, which we consider a complex challenge, is to stimulate the development of systems that can generalise to new knowledge domains without too many additional training examples. Hence, we encourage participants to focus not only on eHealth-specific features and techniques, but also consider more generalizable approaches.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="2.4.">Corpus Description</head><p>The corpus used in this edition of the challenge is composed of several sources reused from previous challenges, as well as new annotated content. The annotation guidelines and procedure followed were as described in Piad-Morffis et al. <ref type="bibr" target="#b1">[2]</ref>.</p><p>A total of 1000 training and development sentences are reused from the previous edition of the challenge, which is based on the same annotation model and methodology. For the test corpus, a new set of 300 sentences from Medline were manually annotated. An additional 200 sentences were selected from Wikinews, of which 100 were provided for development and 100 for testing in the evaluation Scenario 4. Finally, based on the submissions of the previous edition, an ensemble of 3,000 sentences automatically annotated was constructed by aggregating the annotations produced by previous participants. These sentences have not been manually revised, hence they are provided as an additional resource for fine-tuning but should be used with care when training a new system. The general statistics of the corpus are summarised in Table <ref type="table" target="#tab_0">1</ref>.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="3.">Systems Description</head><p>This section briefly describes the eight systems that were submitted to the challenge. In contrast with previous editions, there was a high degree of uniformity among participants, in the sense that most approaches involve the use of deep learning architectures with contextual or static embeddings. Nevertheless, there are interesting differences among the approaches which proved significant with respect to the results obtained. The participant teams and their corresponding systems are described next: Vicomtech <ref type="bibr" target="#b2">[3]</ref> presented an end-to-end deep neural network with pre-trained BERT models as the core for the semantic representation of the input texts. They experimented with two models: BERT-Base Multilingual Cased and BETO, a BERT model pre-trained on Spanish text. They model all the output variables-entities and relations-at the same time, modelling the whole problem jointly. Some of the outputs are fed back to the latter layer of the model, connecting the outcomes of the different sub-tasks in a pipeline fashion.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>TALP-UPC [4]</head><p>presented an end-to-end deep neural network, for simultaneously identifying key-phrases and their relationships, that does not rely on any domain-specific knowledge nor handcrafted features. Input documents are parsed using FreeLing and encoded using either a BERT, a Word2Vec or a FastText pre-trained word-embedding model. In order to generate all possible relations, the model should be run for every input token and have all the raw likelihoods combined across every one of them.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>UH-MAJA-KD [5]</head><p>presented a hybrid model for Subtask A that uses Stacked Bidirectional LSTM layers as contextual encoders, and linear chain Conditional Random Fields as tag decoders. The system addresses Subtask B in a pairwise query fashion, encoding information about the sentence and the given pair of entities using syntactic structures derived from the dependency parse tree, by the means of LSTM-based Recurrent Neural Networks.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>IXA-NER-RE [6]</head><p>presented a two-step model for the NER and RE sub-task, each of them independently developed from the other. The Named Entity Recognition task has been envisaged as a basic seq2seq system applying a general-purpose Language Model and static embeddings. In the RE sub-task, two approaches were explored: transfer learning methods and Matching the Blank to tackle the problem of the reduced size of the training corpus by producing relation representations directly from unlabelled text.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>UH-MatCom [7]</head><p>presented several deep-learning models trained and ensembled to automatically extract the entities and relations. Their models use a combination of state of the art techniques such as BERT, Bi-LSTM, and CRF. They also explore the use of external knowledge sources such as ConceptNet.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>SINAI [8]</head><p>presented a BiLSTM+CRF neural network where different word embeddings are combined as an input to the architecture: custom-generated medical embeddings, contextualised non-medical embeddings, and pre-trained non-medical embeddings based on transformers.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>HAPLAP [9]</head><p>presented a joint AB-LSTM neural network which combines a Bi-LSTM with max pooling and an attentive Bi-LSTM for the relation extraction task. The Joint AB-LSTM is fed with the pre-processed sentences, their entities and relations between those, and distance embeddings.</p><p>ExSim <ref type="bibr" target="#b9">[10]</ref> presented an information retrieval approach in which entities and relations in the training set are compared via word-embedding similarity to determine the most likely label.</p><p>Baseline is a basic implementation that stores all pairs of entities and labels, and all triplets of two entities and relation labels found in the training set, and simply outputs for the test set a label if it finds an exact match. The purpose of the baseline is to provide participants with a starting point that already takes care of loading the data, parsing the annotation format, and producing the right output.</p><p>By far the most common type of approach corresponds to recurrent deep learning architectures (e.g., LSTM layers) with contextual embeddings (e.g., BERT). This combination is the basis of seven out of eight participant systems. This is not surprising given the recent success of these approaches in several NLP tasks, and in fact it was suggested in the Overview of previous editions of the eHealth-KD Challenge <ref type="bibr" target="#b10">[11]</ref>  <ref type="bibr" target="#b11">[12]</ref>. Variations within this trend include the use of custom rather than pre-trained embeddings and the introduction of knowledge-based features. However, the most significant difference in approach corresponds to systems that perform an end-to-end strategy versus systems that solve each subtask separately. In the previous two editions of the challenge, the best performing system has used an end-to-end strategy. In this edition, two teams (Vicomtech and TALP) deploy different end-to-end strategies.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="3.1.">Systems characteristics</head><p>For describing each system we define a set of characteristics that group the different approaches used by the participants. These characteristics span from abstract concepts as using external knowledge to implementation details such as using transformers or other contextual embeddings. The purpose of these characteristics is to analyse what is common among the systems that perform best in each scenario and possibly identify interesting or unexplored techniques. The characteristics are described below.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>NLP:</head><p>Using classic natural language processing features and strategies, such as TF-IDF encoding, stemming, lemmatization, dependency parsing, etc.</p><p>Static embeddings: Using pre-trained word embeddings such as Word2Vec or Glove, trained on standard corpora.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>Contextual embeddings:</head><p>Using contextual embeddings such as BERT or GPT, trained on standard corpora.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>Custom embeddings:</head><p>Using any type of embedding with a custom dataset selected for this task or a fine-tuning process.</p><p>Recurrent Network: Using any variant of recurrent neural networks, such as GRU or LSTM, possibly combined with other deep learning architectures.</p><p>Knowledge Bases: Using any source of external semantic knowledge either to define features or to enrich the training set.</p><p>End to end: Designing a single system that is simultaneously trained on both subtasks and shares at least a part of the features, representation or learning parameters for both entities and relations.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="4.">Results</head><p>Table <ref type="table" target="#tab_1">2</ref> summarises the results obtained by each participant in each evaluation scenario. Results are sorted by $F_1$ in Scenario 1 which is considered the main evaluation. The top three results in each scenario are highlighted in bold.</p><p>Overall the best performing system was presented by Vicomtech <ref type="bibr" target="#b2">[3]</ref> which not only obtains the best result in Scenario 1 (by a significant margin), but also ranks among the top three in all scenarios. Likewise, the system proposed by Talp-UPC <ref type="bibr" target="#b3">[4]</ref> obtains the top result in Scenario 4, which is considered the most difficult scenario given the short number of training examples. It is also worth mentioning the results obtained by UH-MAJA-KD, who also rank among the top results in all scenarios, and the difference with the previous best result is less than 0.001 in two scenarios, which can be considered statistically insignificant.</p><p>Finally, it is interesting to note that the systems that obtained the best results for each individual task (i.e., SINAI in Scenario 2 and IXA-NER-RE in Scenario 3) do not rank among the top three in the general scenarios. This suggests an interesting trade-off between focusing on solving one specific task or designing a generally well-performing system. </p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="4.1.">Analysis of Systems Performance</head><p>According to the characteristics defined in Section 3.1, we performed a qualitative analysis of the most successful strategies in each scenario. Figure <ref type="figure" target="#fig_1">2</ref> shows a box-plot of the ranking obtained by systems with each of the characteristics defined above, per evaluation scenario. The box-plot shows the mean, inter-quartile ranges, and the minimum and maximum score among all systems with a given characteristic. As observed, the common strategy of using contextual embeddings and recurrent networks is capable of producing results in the full range of rankings. However, several systems have deployed and tailored this strategy, producing results with a range of variations. Hence, the use of BERT or LSTM layers alone does not guarantee a successful strategy. Likewise, as observed in previous editions, the use of custom embeddings seems to incur a marginal disadvantage, perhaps given that training high-quality embeddings in domain-specific corpora is difficult. On the other hand, the use of external knowledge bases to enrich semantic representations seems to be helpful in the entity recognition subtask, as exemplified by the result obtained by SINAI <ref type="bibr" target="#b7">[8]</ref>. The single most successful approach seems to be the design of end-to-end architectures as opposed to solving both subtasks separately. This has been a trend in all the editions of the eHealth-KD challenge and is one of the most significant insights. The fact that end-to-end systems consistently outperform other approaches indicates that there is an interesting interaction between the semantic representation of entities and relations. Both end-to-end approaches presented provide an important advantage in terms of internal feedback exchange when resolving Subtask A and Subtask B, enhancing the discovery of entities and relations. 
This approach supports the idea that both subtasks are not completely independent of each other. However, as explained in Section 4, while end-to-end systems outperform all other approaches in Scenarios 1 and 4, where both subtasks are performed, there are subtask-specific approaches that perform best when only one of the tasks is evaluated.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="5.">Conclusions and Future Work</head><p>The eHealth-KD 2020 proposed—as with the previous editions eHealth-KD 2019 <ref type="bibr" target="#b10">[11]</ref> and eHealth-KD 2018 <ref type="bibr" target="#b11">[12]</ref>—the modelling of human language in a scenario in which Spanish electronic health documents could be machine-readable from a semantic point of view. With this task, we expected to encourage the development of software technologies to automatically extract a large variety of knowledge from eHealth documents written in the Spanish Language. For this purpose, a new Spanish language corpus was manually annotated. Likewise, we provided tools to simplify the construction of knowledge discovery systems based on this corpus. In the challenge, eight systems were presented achieving a maximum F1 score of 0.665. All participants presented algorithms in all scenarios, with the end-to-end systems obtaining the best results. The most significant change in the 2020 edition with respect to previous ones is the use of contextual embeddings (i.e., transformer architectures, and specifically BERT) as a replacement for static word embeddings. The results indicate that although promising approaches were presented in the challenge, the extraction of general-purpose semantic relations from natural language text is still an open area of research. Moreover, even though modern deep learning approaches are the most successful, we believe there is still a margin for improvement by incorporating knowledge-based components that can exploit the structure of the annotation model.</p></div><figure xmlns="http://www.tei-c.org/ns/1.0" xml:id="fig_0"><head>Figure 1 :</head><label>1</label><figDesc>Figure 1: Example annotation of three sentences from the eHealth-KD challenge.</figDesc></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" xml:id="fig_1"><head>Figure 2 :</head><label>2</label><figDesc>Figure 2: Box-plot of the distribution of ranking for the systems that applied each of the approaches defined in Section 3.1.</figDesc></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" type="table" xml:id="tab_0"><head>Table 1</head><label>1</label><figDesc>Summary statistics of the eHealth-KD Corpus v2.0. Key phrases and relation labels are sorted by the number of instances in the training set. The training and development collections (marked with *) have been reused from previous editions.</figDesc><table><row><cell>Metric</cell><cell>Total</cell><cell>Training</cell><cell>DEV/Main</cell><cell>DEV/Transfer</cell><cell>Test</cell><cell>Ensemble</cell></row><row><cell>Sentences</cell><cell>3400</cell><cell>800  *</cell><cell>200  *</cell><cell>100</cell><cell>300</cell><cell>3000</cell></row><row><cell>Entities</cell><cell>25225</cell><cell>5012</cell><cell>1305</cell><cell>1242</cell><cell>2921</cell><cell>14745</cell></row><row><cell>-Concept</cell><cell>16207</cell><cell>3112</cell><cell>797</cell><cell>841</cell><cell>1944</cell><cell>9513</cell></row><row><cell>-Action</cell><cell>6431</cell><cell>1319</cell><cell>340</cell><cell>278</cell><cell>628</cell><cell>3866</cell></row><row><cell>-Predicate</cell><cell>1902</cell><cell>412</cell><cell>124</cell><cell>104</cell><cell>299</cell><cell>963</cell></row><row><cell>-Reference</cell><cell>685</cell><cell>169</cell><cell>44</cell><cell>19</cell><cell>50</cell><cell>403</cell></row><row><cell>Relations</cell><cell>20504</cell><cell>4571</cell><cell>1204</cell><cell>1241</cell><cell>2710</cell><cell>10778</cell></row><row><cell>-target</cell><cell>6376</cell><cell>1281</cell><cell>350</cell><cell>270</cell><cell>562</cell><cell>3913</cell></row><row><cell>-subject</cell><cell>3156</cell><cell>674</cell><cell>170</cell><cell>251</cell><cell>438</cell><cell>1623</cell></row><row><cell>-in-context</cell><cell>2503</cell><cell>502</cell><cell>140</cell><cell>193</cell><cell>380</cell><cell>1288</cell></row><row><cell>-is-a</cell><cell>2013</cell><cell>458</cell><cell>104</cell><cell>119</cell><cell>262</cell><cell>1070</cell></row><row><cell>-in-place</cell><cell>1250</cell><cell>304</cell><cell>77</cell
><cell>111</cell><cell>237</cell><cell>521</cell></row><row><cell>-causes</cell><cell>890</cell><cell>292</cell><cell>71</cell><cell>30</cell><cell>92</cell><cell>405</cell></row><row><cell>-domain</cell><cell>994</cell><cell>269</cell><cell>74</cell><cell>82</cell><cell>196</cell><cell>373</cell></row><row><cell>-argument</cell><cell>857</cell><cell>254</cell><cell>73</cell><cell>47</cell><cell>185</cell><cell>298</cell></row><row><cell>-entails</cell><cell>308</cell><cell>117</cell><cell>43</cell><cell>11</cell><cell>28</cell><cell>109</cell></row><row><cell>-in-time</cell><cell>489</cell><cell>126</cell><cell>26</cell><cell>81</cell><cell>127</cell><cell>129</cell></row><row><cell>-has-property</cell><cell>1088</cell><cell>134</cell><cell>18</cell><cell>18</cell><cell>91</cell><cell>827</cell></row><row><cell>-same-as</cell><cell>346</cell><cell>93</cell><cell>31</cell><cell>19</cell><cell>66</cell><cell>137</cell></row><row><cell>-part-of</cell><cell>234</cell><cell>67</cell><cell>27</cell><cell>9</cell><cell>46</cell><cell>85</cell></row></table></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" type="table" xml:id="tab_1"><head>Table 2</head><label>2</label><figDesc>Results ($F_1$ metric) in each scenario, sorted by Scenario 1 (column Score). The top results per scenario are highlighted in bold.</figDesc><table><row><cell></cell><cell>Score ($F_1$)</cell></row><row><cell>Team</cell><cell>Scn 1 Scn 2 Scn 3 Scn 4 Characteristics</cell></row><row><cell>Vicomtech</cell><cell>0.665 0.820 0.583 0.563 Recurrent Network, Contextual embedding, End-to-end</cell></row><row><cell>Talp-UPC</cell><cell>0.626 0.815 0.574 0.583 Recurrent Network, Contextual embedding, Static embedding, NLP, End-to-end</cell></row><row><cell cols="2">UH-MAJA-KD 0.625 0.814 0.598 0.547 Recurrent Network, Contextual embedding, NLP</cell></row><row><cell>IXA-NER-RE</cell><cell>0.557 0.691 0.633 0.478 Recurrent Network, Contextual embedding, Custom embedding</cell></row><row><cell>UH-MatCom</cell><cell>0.556 0.794 0.545 0.373 Recurrent Network, Contextual embedding, NLP, Knowledge Bases</cell></row><row><cell>SINAI</cell><cell>0.420 0.825 0.461 0.281 Recurrent Network, Contextual embedding, Custom embedding, Knowledge Bases</cell></row><row><cell>HAPLAP</cell><cell>0.395 0.541 0.316 0.137 Recurrent Network, Contextual embedding</cell></row><row><cell>ExSim</cell><cell>0.245 0.314 0.131 0.122 NLP, Static embedding</cell></row></table></figure>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="1" xml:id="foot_0">http://alt.qcri.org/semeval2020/</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="2" xml:id="foot_1">http://www.clef-initiative.eu/</note>
		</body>
		<back>

			<div type="acknowledgement">
<div xmlns="http://www.tei-c.org/ns/1.0"><head>Acknowledgments</head><p>This research has been partially supported by the University of Alicante and University of Havana, the Generalitat Valenciana (Conselleria d'Educació, Investigació, Cultura i Esport) and the Spanish Government through the projects SIIA (PROMETEO/2018/089, PROMETEU/2018/089) and LIVING-LANG (RTI2018-094653-B-C22).</p></div>
			</div>

			<div type="references">

				<listBibl>

<biblStruct xml:id="b0">
	<analytic>
		<title level="a" type="main">A general-purpose annotation model for knowledge discovery: Case study in spanish clinical text</title>
		<author>
			<persName><forename type="first">A</forename><surname>Piad-Morffis</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Y</forename><surname>Gutiérrez</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Estevez-Velarde</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><surname>Muñoz</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">Proceedings of the 2nd Clinical Natural Language Processing Workshop</title>
				<meeting>the 2nd Clinical Natural Language Processing Workshop</meeting>
		<imprint>
			<date type="published" when="2019">2019</date>
			<biblScope unit="page" from="79" to="88" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b1">
	<analytic>
		<title level="a" type="main">A computational ecosystem to support ehealth knowledge discovery technologies in spanish</title>
		<author>
			<persName><forename type="first">A</forename><surname>Piad-Morffis</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Y</forename><surname>Gutiérrez</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Y</forename><surname>Almeida-Cruz</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><surname>Muñoz</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Journal of Biomedical Informatics</title>
		<imprint>
			<biblScope unit="page">103517</biblScope>
			<date type="published" when="2020">2020</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b2">
	<analytic>
		<title level="a" type="main">Vicomtech at eHealth-KD Challenge 2020: Deep End-to-End Model for Entity and Relation Extraction in Medical Text</title>
		<author>
			<persName><forename type="first">A</forename><surname>García-Pablos</surname></persName>
		</author>
		<author>
			<persName><forename type="first">N</forename><surname>Perez</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Cuadros</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><surname>Zotova</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">Proceedings of the Iberian Languages Evaluation Forum co-located with 36th Conference of the Spanish Society for Natural Language Processing</title>
				<meeting>the Iberian Languages Evaluation Forum co-located with 36th Conference of the Spanish Society for Natural Language Processing<address><addrLine>IberLEF@SEPLN</addrLine></address></meeting>
		<imprint>
			<date type="published" when="2020">2020</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b3">
	<analytic>
		<title level="a" type="main">TALP at eHealth-KD Challenge 2020: Multi-Level Recurrent and Convolutional Neural Networks for Joint Classification of Key-Phrases and Relations</title>
		<author>
			<persName><forename type="first">S</forename><surname>Medina</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Turmo</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">Proceedings of the Iberian Languages Evaluation Forum co-located with 36th Conference of the Spanish Society for Natural Language Processing</title>
				<meeting>the Iberian Languages Evaluation Forum co-located with 36th Conference of the Spanish Society for Natural Language Processing<address><addrLine>IberLEF@SEPLN</addrLine></address></meeting>
		<imprint>
			<date type="published" when="2020">2020</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b4">
	<analytic>
		<title level="a" type="main">UH-MAJA-KD at eHealth-KD Challenge 2020: Deep Learning Models for Knowledge Discovery in Spanish eHealth Documents</title>
		<author>
			<persName><forename type="first">A</forename><forename type="middle">Rodríguez</forename><surname>Pérez</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><surname>Caballero</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><forename type="middle">Mederos</forename><surname>Alvarado</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><surname>Cruz-Linares</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><forename type="middle">P</forename><surname>Consuegra-Ayala</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">Proceedings of the Iberian Languages Evaluation Forum co-located with 36th Conference of the Spanish Society for Natural Language Processing</title>
				<meeting>the Iberian Languages Evaluation Forum co-located with 36th Conference of the Spanish Society for Natural Language Processing<address><addrLine>IberLEF@SEPLN</addrLine></address></meeting>
		<imprint>
			<date type="published" when="2020">2020</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b5">
	<analytic>
		<title level="a" type="main">IXA-NER-RE at eHealth-KD Challenge 2020: Cross-Lingual Transfer Learning for Medical Relation Extraction</title>
		<author>
			<persName><forename type="first">E</forename><surname>Andrés</surname></persName>
		</author>
		<author>
			<persName><forename type="first">O</forename><surname>Sainz</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Atutxa</surname></persName>
		</author>
		<author>
			<persName><forename type="first">O</forename><surname>Lopez De Lacalle</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">Proceedings of the Iberian Languages Evaluation Forum co-located with 36th Conference of the Spanish Society for Natural Language Processing</title>
				<meeting>the Iberian Languages Evaluation Forum co-located with 36th Conference of the Spanish Society for Natural Language Processing<address><addrLine>IberLEF@SEPLN</addrLine></address></meeting>
		<imprint>
			<date type="published" when="2020">2020</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b6">
	<analytic>
		<title level="a" type="main">UH-MatCom at eHealth-KD Challenge 2020: Deep-Learning and Ensemble Models for Knowledge Discovery in Spanish Documents</title>
		<author>
			<persName><forename type="first">J</forename><forename type="middle">P</forename><surname>Consuegra-Ayala</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Palomar</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">Proceedings of the Iberian Languages Evaluation Forum co-located with 36th Conference of the Spanish Society for Natural Language Processing</title>
				<meeting>the Iberian Languages Evaluation Forum co-located with 36th Conference of the Spanish Society for Natural Language Processing<address><addrLine>IberLEF@SEPLN</addrLine></address></meeting>
		<imprint>
			<date type="published" when="2020">2020</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b7">
	<analytic>
		<title level="a" type="main">SINAI at eHealth-KD Challenge 2020: Combining Word Embeddings for Named Entity Recognition in Spanish Medical Records</title>
		<author>
			<persName><forename type="first">P</forename><surname>López-Ubeda</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><forename type="middle">M</forename><surname>Perea-Ortega</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><forename type="middle">C</forename><surname>Díaz-Galiano</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><forename type="middle">T</forename><surname>Martín-Valdivia</surname></persName>
		</author>
		<author>
			<persName><forename type="first">L</forename><forename type="middle">A</forename><surname>Ureña-López</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">Proceedings of the Iberian Languages Evaluation Forum co-located with 36th Conference of the Spanish Society for Natural Language Processing</title>
				<meeting>the Iberian Languages Evaluation Forum co-located with 36th Conference of the Spanish Society for Natural Language Processing<address><addrLine>IberLEF@SEPLN</addrLine></address></meeting>
		<imprint>
			<date type="published" when="2020">2020</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b8">
	<analytic>
		<title level="a" type="main">HapLap at eHealth-KD Challenge 2020</title>
		<author>
			<persName><forename type="first">S</forename><surname>Santana</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Pérez</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Casillas</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">Proceedings of the Iberian Languages Evaluation Forum co-located with 36th Conference of the Spanish Society for Natural Language Processing</title>
				<meeting>the Iberian Languages Evaluation Forum co-located with 36th Conference of the Spanish Society for Natural Language Processing<address><addrLine>IberLEF@SEPLN</addrLine></address></meeting>
		<imprint>
			<date type="published" when="2020">2020</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b9">
	<analytic>
		<title level="a" type="main">ExSim at eHealth-KD Challenge 2020</title>
		<author>
			<persName><forename type="first">Z</forename><forename type="middle">Hamzah</forename><surname>Almugbel</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">Proceedings of the Iberian Languages Evaluation Forum co-located with 36th Conference of the Spanish Society for Natural Language Processing</title>
				<meeting>the Iberian Languages Evaluation Forum co-located with 36th Conference of the Spanish Society for Natural Language Processing<address><addrLine>IberLEF@SEPLN</addrLine></address></meeting>
		<imprint>
			<date type="published" when="2020">2020</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b10">
	<analytic>
		<title level="a" type="main">Overview of the ehealth knowledge discovery challenge at iberlef 2019</title>
		<author>
			<persName><forename type="first">A</forename><surname>Piad-Morffis</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Y</forename><surname>Gutiérrez</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><forename type="middle">P</forename><surname>Consuegra-Ayala</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Estevez-Velarde</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Y</forename><surname>Almeida-Cruz</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><surname>Muñoz</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Montoyo</surname></persName>
		</author>
		<ptr target="http://ceur-ws.org/Vol-2421/eHealth-KD_overview.pdf" />
	</analytic>
	<monogr>
		<title level="m">Proceedings of the Iberian Languages Evaluation Forum co-located with 35th Conference of the Spanish Society for Natural Language Processing, IberLEF@SEPLN 2019</title>
				<meeting>the Iberian Languages Evaluation Forum co-located with 35th Conference of the Spanish Society for Natural Language Processing, IberLEF@SEPLN 2019<address><addrLine>Bilbao, Spain</addrLine></address></meeting>
		<imprint>
			<date type="published" when="2019-09-24">September 24th, 2019</date>
			<biblScope unit="page" from="1" to="16" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b11">
	<analytic>
		<title level="a" type="main">Overview of TASS 2018: Opinions, health and emotions</title>
		<author>
			<persName><forename type="first">E</forename><forename type="middle">M</forename><surname>Cámara</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Y</forename><surname>Almeida-Cruz</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><forename type="middle">C</forename><surname>Díaz-Galiano</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Estévez-Velarde</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><forename type="middle">Á G</forename><surname>Cumbreras</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><forename type="middle">G</forename><surname>Vega</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Y</forename><surname>Gutiérrez</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Montejo-Ráez</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Montoyo</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><surname>Muñoz</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Piad-Morffis</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Villena-Román</surname></persName>
		</author>
		<ptr target="http://ceur-ws.org/Vol-2172/p0_overview_tass2018.pdf" />
	</analytic>
	<monogr>
		<title level="m">Proceedings of TASS 2018: Workshop on Semantic Analysis at SEPLN, TASS@SEPLN 2018, co-located with 34nd SEPLN Conference (SEPLN 2018)</title>
				<meeting>TASS 2018: Workshop on Semantic Analysis at SEPLN, TASS@SEPLN 2018, co-located with 34nd SEPLN Conference (SEPLN 2018)<address><addrLine>Sevilla, Spain</addrLine></address></meeting>
		<imprint>
			<date type="published" when="2018-09-18">September 18th, 2018</date>
			<biblScope unit="page" from="13" to="27" />
		</imprint>
	</monogr>
</biblStruct>

				</listBibl>
			</div>
		</back>
	</text>
</TEI>
