<?xml version="1.0" encoding="UTF-8"?><?xml-model type="application/xml-dtd" href="http://jats.nlm.nih.gov/publishing/1.1d3/JATS-journalpublishing1.dtd"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.1d3 20150301//EN" "http://jats.nlm.nih.gov/publishing/1.1d3/JATS-journalpublishing1.dtd">
<article xmlns:ali="http://www.niso.org/schemas/ali/1.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:mml="http://www.w3.org/1998/Math/MathML" dtd-version="1.1d3" specific-use="Marcalyc 1.2" article-type="research-article" xml:lang="es">
<front>
<journal-meta>
<journal-id journal-id-type="redalyc">3442</journal-id>
<journal-title-group>
<journal-title specific-use="original" xml:lang="es">TecnoLógicas</journal-title>
</journal-title-group>
<issn pub-type="ppub">0123-7799</issn>
<issn pub-type="epub">2256-5337</issn>
<publisher>
<publisher-name>Instituto Tecnológico Metropolitano</publisher-name>
<publisher-loc>
<country>Colombia</country>
<email>tecnologicas@itm.edu.co</email>
</publisher-loc>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="art-access-id" specific-use="redalyc">344262226006</article-id>
<article-id pub-id-type="doi">10.22430/22565337.1483</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Sin sección</subject>
</subj-group>
</article-categories>
<title-group>
<article-title xml:lang="es">Cómo adaptar un modelo de aprendizaje profundo a un nuevo dominio: el caso de la extracción de relaciones biomédicas</article-title>
<trans-title-group>
<trans-title xml:lang="en">How to Adapt Deep Learning Models to a New Domain: The Case of Biomedical Relation Extraction</trans-title>
</trans-title-group>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="no">
<contrib-id contrib-id-type="orcid">http://orcid.org/0000-0002-3879-3320</contrib-id>
<name name-style="western">
<surname>Peña-Torres</surname>
<given-names>Jefferson A.</given-names>
</name>
<xref ref-type="aff" rid="aff1"/>
<email>jefferson.amado.pena@correounivalle.edu.co</email>
</contrib>
<contrib contrib-type="author" corresp="no">
<contrib-id contrib-id-type="orcid">http://orcid.org/0000-0001-9941-6206</contrib-id>
<name name-style="western">
<surname>Gutiérrez</surname>
<given-names>Raúl E.</given-names>
</name>
<xref ref-type="aff" rid="aff4"/>
<email>raul.gutierrez@correounivalle.edu.co</email>
</contrib>
<contrib contrib-type="author" corresp="no">
<contrib-id contrib-id-type="orcid">http://orcid.org/0000-0002-0885-8699</contrib-id>
<name name-style="western">
<surname>Bucheli</surname>
<given-names>Víctor A.</given-names>
</name>
<xref ref-type="aff" rid="aff3"/>
<email>victor.bucheli@correounivalle.edu.co</email>
</contrib>
<contrib contrib-type="author" corresp="no">
<contrib-id contrib-id-type="orcid">http://orcid.org/0000-0001-9009-7288</contrib-id>
<name name-style="western">
<surname>González</surname>
<given-names>Fabio A.</given-names>
</name>
<xref ref-type="aff" rid="aff5"/>
<email>fagonzalezo@unal.edu.co</email>
</contrib>
</contrib-group>
<aff id="aff1">
<institution content-type="original">Ingeniero de Sistemas, Escuela de Ingeniería de Sistemas y Computación, Universidad del Valle, Cali- Colombia, jefferson.amado.pena@correounivalle.edu.co</institution>
<institution content-type="orgname">Universidad del Valle</institution>
<country country="CO">Colombia</country>
</aff>
<aff id="aff4">
<institution content-type="original">PhD en Ingeniería, Escuela de Ingeniería de Sistemas y Computación, Universidad del Valle, Cali- Colombia, raul.gutierrez@correounivalle.edu.co</institution>
<institution content-type="orgname">Universidad del Valle</institution>
<country country="CO">Colombia</country>
</aff>
<aff id="aff3">
<institution content-type="original">PhD en Ingeniería, Escuela de Ingeniería de Sistemas y Computación, Universidad del Valle, Cali- Colombia, victor.bucheli@correounivalle.edu.co</institution>
<institution content-type="orgname">Universidad del Valle</institution>
<country country="CO">Colombia</country>
</aff>
<aff id="aff5">
<institution content-type="original">PhD en Ingeniería, Departamento de Ingeniería de Sistemas e Industrial, Universidad Nacional de Colombia, Bogotá- Colombia, fagonzalezo@unal.edu.co</institution>
<institution content-type="orgname">Universidad Nacional de Colombia</institution>
<country country="CO">Colombia</country>
</aff>
<pub-date pub-type="epub-ppub">
<season>Noviembre-Diciembre</season>
<year>2019</year>
</pub-date>
<volume>22</volume>
<fpage>49</fpage>
<lpage>62</lpage>
<history>
<date date-type="received" publication-format="dd mes yyyy">
<day>25</day>
<month>09</month>
<year>2019</year>
</date>
<date date-type="accepted" publication-format="dd mes yyyy">
<day>19</day>
<month>11</month>
<year>2019</year>
</date>
</history>
<permissions>
<copyright-statement>Atribución-NoComercial-CompartirIgual 4.0 Internacional (CC BY-NC-SA 4.0)</copyright-statement>
<copyright-year>2019</copyright-year>
<copyright-holder>Instituto Tecnológico Metropolitano</copyright-holder>
<ali:free_to_read/>
<license xlink:href="https://creativecommons.org/licenses/by-nc-sa/4.0/deed.es">
<ali:license_ref>https://creativecommons.org/licenses/by-nc-sa/4.0/deed.es</ali:license_ref>
<license-p>Atribución-NoComercial-CompartirIgual 4.0 Internacional (CC BY-NC-SA 4.0)</license-p>
</license>
</permissions>
<abstract xml:lang="es">
<title>Resumen</title>
<p>En este trabajo estudiamos el problema de extracción de relaciones del Procesamiento de Lenguaje Natural (PLN). Realizamos una configuración para la adaptación de dominio sin recursos externos. De esta forma, entrenamos un modelo con aprendizaje profundo (DL) para la extracción de relaciones (RE). El modelo permite extraer relaciones semánticas para el dominio biomédico. Sin embargo, ¿El modelo puede ser aplicado a diferentes dominios? El modelo debería adaptarse automáticamente para la extracción de relaciones entre diferentes dominios usando la red de DL. Entrenar completamente modelos DL en una escala de tiempo corta no es práctico, deseamos que los modelos se adapten rápidamente de diferentes conjuntos de datos con varios dominios y sin demora. Así, la adaptación es crucial para los sistemas inteligentes que operan en el mundo real, donde los factores cambiantes y las perturbaciones imprevistas son habituales. En este artículo, presentamos un análisis detallado del problema, una experimentación preliminar, resultados y la discusión acerca de los resultados.</p>
</abstract>
<trans-abstract xml:lang="en">
<title>Abstract</title>
<p>In this article, we study the relation extraction problem from Natural Language Processing (NLP) implementing a domain adaptation setting without external resources. We trained a Deep Learning (DL) model for Relation Extraction (RE), which extracts semantic relations in the biomedical domain. However, can the model be applied to different domains? The model should be adaptable to automatically extract relationships across different domains using the DL network. Completely training DL models in a short time is impractical because the models should quickly adapt to different datasets in several domains without delay. Therefore, adaptation is crucial for intelligent systems, where changing factors and unanticipated perturbations are common. In this study, we present a detailed analysis of the problem, as well as preliminary experimentation, results, and their evaluation.</p>
</trans-abstract>
<kwd-group xml:lang="en">
<title>Keywords</title>
<kwd>Semantic Extraction</kwd>
<kwd>Deep Learning</kwd>
<kwd>Relation Extraction</kwd>
<kwd>Natural Language Processing</kwd>
</kwd-group>
<kwd-group xml:lang="es">
<title>Palabras clave</title>
<kwd>Extracción semántica</kwd>
<kwd>Aprendizaje profundo</kwd>
<kwd>Extracción de relaciones</kwd>
<kwd>Procesamiento de lenguaje natural</kwd>
</kwd-group>
<counts>
<fig-count count="1"/>
<table-count count="6"/>
<equation-count count="0"/>
<ref-count count="47"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>Cómo citar / How to cite</meta-name>
<meta-value>J. A. Peña-Torres, R. E. Gutiérrez, V. A. Bucheli, F. A. González, “How to Adapt Deep Learning Models to a New Domain: The Case of Biomedical Relation Extraction”, <italic>TecnoLógicas</italic>, vol. 22, pp. 49-62, 2019. https://doi.org/10.22430/22565337.1483</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec>
<title>
<bold>1. INTRODUCTION</bold>
</title>
<p>In this study, we address the Relation Extraction (RE) problem as follows: For a given sentence <italic>S</italic>, the RE problem is a classification problem, where the goal is to predict a semantic relation <italic>r</italic> between e<sub>1</sub> and e<sub>2</sub>, both entities in <italic>S</italic>, following previous research, mainly <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref0">1</xref>]</sup>, as our baseline model. RE plays a key role in information extraction from unstructured text, and it has a wide range of applications in many domains <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref1">2</xref>]-[<xref ref-type="bibr" rid="redalyc_344262226006_ref3">4</xref>]</sup>.</p>
<p>The rapid growth of unstructured text data and the valuable knowledge recorded in them has generated considerable interest in automatic detection and extraction of semantic relations <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref4">5</xref>]</sup>.</p>
<p>Although many studies have been conducted to develop supervised relation extraction models <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref5">6</xref>]-[<xref ref-type="bibr" rid="redalyc_344262226006_ref8">9</xref>]</sup>, neural network-based approaches have been proposed for relation extraction, in particular with deep learning, e.g., Recursive Neural Networks <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref9">10</xref>]-[<xref ref-type="bibr" rid="redalyc_344262226006_ref11">12</xref>]</sup>, Recurrent Neural Networks (RNNs) <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref12">13</xref>]-[<xref ref-type="bibr" rid="redalyc_344262226006_ref14">15</xref>]</sup>, and Convolutional Neural Networks (CNNs) <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref0">1</xref>], [<xref ref-type="bibr" rid="redalyc_344262226006_ref1">2</xref>], [<xref ref-type="bibr" rid="redalyc_344262226006_ref15">16</xref>]-[<xref ref-type="bibr" rid="redalyc_344262226006_ref17">18</xref>]</sup>.</p>
<p>Deep Learning (DL) has demonstrated its efficiency in improving the RE task.</p>
<p>Specifically regarding relations in the English language, the deep learning (DL) models have been trained with little or no domain knowledge, and several studies have implemented DL methods for relation extraction from texts. However, depending on the language and domain of deep learning models for relation extraction, the following challenges may arise: (a) a lack of training samples in some languages and domains and (b) the generalization of the model in a domain with different types of relations.</p>
<p>Against this backdrop, some researchers have been successful in performing RE for a specific domain. They have utilized large amounts of labelled data. However, there are insufficient labelled data for certain domains and languages. Therefore, domain adaptation, domain shift, domain bias, and domain transfer are used to perform relation extraction in an unseen target domain or language. However, the factors and conditions that are appropriate for training and testing DL models with different types of datasets in a target domain or language should be explored. Therefore, transferring well-trained DL models to other domains remains a challenge.</p>
<p>This paper presents a baseline DL model <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref0">1</xref>]</sup> and an experiment conducted using multiple representations from the biomedical domain. To address both challenges mentioned above, we describe the impact of some biomedical datasets, the generalization capability of the deep learning model, and compare its performance when some representations of the baseline model are modified for the biomedical domain.</p>
<p>This paper is organized as follows.</p>
<p>Section 2 presents a DL model based on <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref0">1</xref>], [<xref ref-type="bibr" rid="redalyc_344262226006_ref15">16</xref>]</sup> for relation extraction, considering the potential of DL for RE tasks in bioinformatics research (biology, biomedicine, and healthcare). Section 3 describes a suitable way to adapt a well-trained model to the biomedical domain.</p>
<p>Section 4 details the experimental setup and the evaluation of the baseline model on multiple public PPI, DDI and CPI corpora. The last two sections discuss and summarize the representations of the impacts and the behavior of the baseline model on the datasets.</p>
</sec>
<sec>
<title>
<bold>2. RELATED WORK</bold>
</title>
<p>Traditionally, Relation Extraction (RE) has been a classification problem that occurs between two or more named entities in the same sentence that have a semantic relationship. Depending on the number of semantic relation classes, RE tasks can be binary or multi-class. In this study, we considered a binary relation extraction task in the biomedical domain <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref18">19</xref>]-[<xref ref-type="bibr" rid="redalyc_344262226006_ref21">22</xref>]</sup>.</p>
<p>Said task achieves a high performance with supervised approaches; however, it needs annotated data, which is time consuming and entails intensive human labor.  Recently, models based on deep neural networks, such as CNNs and RNNs, have shown promising results for RE.</p>
<p>For example, in <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref0">1</xref>]</sup>, the authors explored RE without exhaustive pre-processing. They employed a CNN and observed that any automatically learned features yielded promising results and could potentially replace the manually designed features.</p>
<p>In turn, in <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref9">10</xref>], [<xref ref-type="bibr" rid="redalyc_344262226006_ref22">23</xref>]</sup> other authors proposed a DL approach with an RNN architecture and a matrix-vector word representation to explore the impact of the lack of explicit knowledge about the type of relation. Likewise, a study <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref10">11</xref>]</sup> compared the capabilities of CNN and RNN for the relation classification task. We reviewed other articles on relation extraction without a specific domain. We also surveyed some models in the literature classified by network architecture and dataset. We hope this survey provides an overview to select a baseline model.</p>
<p>In <xref ref-type="table" rid="gt1">Table 1</xref>, the baseline is marked in boldface, the CNN and RNN-based Models are learned on SemEval 2010, and the category Others is relevant for Deep Learning and RE tasks.</p>
<p>Table 1. Survey of studies into RE tasks using Deep Learning approaches.</p>
<p>
<table-wrap id="gt1">
<label>Table 1</label>
<caption>
<title>Survey of studies into RE tasks using Deep Learning approaches</title>
</caption>
<alt-text>Table 1 Survey of studies into RE tasks using Deep Learning approaches</alt-text>
<alternatives>
<graphic xlink:href="344262226006_gt2.png" position="anchor" orientation="portrait"/>
<table style="width:451.0pt;border-collapse:collapse;border:none;" id="gt2-526564616c7963">
<tbody>
<tr style="height:10.6pt">
<td style="width:451.0pt;border-top:solid windowtext 1.0pt;   border-left:none;border-bottom:solid windowtext 1.0pt;border-right:none;      padding:5.0pt 5.0pt 5.0pt 5.0pt;height:10.6pt" colspan="2">
<bold>CNN-based Models</bold>
</td>
</tr>
<tr style="height:10.2pt">
<td style="width:216.55pt;border:none;   padding:5.0pt 5.0pt 5.0pt 5.0pt;height:10.2pt">MODEL</td>
<td style="width:234.45pt;border:none;   padding:5.0pt 5.0pt 5.0pt 5.0pt;height:10.2pt">F1</td>
</tr>
<tr style="height:12.75pt">
<td style="width:216.55pt;border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:12.75pt">CNN <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref0">1</xref>]</sup>
</td>
<td style="width:234.45pt;border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:12.75pt">82.7</td>
</tr>
<tr style="height:11.65pt">
<td style="width:216.55pt;border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:11.65pt">CR-CNN <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref16">17</xref>]</sup>
</td>
<td style="width:234.45pt;border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:11.65pt">84.1</td>
</tr>
<tr style="height:10.45pt">
<td style="width:216.55pt;border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:10.45pt">CNN<sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref15">16</xref>]</sup>
</td>
<td style="width:234.45pt;border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:10.45pt">82.8</td>
</tr>
<tr style="height:8.7pt">
<td style="width:216.55pt;border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:8.7pt">Attention- CNN <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref23">24</xref>]</sup>
</td>
<td style="width:234.45pt;border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:8.7pt">85.4</td>
</tr>
<tr style="height:15.5pt">
<td style="width:216.55pt;border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:15.5pt">depLCNN + NS <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref17">18</xref>]</sup>
</td>
<td style="width:234.45pt;border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:15.5pt">85.6</td>
</tr>
<tr style="height:10.8pt">
<td style="width:216.55pt;border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:10.8pt">Multi-Attention CNN <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref24">25</xref>]</sup>
</td>
<td style="width:234.45pt;border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:10.8pt">88.0</td>
</tr>
<tr style="height:9.7pt">
<td style="width:216.55pt;border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:9.7pt">Selection-Attention + CNN<sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref25">26</xref>]</sup>
</td>
<td style="width:234.45pt;border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:9.7pt">88.0</td>
</tr>
<tr style="height:8.65pt">
<td style="width:451.0pt;border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:8.65pt" colspan="2">
<bold>RNN-based Models</bold>
</td>
</tr>
<tr style="height:7.5pt">
<td style="width:216.55pt;border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:7.5pt">MV-RNN</td>
<td style="width:234.45pt;border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:7.5pt">82.4</td>
</tr>
<tr style="height:13.55pt">
<td style="width:216.55pt;border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:13.55pt">Entity-Att BLSTM<sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref9">10</xref>]</sup>
</td>
<td style="width:234.45pt;border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:13.55pt">85.2</td>
</tr>
<tr style="height:11.0pt">
<td style="width:216.55pt;border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:11.0pt">Hierarchical Attention BILSTM <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref26">27</xref>]</sup>
</td>
<td style="width:234.45pt;border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:11.0pt">84.3</td>
</tr>
<tr style="height:9.9pt">
<td style="width:216.55pt;border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:9.9pt">Attention BILSTM<sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref27">28</xref>]</sup>
</td>
<td style="width:234.45pt;border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:9.9pt">84.0</td>
</tr>
<tr style="height:8.8pt">
<td style="width:216.55pt;border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:8.8pt">BILSTM <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref13">14</xref>]</sup>
</td>
<td style="width:234.45pt;border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:8.8pt">82.7</td>
</tr>
<tr style="height:7.7pt">
<td style="width:451.0pt;border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:7.7pt" colspan="2">
<bold>Others</bold>
</td>
</tr>
<tr style="height:6.55pt">
<td style="width:216.55pt;border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:6.55pt">BRNN <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref28">29</xref>]</sup>
</td>
<td style="width:234.45pt;border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:6.55pt">86.3</td>
</tr>
<tr style="height:12.65pt">
<td style="width:216.55pt;border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:12.65pt">DRNN <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref29">30</xref>]</sup>
</td>
<td style="width:234.45pt;border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:12.65pt">86.1</td>
</tr>
<tr style="height:10.8pt">
<td style="width:216.55pt;border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:10.8pt">SDP-LSTM <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref12">13</xref>]</sup>
</td>
<td style="width:234.45pt;border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:10.8pt">83.7</td>
</tr>
<tr style="height:9.65pt">
<td style="width:216.55pt;border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:9.65pt">DepNN <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref30">31</xref>]</sup>
</td>
<td style="width:234.45pt;border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:9.65pt">83.6</td>
</tr>
<tr style="height:11.95pt">
<td style="width:216.55pt;border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:11.95pt">FCN <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref31">32</xref>]</sup>
</td>
<td style="width:234.45pt;border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:11.95pt">83.0</td>
</tr>
<tr style="height:7.5pt">
<td style="width:216.55pt;border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:7.5pt">RCNN <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref32">33</xref>]</sup>
</td>
<td style="width:234.45pt;border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:7.5pt">96.5</td>
</tr>
<tr style="height:11.95pt">
<td style="width:216.55pt;border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:11.95pt">PCNN <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref33">34</xref>]</sup>
</td>
<td style="width:234.45pt;border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:11.95pt">84.0</td>
</tr>
<tr style="height:11.95pt">
<td style="width:216.55pt;border:none;border-bottom:solid windowtext 1.0pt;   padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:11.95pt"/>
<td style="width:234.45pt;border:none;border-bottom:solid windowtext 1.0pt;   padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:11.95pt"/>
</tr>
</tbody>
</table>
</alternatives>
<attrib>Source: Created by the authors.</attrib>
</table-wrap>
</p>
<p>Most of the studies we reviewed are concerned with the English language, and their models have not been extended to other languages or domains. There is a variety of possible relations between domains and languages, characterized by their own syntactic and lexical properties.</p>
<p>Nevertheless, the notion of a relation, what it “means”, is inherently ambiguous <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref34">35</xref>]</sup>. Many efforts have been devoted to biomedical relation extraction, whose goal is to discover valuable knowledge about proteins, drugs, diseases, genes, adverse effects, and other biological interactions from unstructured free text <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref35">36</xref>]</sup>.</p>
</sec>
<sec>
<title>
<bold>3. METHODOLOGY</bold>
</title>
<p>In this section, we introduce a model architecture based on Convolutional Neural Networks (CNN) and modifications that allow other representations.</p>
<sec>
<title>
<bold>3.1 Model</bold>
</title>
<p>Based on the literature review above, the architecture with the best performance for RE tasks is the CNN <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref36">37</xref>]</sup>. The model used in this paper contains three components: (a) a convolutional layer with multiple window sizes, (b) a max pooling layer, and (c) a fully connected layer with dropout and softmax. Additionally, the input data undergoes a pre-transformation to vector representation. The transformation from words to vector representations has been described by several authors <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref37">38</xref>], [<xref ref-type="bibr" rid="redalyc_344262226006_ref38">39</xref>]</sup>.</p>
<p>We considered the model in <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref0">1</xref>]</sup> as the baseline model, and trained it to automatically find relevant information (features or patterns) in a source sentence to predict semantic relations. We also added several modifications to keep some key elements of the baseline model that are consistent and consequent with an RE task. The diagram of the baseline model is shown in <xref ref-type="fig" rid="gf1">Fig. 1</xref>.</p>
<p>
<fig id="gf1">
<label>Fig. 1.</label>
<caption>
<title>Diagram of the CNN-based model architecture implemented in this case study.</title>
<p>(a) Words from a sample sentence represented as vectors (Input layer). (b) Vector representation where convolutional kernels are applied (Convolutional layer). (c) Vector pooling resulting from convolutional kernel. (d) Max values representative of the relation.</p>
</caption>
<alt-text>Fig. 1. Diagram of the CNN-based model architecture implemented in this case study.</alt-text>
<graphic xlink:href="344262226006_gf2.png" position="anchor" orientation="portrait"/>
<attrib>Source: Created by the authors.</attrib>
</fig>
</p>
<p>CNN-based architectures learn semantic information from sentences in the hidden layers during training. Although the extraction of semantic information is not previously known, the convolution layers learn features in the representations of the source domain. In the baseline model, let <italic>S</italic> be an input sentence that could be represented as <italic>S</italic> = {w<sub>1</sub>, w<sub>2</sub>, w<sub>3</sub>…w<sub>n</sub>}, where w<sub>i</sub> is the <italic>i</italic>-th word in <italic>S</italic>; and let <italic>V</italic> be the vocabulary size of each dataset and <italic>V</italic> × <italic>d</italic>, the size of the embedding matrix with <italic>d</italic>-dimensional vectors from pre-trained word embeddings.</p>
<p>Since we aim to compare the modifications and addition of representations to the baseline model in the biomedical domain, we used different kernel sizes and softmax function modifications; afterward, we included multi representations that captured different characteristics from the input. All of them were gradually changed. Then, for each w<sub>i</sub> in <italic>S</italic>, the distributional and non-distributional representations were obtained and concatenated in a vector. As a result, a matrix representing <italic>S</italic> was processed by the model in order to perform the classification.</p>
<p>This is a crucial part of our study: in order to extract semantic relations, we needed to change the preprocessing, context length, paddings, and kernel sizes, and to validate the implementation of the baseline model.</p>
<p>Moreover, each word vector was supported by its corresponding information.</p>
</sec>
<sec>
<title>
<bold>3.2 Representations</bold>
</title>
<p>Representations have been effective tools to address the growing interest in DL for NLP tasks. While classical techniques used feature engineering and exploration to provide a more qualitative assessment and analysis of results from the point of view of computational linguistics, DL models learn features automatically.</p>
<p>In this paper, before <italic>S</italic> is processed by the baseline model, it is transformed in the form of a vector to capture different characteristics of the token; nevertheless, more information could be obtained from sentences to enhance automatic characterization via CNNs.</p>
<p>Multi-representation in DL models must be robust, and they should perform a satisfactory relation extraction in similar tasks across different domains. We used the following representations to add characteristic elements of sentences.</p>
<p>
<bold>Word Embedding</bold>: It is employed to capture syntactic and semantic meanings of words in distributed representations.</p>
<p>In sentence S, every word w<sub>i</sub> is represented by a real-valued vector.</p>
<p>These word representations are encoded in an embedding matrix X ∈ ℝ<sup>V×d</sup>, where V is the size of a fixed vocabulary and d is the dimension of the word vectors.</p>
<p>Unfortunately, said word representations usually take a long time to train, and freely available trained word embeddings are commonly implemented <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref39">40</xref>]</sup>. We used pre-trained word2vec <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref37">38</xref>]</sup>, Glove <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref38">39</xref>]</sup>, and FastText <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref40">41</xref>]</sup> to conduct the experiments.</p>
<p>
<bold>Position Embedding</bold>: In RE tasks, the words close to entities are usually informative and determine the relation between entities. We prove the relative position of words and entities, similar to <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref0">1</xref>]</sup>.</p>
<p>We used the relative position of both entity pairs. Apparently, it is not possible to capture such structural information only through semantic and syntactic word features. It is necessary to specify which input tokens are the target nouns in the sentence and where they are placed.</p>
<p>The position of entities is a relative distance, which is also mapped to vector representations.</p>
</sec>
</sec>
<sec>
<title>
<bold>4. EXPERIMENTS</bold>
</title>
<p>These experiments are intended to show that DL models (baseline) for Relation Extraction (RE) can be adapted to another domain using multi-representation. First, we introduce the datasets and the evaluation metrics: precision, recall, and F1-score. Next, we describe the parameters of the baseline model, the evaluation of the multi-representation, its effects, and performance on the data. Finally, we compare the performance of the baseline model with the modified model.</p>
<sec>
<title>
<bold>4.1. Datasets in the biomedical domain</bold>
</title>
<p>In this study, we explored RE tasks focused on the biomedical domain, especially relations such as protein-protein interactions (PPIs), drug-drug interactions (DDIs), and chemical-protein interactions (CPIs). Several scarce resources were utilized to adapt a pre-trained model.</p>
<p>We used three annotated corpora in the biomedical domain. All of them are publicly available and detailed below.</p>
<p>To extract semantic relations regarding Adverse Drug Effects, a subtask of DDI was applied to the corpus ADE-EX, as follows. The sentence “<italic>we report two cases of pseudoporphyria caused by naproxen and oxaprozin</italic>” contains a semantic relation of the type Adverse Drug Effect between <italic>pseudoporphyria</italic> and <italic>oxaprozin</italic>.</p>
<p>In turn, in BioInfer, we used the Protein-Protein interaction task to find semantic relations in the sentence “<italic>snf11 a new component of the yeast snf-swi complex that interacts with a conserved region of snf2</italic>”, where <italic>snf11</italic> and <italic>snf2</italic> are two named entities that represent proteins.</p>
<p>Likewise, in the corpus ChemProt, Chemical-Protein interactions are annotated. For example, in the sentence “<italic>Discovery of novel 2-hydroxydiarylamide derivatives as TMPRSS4 inhibitors</italic>”, 2-<italic>hydroxydiarylamide</italic> is a chemical and <italic>TMPRSS4</italic> is a protein with a semantic relation to said chemical. For protein-protein interactions (relations), we used the BioInfer dataset <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref41">42</xref>]</sup>. For adverse drug events, we used the ADE corpus <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref42">43</xref>]</sup>; and, for chemical-protein interactions, we used the ChemProt corpus <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref43">44</xref>]</sup>. The detailed information of each dataset is listed in <xref ref-type="table" rid="gt2">Table 2</xref>, <xref ref-type="table" rid="gt3">Table 3</xref> and <xref ref-type="table" rid="gt4">Table 4</xref>, respectively.</p>
<p>
<table-wrap id="gt2">
<label>Table 2</label>
<caption>
<title>Summary statistics of BioInfer dataset.</title>
</caption>
<alt-text>Table 2 Summary statistics of BioInfer dataset.</alt-text>
<alternatives>
<graphic xlink:href="344262226006_gt3.png" position="anchor" orientation="portrait"/>
<table style="width:282.65pt;border-collapse:collapse;border:none;" id="gt3-526564616c7963">
<tbody>
<tr style="height:11.45pt">
<td style="width:72.9pt;border-top:solid windowtext 1.0pt;   border-left:none;border-bottom:solid windowtext 1.0pt;border-right:none;      padding:5.0pt 5.0pt 5.0pt 5.0pt;height:11.45pt">
<bold>Name</bold>
</td>
<td style="width:79.2pt;border-top:solid windowtext 1.0pt;   border-left:none;border-bottom:solid windowtext 1.0pt;border-right:none;      padding:5.0pt 5.0pt 5.0pt 5.0pt;height:11.45pt">
<bold>Sentences</bold>
</td>
<td style="width:73.65pt;border-top:solid windowtext 1.0pt;   border-left:none;border-bottom:solid windowtext 1.0pt;border-right:none;      padding:5.0pt 5.0pt 5.0pt 5.0pt;height:11.45pt">
<bold>Positive samples</bold>
</td>
<td style="width:56.9pt;border-top:solid windowtext 1.0pt;   border-left:none;border-bottom:solid windowtext 1.0pt;border-right:none;      padding:5.0pt 5.0pt 5.0pt 5.0pt;height:11.45pt">
<bold>Total</bold>
</td>
</tr>
<tr style="height:8.55pt">
<td style="width:72.9pt;border:none;border-bottom:solid windowtext 1.0pt;      padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:8.55pt">BioInfer</td>
<td style="width:79.2pt;border:none;border-bottom:solid windowtext 1.0pt;      padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:8.55pt">1100</td>
<td style="width:73.65pt;border:none;border-bottom:solid windowtext 1.0pt;      padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:8.55pt">2534</td>
<td style="width:56.9pt;border:none;border-bottom:solid windowtext 1.0pt;      padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:8.55pt">9666</td>
</tr>
</tbody>
</table>
</alternatives>
<attrib>Source: [<xref ref-type="bibr" rid="redalyc_344262226006_ref41">42</xref>].</attrib>
</table-wrap>
</p>
<p>
<table-wrap id="gt3">
<label>Table 3</label>
<caption>
<title>Summary statistics of ADEEX dataset</title>
</caption>
<alt-text>Table 3 Summary statistics of ADEEX dataset</alt-text>
<alternatives>
<graphic xlink:href="344262226006_gt4.png" position="anchor" orientation="portrait"/>
<table style="width:349.75pt;border-collapse:collapse;border:none;" id="gt4-526564616c7963">
<tbody>
<tr style="height:9.0pt">
<td style="width:89.3pt;border-top:solid windowtext 1.0pt;   border-left:none;border-bottom:solid windowtext 1.0pt;border-right:none;      padding:5.0pt 5.0pt 5.0pt 5.0pt;height:9.0pt">
<bold>Name</bold>
</td>
<td style="width:100.55pt;border-top:solid windowtext 1.0pt;   border-left:none;border-bottom:solid windowtext 1.0pt;border-right:none;      padding:5.0pt 5.0pt 5.0pt 5.0pt;height:9.0pt">
<bold>Sentences</bold>
</td>
<td style="width:89.95pt;border-top:solid windowtext 1.0pt;   border-left:none;border-bottom:solid windowtext 1.0pt;border-right:none;      padding:5.0pt 5.0pt 5.0pt 5.0pt;height:9.0pt">
<bold>Positive samples</bold>
</td>
<td style="width:69.95pt;border-top:solid windowtext 1.0pt;   border-left:none;border-bottom:solid windowtext 1.0pt;border-right:none;      padding:5.0pt 5.0pt 5.0pt 5.0pt;height:9.0pt">
<bold>Total</bold>
</td>
</tr>
<tr style="height:3.75pt">
<td style="width:89.3pt;border:none;border-bottom:solid windowtext 1.0pt;      padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:3.75pt">ADE</td>
<td style="width:100.55pt;border:none;border-bottom:solid windowtext 1.0pt;      padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:3.75pt">4272</td>
<td style="width:89.95pt;border:none;border-bottom:solid windowtext 1.0pt;      padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:3.75pt">988</td>
<td style="width:69.95pt;border:none;border-bottom:solid windowtext 1.0pt;      padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:3.75pt">3184</td>
</tr>
</tbody>
</table>
</alternatives>
<attrib>Source: [<xref ref-type="bibr" rid="redalyc_344262226006_ref42">43</xref>].</attrib>
</table-wrap>
</p>
<p>
<table-wrap id="gt4">
<label>Table 4</label>
<caption>
<title>Summary statistics of ChemProt dataset</title>
</caption>
<alt-text>Table 4 Summary statistics of ChemProt dataset</alt-text>
<alternatives>
<graphic xlink:href="344262226006_gt5.png" position="anchor" orientation="portrait"/>
<table style="width:355.5pt;border-collapse:collapse;" id="gt5-526564616c7963">
<tbody>
<tr style="height:.85pt">
<td style="width:117.3pt;border-top:solid windowtext 1.0pt;   border-left:none;border-bottom:solid windowtext 1.0pt;border-right:none;      padding:5.0pt 5.0pt 5.0pt 5.0pt;height:.85pt"/>
<td style="width:238.2pt;border-top:solid windowtext 1.0pt;   border-left:none;border-bottom:solid windowtext 1.0pt;border-right:none;      padding:5.0pt 5.0pt 5.0pt 5.0pt;height:.85pt" colspan="3">
<bold>Positive samples</bold>
</td>
</tr>
<tr style="height:9.0pt">
<td style="width:117.3pt;border-top:none;border-left:none;   border-bottom:solid windowtext 1.0pt;border-right:solid windowtext 1.0pt;         padding:5.0pt 5.0pt 5.0pt 5.0pt;height:9.0pt">
<bold>Relation</bold>
</td>
<td style="width:130.3pt;border:none;border-bottom:solid windowtext 1.0pt;         padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:9.0pt">
<bold>Training Set</bold>
</td>
<td style="width:53.5pt;border:none;border-bottom:solid windowtext 1.0pt;      padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:9.0pt">
<bold>Dev. set</bold>
</td>
<td style="width:54.35pt;border:none;border-bottom:solid windowtext 1.0pt;      padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:9.0pt">
<bold>Test set</bold>
</td>
</tr>
<tr style="height:9.0pt">
<td style="width:117.3pt;border:none;border-right:solid windowtext 1.0pt;      padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:9.0pt">Active</td>
<td style="width:130.3pt;border:none;   padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:9.0pt">786</td>
<td style="width:53.5pt;border:none;   padding:5.0pt 5.0pt 5.0pt 5.0pt;height:9.0pt">550</td>
<td style="width:54.35pt;border:none;   padding:5.0pt 5.0pt 5.0pt 5.0pt;height:9.0pt">664</td>
</tr>
<tr style="height:9.0pt">
<td style="width:117.3pt;border:none;border-right:solid windowtext 1.0pt;   padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:9.0pt">Inhibitor</td>
<td style="width:130.3pt;border:none;   padding:5.0pt 5.0pt 5.0pt 5.0pt;height:9.0pt">2251</td>
<td style="width:53.5pt;padding:5.0pt 5.0pt 5.0pt 5.0pt;height:9.0pt">1092</td>
<td style="width:54.35pt;padding:5.0pt 5.0pt 5.0pt 5.0pt;height:   9.0pt">1661</td>
</tr>
<tr style="height:9.0pt">
<td style="width:117.3pt;border:none;border-right:solid windowtext 1.0pt;   padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:9.0pt">Agonist</td>
<td style="width:130.3pt;border:none;   padding:5.0pt 5.0pt 5.0pt 5.0pt;height:9.0pt">170</td>
<td style="width:53.5pt;padding:5.0pt 5.0pt 5.0pt 5.0pt;height:9.0pt">116</td>
<td style="width:54.35pt;padding:5.0pt 5.0pt 5.0pt 5.0pt;height:   9.0pt">194</td>
</tr>
<tr style="height:9.0pt">
<td style="width:117.3pt;border:none;border-right:solid windowtext 1.0pt;   padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:9.0pt">Antagonist</td>
<td style="width:130.3pt;border:none;   padding:5.0pt 5.0pt 5.0pt 5.0pt;height:9.0pt">234</td>
<td style="width:53.5pt;padding:5.0pt 5.0pt 5.0pt 5.0pt;height:9.0pt">197</td>
<td style="width:54.35pt;padding:5.0pt 5.0pt 5.0pt 5.0pt;height:   9.0pt">281</td>
</tr>
<tr style="height:9.0pt">
<td style="width:117.3pt;border:none;border-right:solid windowtext 1.0pt;   padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:9.0pt">Substrate</td>
<td style="width:130.3pt;border:none;   padding:5.0pt 5.0pt 5.0pt 5.0pt;height:9.0pt">705</td>
<td style="width:53.5pt;padding:5.0pt 5.0pt 5.0pt 5.0pt;height:9.0pt">457</td>
<td style="width:54.35pt;padding:5.0pt 5.0pt 5.0pt 5.0pt;height:   9.0pt">643</td>
</tr>
<tr style="height:9.0pt">
<td style="width:117.3pt;border:none;border-right:solid windowtext 1.0pt;   padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:9.0pt">Negative</td>
<td style="width:130.3pt;border:none;   padding:5.0pt 5.0pt 5.0pt 5.0pt;height:9.0pt">12461</td>
<td style="width:53.5pt;padding:5.0pt 5.0pt 5.0pt 5.0pt;height:9.0pt">8070</td>
<td style="width:54.35pt;padding:5.0pt 5.0pt 5.0pt 5.0pt;height:   9.0pt">11013</td>
</tr>
<tr style="height:9.0pt">
<td style="width:117.3pt;border-top:none;border-left:none;   border-bottom:solid windowtext 1.0pt;border-right:solid windowtext 1.0pt;      padding:5.0pt 5.0pt 5.0pt 5.0pt;height:9.0pt">
<bold>Total</bold>
</td>
<td style="width:130.3pt;border:none;border-bottom:solid windowtext 1.0pt;      padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:9.0pt">
<bold>16589</bold>
</td>
<td style="width:53.5pt;border:none;border-bottom:solid windowtext 1.0pt;   padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:9.0pt">
<bold>10482</bold>
</td>
<td style="width:54.35pt;border:none;border-bottom:solid windowtext 1.0pt;   padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:9.0pt">
<bold>14456</bold>
</td>
</tr>
</tbody>
</table>
</alternatives>
<attrib>Source: [<xref ref-type="bibr" rid="redalyc_344262226006_ref43">44</xref>].</attrib>
</table-wrap>
</p>
<p>BioInfer, a public resource providing an annotated corpus of biomedical English, is aimed at the development of Information Extraction (IE) systems and their components in the biomedical domain.</p>
<p>The ADE (Adverse Drug Effect) corpus consists of MEDLINE case reports annotated with drugs and conditions (e.g., diseases, signs and symptoms), along with untyped relationships between them.</p>
<p>ChemProt consists of PubMed abstracts annotated with chemical and protein entities. The relations were annotated with 10 chemical-protein relations. According to the shared task description, only 5 out of 10 semantic relation types would be evaluated.</p>
<p>Other important datasets for our study are SemEval-2010_Task_8 datasets <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref44">45</xref>]</sup> and ACE 2005 from LDC (Linguistic Data Consortium) <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref45">46</xref>]</sup>. Both were used in the baseline model, and their statistics are presented below.</p>
<p>
<bold>SemEval 2010 task 8</bold> is focused on multi-way classification between pairs of nominals. The task was designed to compare different approaches to semantic relation classification.</p>
<p>
<bold>ACE-2005</bold> consists of 6 main sources: broadcast news (bn), newswire (nw), broadcast conversation (bc), telephone conversation (cts), weblogs (wl), and usenet (un).</p>
<p>
<bold>reACE</bold> (Edinburgh Regularized Automatic Content Extraction) consists of English broadcast news and newswires with several annotated entities, such as organization, person, fvw (facility, vehicle or weapon), and gpl (geographical, political or location), along with relationships between them. Relationships are classified into five types: general-affiliation, organization-affiliation, part-whole, personal-social, and agent-artifact.</p>
</sec>
<sec>
<title>
<bold>4.2 Measures</bold>
</title>
<p>For the relation classification task, we used the F1-score as our measure for evaluation. The F1-score is defined as the harmonic mean of precision (P) and recall (R), where Precision = TP / (TP + FP). Precision is the ratio of correctly predicted positive relations to the total predicted positive relations. In turn, Recall = TP / (TP + FN). Recall is, intuitively, the ability of the classifier to find all the positive samples. The F1-score is the weighted average of Precision and Recall.</p>
<p>F1 Score = 2*(Recall * Precision) / (Recall + Precision), where TP, FP and FN are true positives, false positives, and false negatives, respectively.</p>
</sec>
<sec>
<title>
<bold>4.3 Hyperparameters and resources</bold>
</title>
<p>We considered a baseline model as a traditional approach to word representations and a CNN model with several windows without the combination of multi-representation. The benefit of multiple window sizes has been demonstrated; here, we used {3, 4} and {2, 3, 4, 5} to generate features. We tested several word representations with sizes d=50 and d=100, while the dimensionality of entity position indicators was d=20. Other parameters are listed in <xref ref-type="table" rid="gt5">Table 5</xref>.</p>
<p>
<table-wrap id="gt5">
<label>Table 5</label>
<caption>
<title>Best hyperparameter configuration in our model</title>
</caption>
<alt-text>Table 5 Best hyperparameter configuration in our model</alt-text>
<alternatives>
<graphic xlink:href="344262226006_gt6.png" position="anchor" orientation="portrait"/>
<table style="width:310.1pt;border-collapse:collapse;border:none;" id="gt6-526564616c7963">
<tbody>
<tr style="height:13.1pt">
<td style="border-top:solid windowtext 1.0pt;border-left:none;border-bottom:   solid windowtext 1.0pt;border-right:none;   padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:13.1pt">
<bold>Parameter</bold>
</td>
<td style="border-top:solid windowtext 1.0pt;border-left:none;border-bottom:   solid windowtext 1.0pt;border-right:none;   padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:13.1pt">
<bold>Range</bold>
</td>
<td style="border-top:solid windowtext 1.0pt;border-left:none;border-bottom:   solid windowtext 1.0pt;border-right:none;   padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:13.1pt">
<bold>Selected</bold>
</td>
</tr>
<tr style="height:10.5pt">
<td style="border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:10.5pt">Dropout rate</td>
<td style="border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:10.5pt">0.2 – 0.5</td>
<td style="border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:10.5pt">0.5</td>
</tr>
<tr style="height:15.45pt">
<td style="border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;height:15.45pt">Weight decay</td>
<td style="border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;height:15.45pt">0 - 1e-10</td>
<td style="border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;height:15.45pt">1e-5</td>
</tr>
<tr style="height:11.85pt">
<td style="border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;height:11.85pt">Optimizer</td>
<td style="border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;height:11.85pt">-</td>
<td style="border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;height:11.85pt">Adam</td>
</tr>
<tr style="height:10.8pt">
<td style="border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;height:10.8pt">Learning rate</td>
<td style="border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;height:10.8pt">[0.1, 0.01, 0.001]</td>
<td style="border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;height:10.8pt">0.001</td>
</tr>
<tr style="height:9.7pt">
<td style="border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;height:9.7pt">Decay learning rate</td>
<td style="border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;height:9.7pt">true, false</td>
<td style="border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;height:9.7pt">True</td>
</tr>
<tr style="height:8.65pt">
<td style="border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;height:8.65pt">Number of epochs</td>
<td style="border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;height:8.65pt">20, 50, 80, 100</td>
<td style="border:none;padding:5.0pt 5.0pt 5.0pt 5.0pt;height:8.65pt">100</td>
</tr>
<tr style="height:15.45pt">
<td style="border:none;border-bottom:solid windowtext 1.0pt;padding:5.0pt 5.0pt 5.0pt 5.0pt;height:15.45pt">Batch size</td>
<td style="border:none;border-bottom:solid windowtext 1.0pt;padding:5.0pt 5.0pt 5.0pt 5.0pt;height:15.45pt">[16, 30, 50, 128]</td>
<td style="border:none;border-bottom:solid windowtext 1.0pt;padding:5.0pt 5.0pt 5.0pt 5.0pt;height:15.45pt">50</td>
</tr>
</tbody>
</table>
</alternatives>
<attrib>Source: Created by the authors.</attrib>
</table-wrap>
</p>
</sec>
</sec>
<sec>
<title>
<bold>5. RESULTS AND DISCUSSION</bold>
</title>
<p>The performance of the datasets SemEval 2010, ADE, BioInfer, Chemprot, and reACE is presented in <xref ref-type="table" rid="gt6">Table 6</xref> with the F1-score. Overall, we can make two observations: (1) The baseline model is not stable for each dataset. Although the predictions of the baseline model are not sufficient to establish what happened, the performance is meant to provide a neutral benchmark to measure the effects of adaptation changes. (2) Our models did not produce, in terms of performance, results comparable to those reported with the baseline model when biomedical domain datasets were used. ADE and reACE contain an imbalanced class distribution, which is perhaps the reason behind their 99.56 and 25.24 performance, respectively.</p>
<p>
<table-wrap id="gt6">
<label>Table 6</label>
<caption>
<title>Weighted F1-scores of the baseline and the four dataset variations (baseline score marked in boldface)</title>
</caption>
<alt-text>Table 6 Weighted F1-scores of the baseline and the four dataset variations (baseline score marked in boldface)</alt-text>
<alternatives>
<graphic xlink:href="344262226006_gt7.png" position="anchor" orientation="portrait"/>
<table style="width:312.35pt;border-collapse:collapse;" id="gt7-526564616c7963">
<tbody>
<tr style="height:1.1pt">
<td style="width:154.95pt;border-top:solid windowtext 1.0pt;   border-left:none;border-bottom:solid windowtext 1.0pt;border-right:none;      padding:5.0pt 5.0pt 5.0pt 5.0pt;height:1.1pt">
<bold>Dataset</bold>
</td>
<td style="width:157.4pt;border-top:solid windowtext 1.0pt;   border-left:none;border-bottom:solid windowtext 1.0pt;border-right:none;      padding:5.0pt 5.0pt 5.0pt 5.0pt;height:1.1pt">
<bold>F1</bold>
</td>
</tr>
<tr style="height:10.9pt">
<td style="width:154.95pt;border:none;   padding:5.0pt 5.0pt 5.0pt 5.0pt;height:10.9pt">SemEval2010</td>
<td style="width:157.4pt;border:none;   padding:5.0pt 5.0pt 5.0pt 5.0pt;height:10.9pt">
<bold>82.76</bold>
</td>
</tr>
<tr style="height:10.9pt">
<td style="width:154.95pt;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:10.9pt">ADE</td>
<td style="width:157.4pt;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:10.9pt">99.56</td>
</tr>
<tr style="height:10.9pt">
<td style="width:154.95pt;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:10.9pt">BioInfer</td>
<td style="width:157.4pt;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:10.9pt">38.50</td>
</tr>
<tr style="height:10.9pt">
<td style="width:154.95pt;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:10.9pt">reACE</td>
<td style="width:157.4pt;padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:10.9pt">25.24</td>
</tr>
<tr style="height:10.9pt">
<td style="width:154.95pt;border:none;border-bottom:solid windowtext 1.0pt;   padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:10.9pt">ChemProt</td>
<td style="width:157.4pt;border:none;border-bottom:solid windowtext 1.0pt;   padding:5.0pt 5.0pt 5.0pt 5.0pt;   height:10.9pt">59.80</td>
</tr>
</tbody>
</table>
</alternatives>
<attrib>Source: Created by the authors.</attrib>
</table-wrap>
</p>
<p>Our hypothesis is that, as sample relations are extracted from an unbalanced corpus, our baseline model is more sensitive and a significant performance gap is produced. Our model, on the ADE corpus, achieved a high F1-score; however, the variation between the lowest and highest values of F1 in other datasets does not guarantee a superior performance.</p>
<p>This is perhaps not surprising since in-domain datasets contain short fragments of texts with scarce grammatical information, from which convolutions can capture relevant biomedical information and achieve a high F1. Moreover, after comparing CNN performance, we hypothesize that the general and biomedical domains are equally or similarly difficult for the RE task when there is a difference across domains and domain models.</p>
<p>With supervised domain training, the model needs to capture knowledge and automatically learn features from the target domain. While we suspect there is still room for improvement, without utilizing domain-specific information, the datasets may differ in ways we cannot account for with our reasoning.</p>
<p>Our baseline model exhibits two main aspects: First, unbalanced corpora have a negative impact on the F1-score.</p>
<p>More importantly, using a corpus with a balanced proportion of positive to negative relations can result in a better performance. Second, there are a number of elements in a deep learning model implementation that make exact replication of the results difficult, particularly performance results, but we compared our modified model with the CNN base model (baseline), and the performance was quite similar. We believe our performance can be attributed to (1) vector representation and (2) class imbalance from the dataset. Thus, in-domain word embeddings and position embedding combinations are better for our model than out-of-domain word embeddings, although they cannot achieve results comparable to those of the baseline.</p>
<p>We presented a multi-step reasoning to train a model for other domains in cases in which data with other distribution and classes is available and the task is the same.</p>
<p>We also showed that our reasoning for model adaptation did not achieve a performance similar to that of the baseline model. Therefore, we carried out corpus-based exploration to address the adaptation of a deep learning model. We evaluated the DL model on different datasets. We also tested the deep learning model to extract semantic relations between entities implementing a similar experimental setup to that in the study by Zeng et al. <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref0">1</xref>]</sup>.</p>
<p>After training and testing, our DL model should have learned how to extract semantic relationships due to the automatic learning of similar in-domain and out-of-domain features. However, our results confirm the need for a balanced dataset and additional information about the in-domain task. The proportion of positive and negative relations and the amount of annotated data in the samples are different in each dataset (ADE, BioInfer, reACE, Chemprot, and SemEval).</p>
<p>Nevertheless, the problem of class imbalance between datasets has been reported in the literature <sup>[<xref ref-type="bibr" rid="redalyc_344262226006_ref46">47</xref>]</sup>.</p>
<p>We observed that the model is sensitive to word representations, which play a significant role in model training. There are several embedding representations: position embedding (which represents the relative positions of entities and words in the sentence), medical and biological embedding (which contains specific information), and in-domain word embedding (which includes methods that can generate domain-sensitive word embeddings).</p>
<p>Future studies can consider a similar reasoning, exploring, with combinations, different word representations (static, contextualized, with domain knowledge, and others).</p>
</sec>
<sec>
<title>
<bold>6. CONCLUSIONS</bold>
</title>
<p>In this paper, we proposed a DL model adapted to a new domain, more specifically, the RE task for the biomedical domain. We used an architecture to transfer the RE task from the generic domain to a biomedical one. After pre-processing the dataset, we obtained experimental results on several benchmark datasets. Nevertheless, we cannot confirm any advantage of the proposed model because it did not achieve a similar performance on different biomedical datasets or results comparable to those of SemEval 2010, which reached an F1-score of 82.76 (Baseline). Even though reACE, BioInfer, Chemprot, and ADE exhibited F1-scores of 25.24, 38.50, 59.80, and 99.56, respectively, these outputs cannot be rejected. We also analyzed the errors and discussed the reasons behind our results.</p>
<p>Finally, our study explored different representations and results to avoid the duplicity of research efforts in the development of future systems.</p>
</sec>
</body>
<back>
<ref-list>
<title>
<bold>7. REFERENCES</bold>
</title>
<ref id="redalyc_344262226006_ref0">
<label>[1]</label>
<mixed-citation>[1]    D. Zeng, K. Liu, S. Lai, G. Zhou, and J. Zhao, “Relation Classification via Convolutional Deep Neural Network,” in <italic>Proceedings of COLING 2014, the 25th International Conference on Computational Linguistics: Technical Papers</italic>, Dublin, 2014, pp. 2335–2344. Available: <ext-link ext-link-type="uri" xlink:href="https://www.aclweb.org/anthology/C14-1220">https://www.aclweb.org/anthology/C14-1220</ext-link>/</mixed-citation>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Zeng</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Lai</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>J.</given-names>
</name>
</person-group>
<source>Relation Classification via Convolutional Deep Neural Network</source>
<year>2014</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="https://www.aclweb.org/anthology/C14-1220">https://www.aclweb.org/anthology/C14-1220</ext-link>
</comment>
<conf-name>Proceedings of COLING 2014, the 25th International Conference on Computational Linguistics: Technical Papers</conf-name>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref1">
<label>[2]</label>
<mixed-citation>[2]    Y. Lin, S. Shen, Z. Liu, H. Luan, and M. Sun, “Neural Relation Extraction with Selective Attention over Instances,” <italic>in Proceedings of the 54th Annual Meeting of the Association for Computational Linguistics</italic>, Berlín, 2016, vol. 1, pp. 2124–2133. <ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.18653/v1/P16-1200">http://dx.doi.org/10.18653/v1/P16-1200</ext-link>
</mixed-citation>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Lin</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Shen</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Luan</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>M.</given-names>
</name>
</person-group>
<source>Neural Relation Extraction with Selective Attention over Instances</source>
<year>2016</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.18653/v1/P16-1200">http://dx.doi.org/10.18653/v1/P16-1200</ext-link>
</comment>
<conf-name>Proceedings of the 54th Annual Meeting of the Association for Computational Linguistics</conf-name>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref2">
<label>[3]</label>
<mixed-citation>[3]    X. Ren et al., “Cotype: Joint extraction of typed entities and relations with knowledge bases,” <italic>in Proceedings of the 26th International Conference on World Wide Web</italic>, Perth, 2017, pp. 1015–1024. <ext-link ext-link-type="uri" xlink:href="http://doi.org/10.1145/3038912.3052708">http://doi.org/10.1145/3038912.3052708</ext-link>
</mixed-citation>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Ren</surname>
<given-names>X.</given-names>
</name>
</person-group>
<source>Cotype: Joint extraction of typed entities and relations with knowledge bases</source>
<year>2017</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="http://doi.org/10.1145/3038912.3052708">http://doi.org/10.1145/3038912.3052708</ext-link>
</comment>
<conf-name>Proceedings of the 26th International Conference on World Wide Web</conf-name>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref3">
<label>[4]</label>
<mixed-citation>[4]    K. Toutanova, D. Chen, P. Pantel, H. Poon, P. Choudhury, and M. Gamon, “Representing Text for Joint Embedding of Text and Knowledge Bases,” <italic>in Proceedings of the 2015 Conference on Empirical Methods in Natural Language Processing</italic>, Lisbon, 2015, pp. 1499–1509. <ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.18653/v1/D15-1174">http://dx.doi.org/10.18653/v1/D15-1174</ext-link>
</mixed-citation>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Toutanova</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Pantel</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Poon</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Choudhury</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Gamon</surname>
<given-names>M.</given-names>
</name>
</person-group>
<source>Representing Text for Joint Embedding of Text and Knowledge Bases</source>
<year>2015</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.18653/v1/D15-1174">http://dx.doi.org/10.18653/v1/D15-1174</ext-link>
</comment>
<conf-name>Proceedings of the 2015 Conference on Empirical Methods in Natural Language Processing</conf-name>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref4">
<label>[5]</label>
<mixed-citation>[5]    N. Konstantinova, “Review of relation extraction methods: What is new out there?” <italic>in International Conference on Analysis of Images, Social Networks and Texts</italic>, Switzerland, 2014, pp. 15–28. <ext-link ext-link-type="uri" xlink:href="http://doi.org/10.1007/978-3-319-12580-0_2">http://doi.org/10.1007/978-3-319-12580-0_2</ext-link>
</mixed-citation>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Konstantinova</surname>
<given-names>N.</given-names>
</name>
</person-group>
<source>Review of relation extraction methods: What is new out there?</source>
<year>2014</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="http://doi.org/10.1007/978-3-319-12580-0_2">http://doi.org/10.1007/978-3-319-12580-0_2</ext-link>
</comment>
<conf-name>International Conference on Analysis of Images, Social Networks and Texts</conf-name>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref5">
<label>[6]</label>
<mixed-citation>[6]    N. Kambhatla, “Combining lexical, syntactic, and semantic features with maximum entropy models for extracting relations,” <italic>in Proceedings of the ACL 2004 on Interactive poster and demonstration sessions</italic>, Barcelona, 2004, pp. 1–4. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3115/1219044.1219066">https://doi.org/10.3115/1219044.1219066</ext-link>
</mixed-citation>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Kambhatla</surname>
<given-names>N.</given-names>
</name>
</person-group>
<source>Combining lexical, syntactic, and semantic features with maximum entropy models for extracting relations</source>
<year>2004</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3115/1219044.1219066">https://doi.org/10.3115/1219044.1219066</ext-link>
</comment>
<conf-name>Proceedings of the ACL 2004 on Interactive poster and demonstration sessions</conf-name>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref6">
<label>[7]</label>
<mixed-citation>[7]    R. C. Bunescu and R. J. Mooney, “A shortest path dependency kernel for relation extraction,” in <italic>Proceedings of the conference on Human Language Technology and Empirical Methods in Natural Language Processing - HLT ’05</italic>, Vancouver, 2005, pp. 724–731. Available: <ext-link ext-link-type="uri" xlink:href="https://www.aclweb.org/anthology/H05-1091">https://www.aclweb.org/anthology/H05-1091</ext-link>/</mixed-citation>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Bunescu</surname>
<given-names>R. C.</given-names>
</name>
<name>
<surname>Mooney</surname>
<given-names>R. J.</given-names>
</name>
</person-group>
<source>A shortest path dependency kernel for relation extraction</source>
<year>2005</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="https://www.aclweb.org/anthology/H05-1091">https://www.aclweb.org/anthology/H05-1091</ext-link>
</comment>
<conf-name>Proceedings of the conference on Human Language Technology and Empirical Methods in Natural Language Processing - HLT ’05</conf-name>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref7">
<label>[8]</label>
<mixed-citation>[8]    R. J. Mooney and R. C. Bunescu, “Subsequence kernels for relation extraction,” in <italic>Advances in neural information processing systems</italic>, 2006, pp. 171–178. Available: <ext-link ext-link-type="uri" xlink:href="http://papers.nips.cc/paper/2787-subsequence-kernels-for-relation-extraction.pdf">http://papers.nips.cc/paper/2787-subsequence-kernels-for-relation-extraction.pdf</ext-link>
</mixed-citation>
<element-citation publication-type="book">
<person-group person-group-type="author">
<name>
<surname>Mooney</surname>
<given-names>R. J.</given-names>
</name>
<name>
<surname>Bunescu</surname>
<given-names>R. C.</given-names>
</name>
</person-group>
<source>Advances in neural information processing systems</source>
<year>2006</year>
<chapter-title>Subsequence kernels for relation extraction</chapter-title>
<comment>
<ext-link ext-link-type="uri" xlink:href="http://papers.nips.cc/paper/2787-subsequence-kernels-for-relation-extraction.pdf">http://papers.nips.cc/paper/2787-subsequence-kernels-for-relation-extraction.pdf</ext-link>
</comment>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref8">
<label>[9]</label>
<mixed-citation>[9]    M. Banko, M. J. Cafarella, S. Soderland, M. Broadhead, and O. Etzioni, “Open information extraction from the web,” in <italic>IJCAI</italic>, 2007, vol. 7, pp. 2670–2676. Available: <ext-link ext-link-type="uri" xlink:href="https://www.aaai.org/Papers/IJCAI/2007/IJCAI07-429.pdf">https://www.aaai.org/Papers/IJCAI/2007/IJCAI07-429.pdf</ext-link>
</mixed-citation>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Banko</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Cafarella</surname>
<given-names>M. J.</given-names>
</name>
<name>
<surname>Soderland</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Broadhead</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Etzioni</surname>
<given-names>O.</given-names>
</name>
</person-group>
<source>Open information extraction from the web</source>
<year>2007</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="https://www.aaai.org/Papers/IJCAI/2007/IJCAI07-429.pdf">https://www.aaai.org/Papers/IJCAI/2007/IJCAI07-429.pdf</ext-link>
</comment>
<conf-name>IJCAI</conf-name>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref9">
<label>[10]</label>
<mixed-citation>[10] R. Socher, B. Huval, C. D. Manning, and A. Y. Ng, “Semantic compositionality through recursive matrix-vector spaces,” in <italic>Proceedings of the 2012 Joint Conference on Empirical Methods in Natural Language Processing and Computational Natural Language Learning</italic>, Jeju Island, 2012, pp. 1201–1211. Available: <ext-link ext-link-type="uri" xlink:href="https://www.aclweb.org/anthology/D12-1110">https://www.aclweb.org/anthology/D12-1110</ext-link></mixed-citation>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Socher</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Huval</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Manning</surname>
<given-names>C. D.</given-names>
</name>
<name>
<surname>Ng</surname>
<given-names>A. Y.</given-names>
</name>
</person-group>
<source>Semantic compositionality through recursive matrix-vector spaces</source>
<year>2012</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="https://www.aclweb.org/anthology/D12-1110">https://www.aclweb.org/anthology/D12-1110</ext-link>
</comment>
<conf-name>Proceedings of the 2012 Joint Conference on Empirical Methods in Natural Language Processing and Computational Natural Language Learning</conf-name>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref10">
<label>[11]</label>
<mixed-citation>[11]  D. Zhang and D. Wang, “Relation Classification: CNN or RNN?,” in <italic>Natural Language Understanding and Intelligent Applications</italic>, Springer, Kunming, 2016, pp. 665–675. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1007/978-3-319-50496-4_60">https://doi.org/10.1007/978-3-319-50496-4_60</ext-link>
</mixed-citation>
<element-citation publication-type="book">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>D.</given-names>
</name>
</person-group>
<source>Natural Language Understanding and Intelligent Applications</source>
<year>2016</year>
<chapter-title>Relation Classification: CNN or RNN?</chapter-title>
<comment>
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1007/978-3-319-50496-4_60">https://doi.org/10.1007/978-3-319-50496-4_60</ext-link>
</comment>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref11">
<label>[12]</label>
<mixed-citation>[12]  S. Lim and J. Kang, “Chemical–gene relation extraction using recursive neural network,” <italic>Database</italic>, vol. 2018, Jun. 2018. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/database/bay060">https://doi.org/10.1093/database/bay060</ext-link>
</mixed-citation>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lim</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Kang</surname>
<given-names>J.</given-names>
</name>
</person-group>
<article-title>Chemical–gene relation extraction using recursive neural network</article-title>
<source>Database</source>
<year>2018</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/database/bay060">https://doi.org/10.1093/database/bay060</ext-link>
</comment>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref12">
<label>[13]</label>
<mixed-citation>[13]  Y. Xu, L. Mou, G. Li, Y. Chen, H. Peng, and Z. Jin, “Classifying relations via long short term memory networks along shortest dependency paths,” in <italic>Proceedings of the 2015 Conference on Empirical Methods in Natural Language Processing</italic>, Lisbon, 2015, pp. 1785–1794. <ext-link ext-link-type="uri" xlink:href="http://doi.org/10.18653/v1/d15-1206">http://doi.org/10.18653/v1/d15-1206</ext-link>
</mixed-citation>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Xu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Mou</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Peng</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Jin</surname>
<given-names>Z.</given-names>
</name>
</person-group>
<source>Classifying relations via long short term memory networks along shortest dependency paths</source>
<year>2015</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="http://doi.org/10.18653/v1/d15-1206">http://doi.org/10.18653/v1/d15-1206</ext-link>
</comment>
<conf-name>Proceedings of the 2015 conference on empirical methods in natural language processing</conf-name>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref13">
<label>[14]</label>
<mixed-citation>[14] S. Zhang, D. Zheng, X. Hu, and M. Yang, “Bidirectional long short-term memory networks for relation classification,” in <italic>Proceedings of the 29th Pacific Asia conference on language, information and computation</italic>, Shanghai, 2015, pp. 73–78. Available: <ext-link ext-link-type="uri" xlink:href="https://www.aclweb.org/anthology/Y15-1009.pdf">https://www.aclweb.org/anthology/Y15-1009.pdf</ext-link>
</mixed-citation>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Zheng</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Hu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>M.</given-names>
</name>
</person-group>
<source>Bidirectional long short-term memory networks for relation classification</source>
<year>2015</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="https://www.aclweb.org/anthology/Y15-1009.pdf">https://www.aclweb.org/anthology/Y15-1009.pdf</ext-link>
</comment>
<conf-name>Proceedings of the 29th Pacific Asia conference on language, information and computation</conf-name>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref14">
<label>[15]</label>
<mixed-citation>[15] R. Zhang, F. Meng, Y. Zhou, and B. Liu, “Relation classification via recurrent neural network with attention and tensor layers,” <italic>Big Data Min. Anal.</italic>, vol. 1, no. 3, pp. 234–244, Sep. 2018. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.26599/BDMA.2018.9020022">https://doi.org/10.26599/BDMA.2018.9020022</ext-link>
</mixed-citation>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Meng</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>B.</given-names>
</name>
</person-group>
<article-title>Relation classification via recurrent neural network with attention and tensor layers</article-title>
<source>Big Data Min. Anal.</source>
<year>2018</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.26599/BDMA.2018.9020022">https://doi.org/10.26599/BDMA.2018.9020022</ext-link>
</comment>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref15">
<label>[16]</label>
<mixed-citation>[16]  T. H. Nguyen and R. Grishman, “Relation Extraction: Perspective from Convolutional Neural Networks,” in <italic>Proceedings of the 1st Workshop on Vector Space Modeling for Natural Language Processing</italic>, Denver, 2015, pp. 39–48. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3115/v1/W15-1506">https://doi.org/10.3115/v1/W15-1506</ext-link>
</mixed-citation>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Nguyen</surname>
<given-names>T. H.</given-names>
</name>
<name>
<surname>Grishman</surname>
<given-names>R.</given-names>
</name>
</person-group>
<source>Relation Extraction: Perspective from Convolutional Neural Networks</source>
<year>2015</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3115/v1/W15-1506">https://doi.org/10.3115/v1/W15-1506</ext-link>
</comment>
<conf-name>Proceedings of the 1st Workshop on Vector Space Modeling for Natural Language Processing</conf-name>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref16">
<label>[17]</label>
<mixed-citation>[17] C. dos Santos, B. Xiang, and B. Zhou, “Classifying Relations by Ranking with Convolutional Neural Networks,” in <italic>Proceedings of the 53rd Annual Meeting of the Association for Computational Linguistics and the 7th International Joint Conference on Natural Language Processing (Volume 1: Long Papers)</italic>, Beijing, 2015, pp. 626–634. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3115/v1/P15-1061">https://doi.org/10.3115/v1/P15-1061</ext-link>
</mixed-citation>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>dos Santos</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Xiang</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>B.</given-names>
</name>
</person-group>
<source>Classifying Relations by Ranking with Convolutional Neural Networks</source>
<year>2015</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3115/v1/P15-1061">https://doi.org/10.3115/v1/P15-1061</ext-link>
</comment>
<conf-name>Proceedings of the 53rd Annual Meeting of the Association for Computational Linguistics and the 7th International Joint Conference on Natural Language Processing (Volume 1: Long Papers)</conf-name>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref17">
<label>[18]</label>
<mixed-citation>[18] K. Xu, Y. Feng, S. Huang, and D. Zhao, “Semantic relation classification via convolutional neural networks with simple negative sampling,” in <italic>Proceedings of the 2015 Conference on Empirical Methods in Natural Language Processing, </italic>Lisbon, 2015, pp. 536-540. <ext-link ext-link-type="uri" xlink:href="http://doi.org/10.18653/v1/d15-1062">http://doi.org/10.18653/v1/d15-1062</ext-link>
</mixed-citation>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Xu</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Feng</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>D.</given-names>
</name>
</person-group>
<source>Semantic relation classification via convolutional neural networks with simple negative sampling</source>
<year>2015</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="http://doi.org/10.18653/v1/d15-1062">http://doi.org/10.18653/v1/d15-1062</ext-link>
</comment>
<conf-name>Proceedings of the 2015 Conference on Empirical Methods in Natural Language Processing</conf-name>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref18">
<label>[19]</label>
<mixed-citation>[19] A. Airola, S. Pyysalo, J. Björne, T. Pahikkala, F. Ginter, and T. Salakoski, “All-paths graph kernel for protein-protein interaction extraction with evaluation of cross-corpus learning,” <italic>BMC Bioinformatics</italic>, vol. 9, no. S 2, pp. 1-12, Nov. 2008.      <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1186/1471-2105-9-S11-S2">https://doi.org/10.1186/1471-2105-9-S11-S2</ext-link>
</mixed-citation>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Airola</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Pyysalo</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Björne</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Pahikkala</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Ginter</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Salakoski</surname>
<given-names>T.</given-names>
</name>
</person-group>
<article-title>All-paths graph kernel for protein-protein interaction extraction with evaluation of cross-corpus learning</article-title>
<source>BMC Bioinformatics</source>
<year>2008</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1186/1471-2105-9-S11-S2">https://doi.org/10.1186/1471-2105-9-S11-S2</ext-link>
</comment>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref19">
<label>[20]</label>
<mixed-citation>[20]  S. Kim, J. Yoon, J. Yang, and S. Park, “Walk-weighted subsequence kernels for protein-protein interaction extraction,” <italic>BMC Bioinformatics</italic>, vol. 11, no. 107, pp. 112–119, Feb. 2010. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1186/1471-2105-11-107">https://doi.org/10.1186/1471-2105-11-107</ext-link>
</mixed-citation>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kim</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Yoon</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Park</surname>
<given-names>S.</given-names>
</name>
</person-group>
<article-title>Walk-weighted subsequence kernels for protein-protein interaction extraction</article-title>
<source>BMC Bioinformatics</source>
<year>2010</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1186/1471-2105-11-107">https://doi.org/10.1186/1471-2105-11-107</ext-link>
</comment>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref20">
<label>[21]</label>
<mixed-citation>[21]  I. Segura-Bedmar, P. Martinez, and C. de Pablo-Sánchez, “Using a shallow linguistic kernel for drug–drug interaction extraction,” <italic>J. Biomed. Inform.</italic>, vol. 44, no. 5, pp. 789–804, Oct. 2011. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.jbi.2011.04.005">https://doi.org/10.1016/j.jbi.2011.04.005</ext-link>
</mixed-citation>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Segura-Bedmar</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Martinez</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>de Pablo-Sánchez</surname>
<given-names>C.</given-names>
</name>
</person-group>
<article-title>Using a shallow linguistic kernel for drug–drug interaction extraction</article-title>
<source>J. Biomed. Inform.</source>
<year>2011</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.jbi.2011.04.005">https://doi.org/10.1016/j.jbi.2011.04.005</ext-link>
</comment>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref21">
<label>[22]</label>
<mixed-citation>[22]  Y. Zhang, H. Lin, Z. Yang, J. Wang, and Y. Li, “A single kernel-based approach to extract drug-drug interactions from biomedical literature,” <italic>PLoS One</italic>, vol. 7, no. 11, pp. e48901, Nov. 2012.  <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1371/journal.pone.0048901">https://doi.org/10.1371/journal.pone.0048901</ext-link>
</mixed-citation>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Lin</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Y.</given-names>
</name>
</person-group>
<article-title>A single kernel-based approach to extract drug-drug interactions from biomedical literature</article-title>
<source>PLoS One</source>
<year>2012</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1371/journal.pone.0048901">https://doi.org/10.1371/journal.pone.0048901</ext-link>
</comment>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref22">
<label>[23]</label>
<mixed-citation>[23]  K. Hashimoto, M. Miwa, Y. Tsuruoka, and T. Chikayama, “Simple customization of recursive neural networks for semantic relation classification,” in <italic>Proceedings of the 2013 Conference on Empirical Methods in Natural Language Processing</italic>, Seattle, 2013, pp. 1372–1376. Available: <ext-link ext-link-type="uri" xlink:href="https://www.aclweb.org/anthology/D13-1137">https://www.aclweb.org/anthology/D13-1137</ext-link></mixed-citation>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Hashimoto</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Miwa</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Tsuruoka</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Chikayama</surname>
<given-names>T.</given-names>
</name>
</person-group>
<source>Simple customization of recursive neural networks for semantic relation classification</source>
<year>2013</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="https://www.aclweb.org/anthology/D13-1137">https://www.aclweb.org/anthology/D13-1137</ext-link>
</comment>
<conf-name>Proceedings of the 2013 Conference on Empirical Methods in Natural Language Processing</conf-name>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref23">
<label>[24]</label>
<mixed-citation>[24]  Y. Shen and X. Huang, “Attention-based convolutional neural network for semantic relation extraction,” in <italic>Proceedings of COLING 2016, the 26th International Conference on Computational Linguistics: Technical Papers</italic>, Osaka, 2016, pp. 2526–2536. Available: <ext-link ext-link-type="uri" xlink:href="https://www.aclweb.org/anthology/C16-1238">https://www.aclweb.org/anthology/C16-1238</ext-link></mixed-citation>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Shen</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>X.</given-names>
</name>
</person-group>
<source>Attention-based convolutional neural network for semantic relation extraction</source>
<year>2016</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="https://www.aclweb.org/anthology/C16-1238">https://www.aclweb.org/anthology/C16-1238</ext-link>
</comment>
<conf-name>Proceedings of COLING 2016, the 26th International Conference on Computational Linguistics: Technical Papers</conf-name>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref24">
<label>[25]</label>
<mixed-citation>[25]  L. Wang, Z. Cao, G. de Melo, and Z. Liu, “Relation classification via multi-level attention cnns,” in <italic>Proceedings of the 54th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)</italic>, Berlin, 2016, vol. 1, pp. 1298–1307. <ext-link ext-link-type="uri" xlink:href="http://doi.org/10.18653/v1/P16-1123">http://doi.org/10.18653/v1/P16-1123</ext-link>
</mixed-citation>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Cao</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>de Melo</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>Z.</given-names>
</name>
</person-group>
<source>Relation classification via multi-level attention cnns</source>
<year>2016</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="http://doi.org/10.18653/v1/P16-1123">http://doi.org/10.18653/v1/P16-1123</ext-link>
</comment>
<conf-name>Proceedings of the 54th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)</conf-name>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref25">
<label>[26]</label>
<mixed-citation>[26]  J. Lee, S. Seo, and Y. S. Choi, “Semantic Relation Classification via Bidirectional LSTM Networks with Entity-aware Attention using Latent Entity Typing,” <italic>Symmetry</italic>, vol. 11, no. 6, Jun. 2019. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3390/sym11060785">https://doi.org/10.3390/sym11060785</ext-link>
</mixed-citation>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lee</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Seo</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Choi</surname>
<given-names>Y. S.</given-names>
</name>
</person-group>
<article-title>Semantic Relation Classification via Bidirectional LSTM Networks with Entity-aware Attention using Latent Entity Typing</article-title>
<source>Symmetry</source>
<year>2019</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3390/sym11060785">https://doi.org/10.3390/sym11060785</ext-link>
</comment>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref26">
<label>[27]</label>
<mixed-citation>[27]  M. Xiao and C. Liu, “Semantic relation classification via hierarchical recurrent neural network with attention,” in <italic>Proceedings of COLING 2016, the 26th International Conference on Computational Linguistics: Technical Papers</italic>, Osaka, 2016, pp. 1254–1263. Available: <ext-link ext-link-type="uri" xlink:href="https://www.aclweb.org/anthology/C16-1119">https://www.aclweb.org/anthology/C16-1119</ext-link></mixed-citation>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Xiao</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>C.</given-names>
</name>
</person-group>
<source>Semantic relation classification via hierarchical recurrent neural network with attention</source>
<year>2016</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="https://www.aclweb.org/anthology/C16-1119">https://www.aclweb.org/anthology/C16-1119</ext-link>
</comment>
<conf-name>Proceedings of COLING 2016, the 26th International Conference on Computational Linguistics: Technical Papers</conf-name>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref27">
<label>[28]</label>
<mixed-citation>[28]  P. Zhou et al., “Attention-based bidirectional long short-term memory networks for relation classification,” in <italic>Proceedings of the 54th Annual Meeting of the Association for Computational Linguistics (Volume 2: Short Papers)</italic>, Berlin, 2016, pp. 207–212. <ext-link ext-link-type="uri" xlink:href="http://doi.org/10.18653/v1/p16-2034">http://doi.org/10.18653/v1/p16-2034</ext-link>
</mixed-citation>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Zhou</surname>
<given-names>P.</given-names>
</name>
</person-group>
<source>Attention-based bidirectional long short-term memory networks for relation classification</source>
<year>2016</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="http://doi.org/10.18653/v1/p16-2034">http://doi.org/10.18653/v1/p16-2034</ext-link>
</comment>
<conf-name>Proceedings of the 54th Annual Meeting of the Association for Computational Linguistics (Volume 2: Short Papers)</conf-name>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref28">
<label>[29]</label>
<mixed-citation>[29]  R. Cai, X. Zhang, and H. Wang, “Bidirectional recurrent convolutional neural network for relation classification,” in <italic>Proceedings of the 54th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)</italic>, Berlin, 2016, pp. 756–765. <ext-link ext-link-type="uri" xlink:href="http://doi.org/10.18653/v1/p16-1072">http://doi.org/10.18653/v1/p16-1072</ext-link>
</mixed-citation>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Cai</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>H.</given-names>
</name>
</person-group>
<source>Bidirectional recurrent convolutional neural network for relation classification</source>
<year>2016</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="http://doi.org/10.18653/v1/p16-1072">http://doi.org/10.18653/v1/p16-1072</ext-link>
</comment>
<conf-name>Proceedings of the 54th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)</conf-name>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref29">
<label>[30]</label>
<mixed-citation>[30]  Y. Xu et al., “Improved relation classification by deep recurrent neural networks with data augmentation,” <italic>ArXiv Prepr.</italic>, Oct. 2016. Available: <ext-link ext-link-type="uri" xlink:href="https://arxiv.org/abs/1601.03651">https://arxiv.org/abs/1601.03651</ext-link>
</mixed-citation>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xu</surname>
<given-names>Y.</given-names>
</name>
</person-group>
<article-title>Improved relation classification by deep recurrent neural networks with data augmentation</article-title>
<source>ArXiv Prepr.</source>
<year>2016</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="https://arxiv.org/abs/1601.03651">https://arxiv.org/abs/1601.03651</ext-link>
</comment>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref30">
<label>[31]</label>
<mixed-citation>[31]  Y. Liu, F. Wei, S. Li, H. Ji, M. Zhou, and H. Wang, “A dependency-based neural network for relation classification,” <italic>ArXiv Prepr.</italic>, pp. 1-10, Jul. 2015. Available: <ext-link ext-link-type="uri" xlink:href="https://arxiv.org/pdf/1507.04646.pdf">https://arxiv.org/pdf/1507.04646.pdf</ext-link>
</mixed-citation>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Wei</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Ji</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>H.</given-names>
</name>
</person-group>
<article-title>A dependency-based neural network for relation classification</article-title>
<source>ArXiv Prepr.</source>
<year>2015</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="https://arxiv.org/pdf/1507.04646.pdf">https://arxiv.org/pdf/1507.04646.pdf</ext-link>
</comment>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref31">
<label>[32]</label>
<mixed-citation>[32]  M. Yu, M. Gormley, and M. Dredze, “Factor-based compositional embedding models,” in <italic>NIPS Workshop on Learning Semantics</italic>, 2014, pp. 95-101. Available: <ext-link ext-link-type="uri" xlink:href="https://www.cs.cmu.edu/~mgormley/papers/yu+gormley+dredze.nipsw.2014.pdf">https://www.cs.cmu.edu/~mgormley/papers/yu+gormley+dredze.nipsw.2014.pdf</ext-link>
</mixed-citation>
<element-citation publication-type="book">
<person-group person-group-type="author">
<name>
<surname>Yu</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Gormley</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Dredze</surname>
<given-names>M.</given-names>
</name>
</person-group>
<source>NIPS Workshop on Learning Semantics</source>
<year>2014</year>
<chapter-title>Factor-based compositional embedding models</chapter-title>
<comment>
<ext-link ext-link-type="uri" xlink:href="https://www.cs.cmu.edu/~mgormley/papers/yu+gormley+dredze.nipsw.2014.pdf">https://www.cs.cmu.edu/~mgormley/papers/yu+gormley+dredze.nipsw.2014.pdf</ext-link>
</comment>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref32">
<label>[33]</label>
<mixed-citation>[33]  S. Lai, L. Xu, K. Liu, and J. Zhao, “Recurrent convolutional neural networks for text classification,” in <italic>Proceedings of the Twenty-Ninth AAAI Conference on Artificial Intelligence</italic>, Austin, 2015, pp. 2267-2273. Available: <ext-link ext-link-type="uri" xlink:href="https://dl.acm.org/doi/10.5555/2886521.2886636">https://dl.acm.org/doi/10.5555/2886521.2886636</ext-link>
</mixed-citation>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Lai</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>J.</given-names>
</name>
</person-group>
<source>Recurrent convolutional neural networks for text classification</source>
<year>2015</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="https://dl.acm.org/doi/10.5555/2886521.2886636">https://dl.acm.org/doi/10.5555/2886521.2886636</ext-link>
</comment>
<conf-name>Proceedings of the Twenty-Ninth AAAI Conference on Artificial Intelligence</conf-name>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref33">
<label>[34]</label>
<mixed-citation>[34]  D. Zeng, K. Liu, Y. Chen, and J. Zhao, “Distant supervision for relation extraction via piecewise convolutional neural networks,” in <italic>Proceedings of the 2015 Conference on Empirical Methods in Natural Language Processing</italic>, Lisbon, 2015, pp. 1753–1762. <ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.18653/v1/D15-1203">http://dx.doi.org/10.18653/v1/D15-1203</ext-link>
</mixed-citation>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Zeng</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>J.</given-names>
</name>
</person-group>
<source>Distant supervision for relation extraction via piecewise convolutional neural networks</source>
<year>2015</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.18653/v1/D15-1203">http://dx.doi.org/10.18653/v1/D15-1203</ext-link>
</comment>
<conf-name>Proceedings of the 2015 Conference on Empirical Methods in Natural Language Processing</conf-name>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref34">
<label>[35]</label>
<mixed-citation>[35]  S. Pawar, G. K. Palshikar, and P. Bhattacharyya, “Relation Extraction: A Survey,” <italic>ArXiv Prepr</italic>. ArXiv171205191, Dec. 2017. Available: <ext-link ext-link-type="uri" xlink:href="https://arxiv.org/pdf/1712.05191.pdf">https://arxiv.org/pdf/1712.05191.pdf</ext-link>
</mixed-citation>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pawar</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Palshikar</surname>
<given-names>G. K.</given-names>
</name>
<name>
<surname>Bhattacharyya</surname>
<given-names>P.</given-names>
</name>
</person-group>
<article-title>Relation Extraction: A Survey</article-title>
<source>ArXiv Prepr.</source>
<year>2017</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="https://arxiv.org/pdf/1712.05191.pdf">https://arxiv.org/pdf/1712.05191.pdf</ext-link>
</comment>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref35">
<label>[36]</label>
<mixed-citation>[36]  J. Legrand et al., “PGxCorpus: A Manually Annotated Corpus for Pharmacogenomics,” <italic>bioRxiv</italic>, Jan. 2019. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1101/534388">https://doi.org/10.1101/534388</ext-link>
</mixed-citation>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Legrand</surname>
<given-names>J.</given-names>
</name>
</person-group>
<article-title>PGxCorpus: A Manually Annotated Corpus for Pharmacogenomics</article-title>
<source>bioRxiv</source>
<year>2019</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1101/534388">https://doi.org/10.1101/534388</ext-link>
</comment>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref36">
<label>[37]</label>
<mixed-citation>[37]  Y. LeCun, L. Bottou, Y. Bengio, and P. Haffner, “Gradient-based learning applied to document recognition,” <italic>Proc. IEEE</italic>, vol. 86, no. 11, pp. 2278–2324, Nov. 1998. <ext-link ext-link-type="uri" xlink:href="http://doi.org/10.1109/5.726791">http://doi.org/10.1109/5.726791</ext-link>
</mixed-citation>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>LeCun</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Bottou</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Bengio</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Haffner</surname>
<given-names>P.</given-names>
</name>
</person-group>
<article-title>Gradient-based learning applied to document recognition</article-title>
<source>Proc. IEEE</source>
<year>1998</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="http://doi.org/10.1109/5.726791">http://doi.org/10.1109/5.726791</ext-link>
</comment>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref37">
<label>[38]</label>
<mixed-citation>[38]  T. Mikolov, I. Sutskever, K. Chen, G. S. Corrado, and J. Dean, “Distributed representations of words and phrases and their compositionality,” <italic>in Advances in neural information processing systems</italic>, Lake Tahoe, Nevada, 2013, pp. 3111–3119. Available: <ext-link ext-link-type="uri" xlink:href="https://papers.nips.cc/paper/5021-distributed-representations-of-words-and-phrases-and-their-compositionality.pdf">https://papers.nips.cc/paper/5021-distributed-representations-of-words-and-phrases-and-their-compositionality.pdf</ext-link>
</mixed-citation>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Mikolov</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Sutskever</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Corrado</surname>
<given-names>G. S.</given-names>
</name>
<name>
<surname>Dean</surname>
<given-names>J.</given-names>
</name>
</person-group>
<source>Distributed representations of words and phrases and their compositionality</source>
<year>2013</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="https://papers.nips.cc/paper/5021-distributed-representations-of-words-and-phrases-and-their-compositionality.pdf">https://papers.nips.cc/paper/5021-distributed-representations-of-words-and-phrases-and-their-compositionality.pdf</ext-link>
</comment>
<conf-name>Advances in neural information processing systems</conf-name>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref38">
<label>[39]</label>
<mixed-citation>[39]  J. Pennington, R. Socher, and C. Manning, “Glove: Global Vectors for Word Representation,” <italic>in Proceedings of the 2014 Conference on Empirical Methods in Natural Language Processing (EMNLP)</italic>, Doha, Qatar, 2014, pp. 1532–1543. <ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.3115/v1/D14-1162">http://dx.doi.org/10.3115/v1/D14-1162</ext-link>
</mixed-citation>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Pennington</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Socher</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Manning</surname>
<given-names>C.</given-names>
</name>
</person-group>
<source>Glove: Global Vectors for Word Representation</source>
<year>2014</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.3115/v1/D14-1162">http://dx.doi.org/10.3115/v1/D14-1162</ext-link>
</comment>
<conf-name>Proceedings of the 2014 Conference on Empirical Methods in Natural Language Processing (EMNLP)</conf-name>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref39">
<label>[40]</label>
<mixed-citation>[40]  J. Turian, L. Ratinov, and Y. Bengio, “Word representations: a simple and general method for semi-supervised learning,” <italic>in Proceedings of the 48th annual meeting of the association for computational linguistics</italic>, Uppsala, 2010, pp. 384–394. Available: <ext-link ext-link-type="uri" xlink:href="https://www.aclweb.org/anthology/P10-1040">https://www.aclweb.org/anthology/P10-1040</ext-link></mixed-citation>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Turian</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Ratinov</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Bengio</surname>
<given-names>Y.</given-names>
</name>
</person-group>
<source>Word representations: a simple and general method for semi-supervised learning</source>
<year>2010</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="https://www.aclweb.org/anthology/P10-1040">https://www.aclweb.org/anthology/P10-1040</ext-link>
</comment>
<conf-name>Proceedings of the 48th annual meeting of the association for computational linguistics</conf-name>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref40">
<label>[41]</label>
<mixed-citation>[41]  P. Bojanowski, E. Grave, A. Joulin, and T. Mikolov, “Enriching word vectors with subword information,” <italic>Trans. Assoc. Comput. Linguist</italic>., vol. 5, pp. 135–146, Jun. 2017. <ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1162/tacl_a_00051">http://dx.doi.org/10.1162/tacl_a_00051</ext-link>
</mixed-citation>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bojanowski</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Grave</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Joulin</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Mikolov</surname>
<given-names>T.</given-names>
</name>
</person-group>
<article-title>Enriching word vectors with subword information</article-title>
<source>Trans. Assoc. Comput. Linguist.</source>
<year>2017</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1162/tacl_a_00051">http://dx.doi.org/10.1162/tacl_a_00051</ext-link>
</comment>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref41">
<label>[42]</label>
<mixed-citation>[42]  S. Pyysalo et al., “BioInfer: a corpus for information extraction in the biomedical domain,” <italic>BMC Bioinformatics</italic>, vol. 8, no. 50, Feb. 2007. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1186/1471-2105-8-50">https://doi.org/10.1186/1471-2105-8-50</ext-link>
</mixed-citation>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pyysalo</surname>
<given-names>S.</given-names>
</name>
</person-group>
<article-title>BioInfer: a corpus for information extraction in the biomedical domain</article-title>
<source>BMC Bioinformatics</source>
<year>2007</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1186/1471-2105-8-50">https://doi.org/10.1186/1471-2105-8-50</ext-link>
</comment>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref42">
<label>[43]</label>
<mixed-citation>[43]  H. Gurulingappa, A. M. Rajput, A. Roberts, J. Fluck, M. Hofmann-Apitius, and L. Toldo, “Development of a benchmark corpus to support the automatic extraction of drug-related adverse effects from medical case reports,” <italic>J. Biomed. Inform</italic>., vol. 45, no. 5, pp. 885–892, Oct. 2012. <ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1016/j.jbi.2012.04.008">http://dx.doi.org/10.1016/j.jbi.2012.04.008</ext-link>
</mixed-citation>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gurulingappa</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Rajput</surname>
<given-names>A. M.</given-names>
</name>
<name>
<surname>Roberts</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Fluck</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Hofmann-Apitius</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Toldo</surname>
<given-names>L.</given-names>
</name>
</person-group>
<article-title>Development of a benchmark corpus to support the automatic extraction of drug-related adverse effects from medical case reports</article-title>
<source>J. Biomed. Inform.</source>
<year>2012</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1016/j.jbi.2012.04.008">http://dx.doi.org/10.1016/j.jbi.2012.04.008</ext-link>
</comment>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref43">
<label>[44]</label>
<mixed-citation>[44]  J. Kringelum, S. K. Kjaerulff, S. Brunak, O. Lund, T. I. Oprea, and O. Taboureau, “ChemProt-3.0: a global chemical biology diseases mapping,” <italic>Database</italic>, Feb. 2016. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/database/bav123">https://doi.org/10.1093/database/bav123</ext-link>
</mixed-citation>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kringelum</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Kjaerulff</surname>
<given-names>S. K.</given-names>
</name>
<name>
<surname>Brunak</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Lund</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Oprea</surname>
<given-names>T. I.</given-names>
</name>
<name>
<surname>Taboureau</surname>
<given-names>O.</given-names>
</name>
</person-group>
<article-title>ChemProt-3.0: a global chemical biology diseases mapping</article-title>
<source>Database</source>
<year>2016</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/database/bav123">https://doi.org/10.1093/database/bav123</ext-link>
</comment>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref44">
<label>[45]</label>
<mixed-citation>[45]  I. Hendrickx et al., “Semeval-2010 task 8: Multi-way classification of semantic relations between pairs of nominals,” <italic>in Proceedings of the Workshop on Semantic Evaluations</italic>, Uppsala, 2010, pp. 33–38. Available: <ext-link ext-link-type="uri" xlink:href="https://www.aclweb.org/anthology/S10-1006">https://www.aclweb.org/anthology/S10-1006</ext-link></mixed-citation>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Hendrickx</surname>
<given-names>I.</given-names>
</name>
</person-group>
<source>Semeval-2010 task 8: Multi-way classification of semantic relations between pairs of nominals</source>
<year>2010</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="https://www.aclweb.org/anthology/S10-1006">https://www.aclweb.org/anthology/S10-1006</ext-link>
</comment>
<conf-name>Proceedings of the Workshop on Semantic Evaluations</conf-name>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref45">
<label>[46]</label>
<mixed-citation>[46]  B. Hachey, C. Grover, and R. Tobin, “Datasets for generic relation extraction,” <italic>Nat. Lang. Eng</italic>., vol. 18, no. 1, pp. 21–59, Jan. 2012. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1017/s1351324911000106">https://doi.org/10.1017/s1351324911000106</ext-link>
</mixed-citation>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hachey</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Grover</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Tobin</surname>
<given-names>R.</given-names>
</name>
</person-group>
<article-title>Datasets for generic relation extraction</article-title>
<source>Nat. Lang. Eng.</source>
<year>2012</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1017/s1351324911000106">https://doi.org/10.1017/s1351324911000106</ext-link>
</comment>
</element-citation>
</ref>
<ref id="redalyc_344262226006_ref46">
<label>[47]</label>
<mixed-citation>[47]  T. Ming Harry Hsu, W. Yu Chen, C.-A. Hou, Y.-H. Hubert Tsai, Y.-R. Yeh, and Y.-C. Frank Wang, “Unsupervised domain adaptation with imbalanced cross-domain data,” <italic>in Proceedings of the IEEE International Conference on Computer Vision</italic>, Santiago de Chile, 2015, pp. 4121–4129. <ext-link ext-link-type="uri" xlink:href="http://doi.org/10.1109/iccv.2015.469">http://doi.org/10.1109/iccv.2015.469</ext-link>
</mixed-citation>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Ming Harry Hsu</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Yu Chen</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Hou</surname>
<given-names>C.-A.</given-names>
</name>
<name>
<surname>Hubert Tsai</surname>
<given-names>Y.-H.</given-names>
</name>
<name>
<surname>Yeh</surname>
<given-names>Y.-R.</given-names>
</name>
<name>
<surname>Frank Wang</surname>
<given-names>Y.-C.</given-names>
</name>
</person-group>
<source>Unsupervised domain adaptation with imbalanced cross-domain data</source>
<year>2015</year>
<comment>
<ext-link ext-link-type="uri" xlink:href="http://doi.org/10.1109/iccv.2015.469">http://doi.org/10.1109/iccv.2015.469</ext-link>
</comment>
<conf-name>Proceedings of the IEEE International Conference on Computer Vision</conf-name>
</element-citation>
</ref>
</ref-list>
</back>
</article>