<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id>
      <journal-title>JMIR Medical Informatics</journal-title>
      <issn pub-type="epub">2291-9694</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
    <article-id pub-id-type="publisher-id">v6i4e12159</article-id>
    <article-id pub-id-type="pmid">30478023</article-id>
    <article-id pub-id-type="doi">10.2196/12159</article-id>
    <article-categories>
      <subj-group subj-group-type="heading">
        <subject>Original Paper</subject>
      </subj-group>
      <subj-group subj-group-type="article-type">
        <subject>Original Paper</subject>
      </subj-group>
    </article-categories>
    <title-group>
      <article-title>Extraction of Information Related to Adverse Drug Events from Electronic Health Record Notes: Design of an End-to-End Model Based on Deep Learning</article-title>
    </title-group>
    <contrib-group>
      <contrib contrib-type="editor">
        <name>
          <surname>Eysenbach</surname>
          <given-names>Gunther</given-names>
        </name>
      </contrib>
    </contrib-group>
    <contrib-group>
      <contrib contrib-type="reviewer">
        <name>
          <surname>Miller</surname>
          <given-names>Heather</given-names>
        </name>
      </contrib>
      <contrib contrib-type="reviewer">
        <name>
          <surname>Liu</surname>
          <given-names>Mei</given-names>
        </name>
      </contrib>
    </contrib-group>
    <contrib-group>
      <contrib contrib-type="author" id="contrib1">
        <name name-style="western">
          <surname>Li</surname>
          <given-names>Fei</given-names>
        </name>
        <degrees>PhD</degrees>
        <xref rid="aff1" ref-type="aff">1</xref>
        <xref rid="aff2" ref-type="aff">2</xref>
        <xref rid="aff3" ref-type="aff">3</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-1816-1761</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib2">
        <name name-style="western">
          <surname>Liu</surname>
          <given-names>Weisong</given-names>
        </name>
        <degrees>PhD</degrees>
        <xref rid="aff1" ref-type="aff">1</xref>
        <xref rid="aff2" ref-type="aff">2</xref>
        <xref rid="aff3" ref-type="aff">3</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-3825-5597</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib3" corresp="yes">
      <name name-style="western">
        <surname>Yu</surname>
        <given-names>Hong</given-names>
      </name>
      <degrees>PhD</degrees>
      <xref rid="aff1" ref-type="aff">1</xref>
      <address>
        <institution>Department of Computer Science</institution>
        <institution>University of Massachusetts Lowell</institution>
        <addr-line>1 University Avenue</addr-line>
        <addr-line>Lowell, MA,</addr-line>
        <country>United States</country>
        <phone>1 508 612 7292</phone>
        <email>Hong_Yu@uml.edu</email>
      </address>  
      <xref rid="aff2" ref-type="aff">2</xref>
      <xref rid="aff3" ref-type="aff">3</xref>
      <xref rid="aff4" ref-type="aff">4</xref>
      <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-9263-5035</ext-link></contrib>
    </contrib-group>
    <aff id="aff1">
    <label>1</label>
    <institution>Department of Computer Science</institution>
    <institution>University of Massachusetts Lowell</institution>  
    <addr-line>Lowell, MA</addr-line>
    <country>United States</country></aff>
    <aff id="aff2">
    <label>2</label>
    <institution>Center for Healthcare Organization and Implementation Research</institution>
    <institution>Bedford Veterans Affairs Medical Center</institution>  
    <addr-line>Bedford, MA</addr-line>
    <country>United States</country></aff>
    <aff id="aff3">
    <label>3</label>
    <institution>Department of Medicine</institution>
    <institution>University of Massachusetts Medical School</institution>  
    <addr-line>Worcester, MA</addr-line>
    <country>United States</country></aff>
    <aff id="aff4">
    <label>4</label>
    <institution>School of Computer Science</institution>
    <institution>University of Massachusetts</institution>  
    <addr-line>Amherst, MA</addr-line>
    <country>United States</country></aff>
    <author-notes>
      <corresp>Corresponding Author: Hong Yu 
      <email>Hong_Yu@uml.edu</email></corresp>
    </author-notes>
    <pub-date pub-type="collection"><season>Oct-Dec</season><year>2018</year></pub-date>
    <pub-date pub-type="epub">
      <day>26</day>
      <month>11</month>
      <year>2018</year>
    </pub-date>
    <volume>6</volume>
    <issue>4</issue>
    <elocation-id>e12159</elocation-id>
    <!--history from ojs - api-xml-->
    <history>
      <date date-type="received">
        <day>12</day>
        <month>9</month>
        <year>2018</year>
      </date>
      <date date-type="rev-request">
        <day>8</day>
        <month>10</month>
        <year>2018</year>
      </date>
      <date date-type="rev-recd">
        <day>31</day>
        <month>10</month>
        <year>2018</year>
      </date>
      <date date-type="accepted">
        <day>9</day>
        <month>11</month>
        <year>2018</year>
      </date>
    </history>
    <!--(c) the authors - correct author names and publication date here if necessary. Date in form ', dd.mm.yyyy' after jmir.org-->
    <copyright-statement>©Fei Li, Weisong Liu, Hong Yu. Originally published in JMIR Medical Informatics (http://medinform.jmir.org), 26.11.2018.</copyright-statement>
    <copyright-year>2018</copyright-year>
    <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
      <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on http://medinform.jmir.org/, as well as this copyright and license information must be included.</p>
    </license>  
    <self-uri xlink:href="http://medinform.jmir.org/2018/4/e12159/" xlink:type="simple"/>
    <abstract>
      <sec sec-type="background">
        <title>Background</title>
        <p>Pharmacovigilance and drug-safety surveillance are crucial for monitoring adverse drug events (ADEs), but the main ADE-reporting systems such as Food and Drug Administration Adverse Event Reporting System face challenges such as underreporting. Therefore, as complementary surveillance, data on ADEs are extracted from electronic health record (EHR) notes via natural language processing (NLP). As NLP develops, many up-to-date machine-learning techniques are introduced in this field, such as deep learning and multi-task learning (MTL). However, only a few studies have focused on employing such techniques to extract ADEs.</p>
      </sec>
      <sec sec-type="objective">
        <title>Objective</title>
        <p>We aimed to design a deep learning model for extracting ADEs and related information such as medications and indications. Since extraction of ADE-related information includes two steps—named entity recognition and relation extraction—our second objective was to improve the deep learning model using multi-task learning between the two steps.</p>
      </sec>
      <sec sec-type="methods">
        <title>Methods</title>
        <p>We employed the dataset from the Medication, Indication and Adverse Drug Events (MADE) 1.0 challenge to train and test our models. This dataset consists of 1089 EHR notes of cancer patients and includes 9 entity types such as Medication, Indication, and ADE and 7 types of relations between these entities. To extract information from the dataset, we proposed a deep-learning model that uses a bidirectional long short-term memory (BiLSTM) conditional random field network to recognize entities and a BiLSTM-Attention network to extract relations. To further improve the deep-learning model, we employed three typical MTL methods, namely, hard parameter sharing, parameter regularization, and task relation learning, to build three MTL models, called HardMTL, RegMTL, and LearnMTL, respectively.</p>
      </sec>
      <sec sec-type="results">
        <title>Results</title>
        <p>Since extraction of ADE-related information is a two-step task, the result of the second step (ie, relation extraction) was used to compare all models. We used microaveraged precision, recall, and F1 as evaluation metrics. Our deep learning model achieved state-of-the-art results (F1=65.9%), which is significantly higher than that (F1=61.7%) of the best system in the MADE1.0 challenge. HardMTL further improved the F1 by 0.8%, boosting the F1 to 66.7%, whereas RegMTL and LearnMTL failed to boost the performance.</p>
      </sec>
      <sec sec-type="conclusions">
        <title>Conclusions</title>
        <p>Deep learning models can significantly improve the performance of ADE-related information extraction. MTL may be effective for named entity recognition and relation extraction, but it depends on the methods, data, and other factors. Our results can facilitate research on ADE detection, NLP, and machine learning.</p>
      </sec>
    </abstract>
    <kwd-group>
      <kwd>adverse drug event</kwd>
      <kwd>deep learning</kwd>
      <kwd>multi-task learning</kwd>
      <kwd>named entity recognition</kwd>
      <kwd>natural language processing</kwd>
      <kwd>relation extraction</kwd>
    </kwd-group></article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>An adverse drug event (ADE) is an injury resulting from a medical drug intervention [<xref ref-type="bibr" rid="ref1">1</xref>]. Previous studies reported that ADEs could account for up to 41% of all hospital admissions [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref3">3</xref>]. An ADE may cause a prolonged length of stay in the hospital and increase the economic burden [<xref ref-type="bibr" rid="ref4">4</xref>]. The annual cost of ADEs for a 700-bed hospital is approximately $5.6 million [<xref ref-type="bibr" rid="ref5">5</xref>]. Moreover, the total number of iatrogenic deaths can reach nearly 800,000 per year, which is higher than the death rate of heart disease or cancer [<xref ref-type="bibr" rid="ref6">6</xref>]. In 2013, medical error, including ADEs, is the third most-common cause of death in the United States [<xref ref-type="bibr" rid="ref7">7</xref>]. Therefore, ADE detection and report are crucial for pharmacovigilance and drug-safety surveillance [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref9">9</xref>].</p>
        <p>Two methods are usually used to detect and report ADE. In premarketing surveillance, ADEs can be discovered during phase III clinical trials for drug development. In postmarketing surveillance, ADEs are discovered by patients and physicians using the Food and Drug Administration (FDA) Adverse Event Reporting System (FAERS). These traditional methods are limited by the number of participants [<xref ref-type="bibr" rid="ref10">10</xref>], underreporting [<xref ref-type="bibr" rid="ref11">11</xref>], and missing patterns of drug exposure [<xref ref-type="bibr" rid="ref12">12</xref>]; for example, underreporting is a known issue in FAERS and may occur due to several reasons. First, the objective and content of the report in FAERS change over time, which may confuse physicians and the general public. Second, patients may choose not to mention some reactions, due to which practitioners fail to report them. Third, ADEs with long latency or producing unusual symptoms may be unrecognized. Other reasons may include payments from pharmaceutical companies to doctors [<xref ref-type="bibr" rid="ref13">13</xref>] and inefficient communication between patients, physicians, and pharmacists. Recently, the FDA made the FAERS data available through a public dashboard [<xref ref-type="bibr" rid="ref14">14</xref>]. Since anyone can view ADE reports online, this venture may help the FDA receive feedback to improve the FAERS.</p>
        <p>Many researchers have used other resources to identify ADEs, such as biomedical publications [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref16">16</xref>], social media [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref18">18</xref>], and electronic health record (EHR) notes [<xref ref-type="bibr" rid="ref19">19</xref>-<xref ref-type="bibr" rid="ref21">21</xref>]. The ADEs extracted from these resources are an important complement to traditional ADE-surveillance systems. However, manual collection of ADEs from these data is laborious [<xref ref-type="bibr" rid="ref22">22</xref>]. As such, the use of computer systems is a good choice to automatically detect ADEs, but may fail since these data are often unstructured text. Therefore, natural language processing (NLP) techniques are employed for this significant task [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref23">23</xref>].</p>
        <p>From the viewpoint of NLP, ADE detection is covered under the task of information extraction, which includes ADE extraction as well as information related to ADE, such as medications and indications. Extraction of ADE-related information can be casted as a two-step pipeline. The first step is named entity recognition (NER) [<xref ref-type="bibr" rid="ref24">24</xref>], which recognizes a string of text as an entity (eg, medication or ADE) that is predefined by dataset annotators. The second step is relation extraction (RE) [<xref ref-type="bibr" rid="ref15">15</xref>], which is a model that determines whether two entities have a specific relation (eg, ﻿medication and ADE).</p>
        <p>Previous studies employed traditional machine-learning techniques [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>] such as condition random field (CRF) [<xref ref-type="bibr" rid="ref25">25</xref>] or support vector machine (SVM) [<xref ref-type="bibr" rid="ref26">26</xref>]. Recently, deep learning attracted much attention in NLP due its numerous advantages such as better performances and less feature engineering compared to other systems [<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref28">28</xref>]. However, only a few studies have addressed extraction of ADE-related information via deep learning. Since ADE detection can be divided into two tasks (ie, NER and RE), it is logical to incorporate multi-task learning (MTL) [<xref ref-type="bibr" rid="ref29">29</xref>] into ADE detection. However, only limited prior work has investigated the impact of MTL on ADE detection.</p>
      </sec>
      <sec>
        <title>Relevant Literature</title>
        <sec>
          <title>Adverse Drug Event Detection</title>
          <p>Since ADEs play an important role in drug-safety surveillance, ADE detection receives increasing attention from both the federal regulation and the research community. Besides the official reporting system FAERS, there are other databases that collect data on known ADEs, such as the Comparative Toxicogenomics Database [<xref ref-type="bibr" rid="ref30">30</xref>] and SIDER [<xref ref-type="bibr" rid="ref31">31</xref>]. Various resources have been used to detect ADEs, such as biomedical publications [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref16">16</xref>], social media [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref18">18</xref>], and electronic health record (EHR) notes [<xref ref-type="bibr" rid="ref19">19</xref>-<xref ref-type="bibr" rid="ref21">21</xref>]. For example, Gurulingappa et al [<xref ref-type="bibr" rid="ref16">16</xref>] leveraged medical case reports to build a corpus in order to support drug-related adverse effects. Wei et al [<xref ref-type="bibr" rid="ref15">15</xref>] organized a challenge task to extract chemical-induced disease relations from the literature and created an annotated corpus from 1500 articles. With respect to the methods, both supervised and unsupervised methods were used. Ramesh et al [<xref ref-type="bibr" rid="ref32">32</xref>] developed a supervised machine-learning model to extract adverse event entities from FAERS narratives. Xu and Wang [<xref ref-type="bibr" rid="ref33">33</xref>] used a semisupervised bootstrapped method to construct a knowledge base for the drug-side-effect association. Liu et al [<xref ref-type="bibr" rid="ref34">34</xref>] proposed a causality-analysis model based on structure learning for identifying factors that contribute to adverse drug reactions. Yildirim et al [<xref ref-type="bibr" rid="ref35">35</xref>] applied the k-mean algorithm to identify adverse reactions. Xu et al [<xref ref-type="bibr" rid="ref23">23</xref>] used SVM to extract ADEs between sentence-level and document-level drug-disease pairs. Recently, Munkhdalai et al [<xref ref-type="bibr" rid="ref21">21</xref>] attempted to use deep learning to address ADE extraction, but their model was not end-to-end and relied on the entities.</p>
          
                  <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Study overview. NER: named entity recognition. RE: relation extraction. BiLSTM: bidirectional long short-term-memory. CRF: conditional random field. MTL: multi-task learning. MADE: Medication, Indication, and Adverse Drug Events. HardMTL: multi-task learning model for hard parameter sharing. RegMTL: multi-task learning model for soft parameter sharing based on regularization. LearnMTL: multi-task learning model for soft parameter sharing based on task-relation learning.</p>
          </caption>
          <graphic xlink:href="medinform_v6i4e12159_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
          
        </sec>
        <sec>
          <title>Named Entity Recognition</title>
          <p>NER is a standard task that has been studied for many years in NLP [<xref ref-type="bibr" rid="ref25">25</xref>]. Many researchers made important contributions to dataset construction including the GENIA corpus [<xref ref-type="bibr" rid="ref36">36</xref>], the NCBI disease corpus [<xref ref-type="bibr" rid="ref37">37</xref>], and the ShARe/CLEF eHealth evaluation [<xref ref-type="bibr" rid="ref38">38</xref>]. Early studies addressed NER by diverse approaches such as rule-based [<xref ref-type="bibr" rid="ref39">39</xref>] and machine-learning approaches [<xref ref-type="bibr" rid="ref40">40</xref>-<xref ref-type="bibr" rid="ref42">42</xref>], among which CRF-based approaches predominated. For example, Campos et al [<xref ref-type="bibr" rid="ref40">40</xref>] presented a CRF model to recognize biomedical names, which achieved state-of-the-art performance at the time by incorporating rich features. Tang et al [<xref ref-type="bibr" rid="ref43">43</xref>] modified the label scheme of CRF to make it be capable of recognizing disjoint clinical concepts. However, such approaches need many efforts for feature engineering. Recently, a bidirectional LSTM (BiLSTM) model [<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref45">45</xref>] was proposed and became a popular method for NER. In the biomedical domain, Jagannatha and Yu [<xref ref-type="bibr" rid="ref20">20</xref>] used such a model to detect medical events from EHR notes.</p>
        </sec>
        <sec>
          <title>Relation Extraction</title>
          <p>RE has been widely studied, and some typical RE corpora in the biomedical domain include the 2010 i2b2/VA challenge [<xref ref-type="bibr" rid="ref46">46</xref>] and BioCreative V CDR task [<xref ref-type="bibr" rid="ref15">15</xref>]. Early work used rules and NLP structures such as dependency trees [<xref ref-type="bibr" rid="ref47">47</xref>] and coreference chains [<xref ref-type="bibr" rid="ref48">48</xref>] to help extract relations. Others usually leveraged machine-learning approaches such as SVM [<xref ref-type="bibr" rid="ref49">49</xref>,<xref ref-type="bibr" rid="ref50">50</xref>] and structured learning [<xref ref-type="bibr" rid="ref51">51</xref>]. As deep learning developed, researchers proposed a number of neural network models to handle RE [<xref ref-type="bibr" rid="ref52">52</xref>,<xref ref-type="bibr" rid="ref53">53</xref>]. Our study is related to the joint or end-to-end entity and RE, which allows performance of NER and RE simultaneously. Miwa and Bansal [<xref ref-type="bibr" rid="ref54">54</xref>] proposed an end-to-end model based on the sequence and tree LSTM. Similarly, Mehryary et al [<xref ref-type="bibr" rid="ref55">55</xref>] proposed an end-to-end system to extract information about bacteria and their habitats.</p>
        </sec>
        <sec>
          <title>Multi-Task Learning</title>
          <p>MTL [<xref ref-type="bibr" rid="ref29">29</xref>] refers to training the model for multiple related tasks. It is widely used in artificial intelligence research such as computer vision [<xref ref-type="bibr" rid="ref56">56</xref>] and NLP [<xref ref-type="bibr" rid="ref57">57</xref>]. Learning these tasks simultaneously may improve the performance as compared to learning the tasks individually. Prior MTL studies mostly focused on homogeneous MTL that consists of tasks with only one type such as classification or regression [<xref ref-type="bibr" rid="ref58">58</xref>]. Some of their tasks are closely related, such as cross-lingual [<xref ref-type="bibr" rid="ref59">59</xref>] and synthetic data [<xref ref-type="bibr" rid="ref60">60</xref>]. Based on a previous study [<xref ref-type="bibr" rid="ref58">58</xref>], MTL can be roughly divided into two categories—hard and soft parameter sharing. For hard parameter sharing, the lower layers are shared among multiple tasks and each task has its own higher layer [<xref ref-type="bibr" rid="ref54">54</xref>]. For soft parameter sharing, each task has its own model with its own parameters. There are some representative methods for soft parameter sharing such as regularization [<xref ref-type="bibr" rid="ref59">59</xref>] or learning task relations [<xref ref-type="bibr" rid="ref56">56</xref>].</p>
        </sec>
      </sec>
      <sec>
        <title>Objective</title>
        <p>Since only a few prior studies have addressed end-to-end detection of ADE via deep learning, we aimed to design a two-step pipeline model that consists of two submodels: a BiLSTM [<xref ref-type="bibr" rid="ref61">61</xref>] CRF [<xref ref-type="bibr" rid="ref25">25</xref>] network for NER and a BiLSTM-Attention [<xref ref-type="bibr" rid="ref62">62</xref>] network for RE. Since extraction of ADE-related information includes two steps, it is possible to study the impact of MTL on NER and RE. However, only limited prior work has focused on MTL with such heterogeneous and loosely related tasks. Therefore, our second objective was to fill this gap by proposing three MTL models and comparing them with the pipeline model. An overview of this study is shown in <xref ref-type="fig" rid="figure1">Figure 1</xref>.</p>

      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Deep Learning Pipeline Model</title>
        <sec>
          <title>BiLSTM-CRF Submodel for NER</title>
          <p>Our NER submodel is presented in <xref ref-type="fig" rid="figure2">Figure 2</xref>. We extended the state-of-the-art BiLSTM-CRF model [<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref45">45</xref>] by enriching its features. For a sentence, we extracted four kinds of features for each token, namely, its word, whether the initial character is capital, its part-of-speech (POS) tag, and its character representation. We employed a convolutional neural network to obtain character representation. After the token representations are obtained by concatenating the features, we fed them into a bidirectional LSTM layer to learn the hidden representations. Subsequently, the hidden representations were input into the CRF layer to determine the optimal labels for all the tokens in the sentence. For labels, we use the BMES (Begin, Middle, End, Singular) label scheme [<xref ref-type="bibr" rid="ref45">45</xref>] plus entity types. For example, the label of the token “Renal” is “B_Disease.” The details of the BiLSTM-CRF submodel for NER are provided in <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref>.</p>

        </sec>
        <sec>
          <title>BiLSTM-Attention Submodel for RE</title>
          <p>Our RE submodel is presented in <xref ref-type="fig" rid="figure3">Figure 3</xref>. A relation instance can be considered as a token sequence and two target entities. Here, the token sequence did not necessarily have to be one sentence, as we could also extract intersentence relations. For each token, we extracted four kinds of features, namely, its word, its POS tag, and the position embeddings [<xref ref-type="bibr" rid="ref63">63</xref>]. Here, the character representation was not used, because it reduced the performance in our preliminary experiments. Similar to the case for NER, we employed a BiLSTM layer to generate the hidden representations. Subsequently, the attention method [<xref ref-type="bibr" rid="ref62">62</xref>] was used to obtain context features.</p>
          <p>Because only context features may not be enough to capture the semantic relation, we also employed other features for concision, which are not shown in <xref ref-type="fig" rid="figure3">Figure 3</xref>. Considering previous work [<xref ref-type="bibr" rid="ref21">21</xref>], these features included words of two target entities, types of two target entities, the token number between two target entities, and the entity number between two target entities. Like the word or POS embeddings, these features can be represented as vectors. Therefore, the output layer considers the concatenation of all these features to determine the relation of target entities. The details of the BiLSTM-Attention submodel for RE are provided in <xref ref-type="app" rid="app2">Multimedia Appendix 2</xref>.</p>
        </sec>
      </sec>
      <sec>
        <title>Multi-Task Learning Models</title>
        <p>In this section, we propose three MTL models: one model used hard parameter sharing [<xref ref-type="bibr" rid="ref54">54</xref>] and two models used soft parameter sharing, namely, regularization [<xref ref-type="bibr" rid="ref59">59</xref>] and task relation learning [<xref ref-type="bibr" rid="ref56">56</xref>].</p>
        <sec>
          <title>HardMTL</title>
          <p>Our MTL model for hard parameter sharing is presented in <xref ref-type="fig" rid="figure4">Figure 4</xref>. We employed the shared-private architecture [<xref ref-type="bibr" rid="ref64">64</xref>] to make each submodel of each task retain its private parts and share some parts for multi-task learning. The NER and RE submodels had their own BiLSTM layers, namely, <italic>LSTM</italic><sup><italic>ner</italic> </sup> and <italic>LSTM</italic><sup><italic>re</italic> </sup>, and shared a BiLSTM layer, <italic>LSTM</italic><sup><italic>share</italic> </sup>. During training, the shared BiLSTM layer <italic>LSTM</italic><sup><italic>share</italic> </sup> was used by both the NER and RE submodels, so that it was tuned during the back-propagation by both submodels. Therefore, the model was able to learn useful knowledge from both tasks. The details of the HardMTL model are provided in <xref ref-type="app" rid="app3">Multimedia Appendix 3</xref>.</p>
        </sec>
        <sec>
          <title>RegMTL</title>
          <p>Our first MTL model for soft parameter sharing was based on regularization, and its architecture is presented in <xref ref-type="fig" rid="figure5">Figure 5</xref>. With reference to previous studies [<xref ref-type="bibr" rid="ref59">59</xref>,<xref ref-type="bibr" rid="ref60">60</xref>], we employed the L2 regularization in order to encourage the parameters of the NER and RE submodels to be similar instead of sharing some parts in the networks. Two BiLSTM layers were considered because different inputs of the NER and RE submodels lead to different dimensions of the first BiLSTM layer; therefore, L2 regularization of the parameters of the first BiLSTM layer was computationally intractable. We resolved this issue by performing L2 regularization in the second BiLSTM layer. The details of the RegMTL model are provided in <xref ref-type="app" rid="app3">Multimedia Appendix 3</xref>.</p>
        </sec>
        <sec>
          <title>LearnMTL</title>
          <p>Our second MTL model for soft parameter sharing was based on task relation learning [<xref ref-type="bibr" rid="ref56">56</xref>], and its architecture is illustrated in <xref ref-type="fig" rid="figure6">Figure 6</xref>. After generating hidden representations from the BiLSTM and attention layers, we used a linear layer, <italic>W</italic><sub><italic>5</italic> </sub>, to exchange information between the NER and RE submodels. To utilize task-specific and shared information, the concatenation of hidden representations of the BiLSTM and information exchange layers was fed into the upper decoders <italic>D</italic><sup><italic>ner</italic> </sup> and <italic>D</italic><sup><italic>re</italic> </sup>. The details of the LearnMTL model are provided in <xref ref-type="app" rid="app3">Multimedia Appendix 3</xref>.</p>
        </sec>
      </sec>
      <sec>
        <title>Dataset</title>
        <p>We used the MADE dataset from the MADE1.0 challenge for detecting medications and ADEs from EHR notes [<xref ref-type="bibr" rid="ref65">65</xref>]. It consists of 1089 EHR notes of patients with cancer, from which data for 18 common Protected Health Information aspects were removed according to ﻿the Health Insurance Portability and Accountability Act. The dataset was separated into 876 notes for training and 213 notes for testing. In this dataset, the annotators annotated not only ADEs, but also other ADE-related information. They predefined 9 entity types, namely, Medication, Indication, Frequency, Severity, Dosage, Duration, Route, ADE, and SSLIF (any sign, symptom, and disease that is not an ADE or Indication). In addition, they predefined 7 relation types between these entity types, namely, ﻿Dosage-Medication, Route-Medication, Frequency-Medication, Duration-Medication, Medication-Indication, Medication-ADE, and Severity-ADE.</p>
        
        
                  <fig id="figure2" position="float">
            <label>Figure 2</label>
            <caption>
              <p>NER submodel. For simplicity, here we use “Renal Failure” to illustrate the architecture. For “Renal,” the word feature is “Renal,” the capital feature of the initial character is “R,” the POS feature is “JJ,” and the character representation is generated from CNN. NER: named entity recognition. CNN: convolutional neural network. CRF: condition random field. LSTM: long short-term memory. CNN: convolutional neural network. POS: part of speech.</p>
            </caption>
            <graphic xlink:href="medinform_v6i4e12159_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>RE submodel. The target entities are “renal failure” (e<sub>1</sub>) and “antibiotics” (e<sub>2</sub>). Positions represent token distances to the target entities. RE: relation extraction. LSTM: long short-term memory. POS: part of speech.</p>
          </caption>
          <graphic xlink:href="medinform_v6i4e12159_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>The high-level view of HardMTL. For conciseness, “LSTM” indicates a BiLSTM layer, and the layers above the BiLSTM layer are denoted as <italic>D<sup>new</sup></italic> and <italic>D<sup>re</sup></italic>. The forward procedures for an NER instance and an RE instance are indicated by blue and green arrow lines, respectively. HardMTL: multi-task learning model for hard parameter sharing. LSTM: long short-term-memory. BiLSTM: bidirectional long short-term-memory. CRF: conditional random field. NER: named entity recognition. RE: relation extraction.</p>
          </caption>
          <graphic xlink:href="medinform_v6i4e12159_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure5" position="float">
          <label>Figure 5</label>
          <caption>
            <p>The high-level view of RegMTL. <italic>LSTM<sub>1</sub><sup>ner</sup></italic> and <italic>LSTM<sub>2</sub><sup>ner</sup></italic> indicate the first and second BiLSTM layers of the NER model. <italic>LSTM<sub>1</sub><sup>re</sup></italic> and <italic>LSTM<sub>2</sub><sup>re</sup></italic> indicate the first and second BiLSTM layers of the RE model. NER: named entity recognition. RE: relation extraction. RegMTL: multi-task learning model for soft parameter sharing based on regularization. BiLSTM: bidirectional long short-term-memory. CRF: conditional random field. LSTM: long short-term-memory.</p>
          </caption>
          <graphic xlink:href="medinform_v6i4e12159_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure6" position="float">
          <label>Figure 6</label>
          <caption>
            <p>The high-level view of LearnMTL. LearnMTL: multi-task learning model for soft parameter sharing based on task-relation learning. CRF: conditional random field. LSTM: long short-term-memory.</p>
          </caption>
          <graphic xlink:href="medinform_v6i4e12159_fig6.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <p>The experimental settings used to obtain these results are provided in <xref ref-type="app" rid="app4">Multimedia Appendix 4</xref>.</p>
      <sec>
        <title>Comparison Between Our Best Model and Existing Systems</title>
        <p>We compared our models with the top three systems in the MADE1.0 challenge. Chapman et al [<xref ref-type="bibr" rid="ref66">66</xref>] used CRF for NER and random forest for RE. Specifically, two random forest models were used—one for detecting whether relations exist between entities and the other for classifying what specific relation type exists. Xu et al [<xref ref-type="bibr" rid="ref67">67</xref>] used BiLSTM-CRF for NER with word, prefix, suffix, and character features. For RE, they used SVM and designed features such as positions, distances, bag of words, and bag of entities. Dandala et al [<xref ref-type="bibr" rid="ref68">68</xref>] also used BiLSTM-CRF for NER, but they input different features into the model such as words, POS tags, and characters. For RE, they employed the BiLSTM-Attention model that takes tokens, entity types, and positions as input.</p>
        <p>Full neural systems ([<xref ref-type="bibr" rid="ref68">68</xref>] and our study) achieve better performances with the MADE dataset than with other systems (<xref ref-type="table" rid="table1">Table 1</xref>). Although the main methods between the study of Dandala et al [<xref ref-type="bibr" rid="ref68">68</xref>] and our study are similar, our model is much better, as it significantly improved the F1 for RE by 5%. The reasons for this superiority may be that we used more features than previous work, such as capital information and entity words, and our model attained approximately 0.8% improvement in F1 from MTL.</p>
      </sec>
      <sec>
        <title>Comparison Between the Pipeline and MTL Models</title>
        <p>The HardMTL model outperforms other models, achieving an F1 of 84.5% in NER and 66.7% in RE (<xref ref-type="table" rid="table2">Table 2</xref>); the pipeline model ranks second, with F1 values of 84.1% and 65.9%, respectively. The RegMTL model obtains the best recall in both NER (84.5%) and RE (63.6%). Surprisingly, the most-complex MTL model LearnMTL ranked last.</p>
        <p>In our experiments, HardMTL successfully boosted the NER F1 by 0.4% (<italic>P</italic>=.003) and the RE F1 by 0.8% (<italic>P</italic>=.01), but RegMTL and LearnMTL failed to boost the performances. Thus, the effectiveness of different MTL methods depends on the selected tasks and data. For heterogenous and loosely related tasks such as NER and RE, it is more difficult for MTL to be effective.</p>
      </sec>
      <sec>
        <title>Performance of Each Entity Type</title>
        <p><xref ref-type="table" rid="table3">Table 3</xref> shows the performance of each entity type. Medication and Route (both F1&#62;90%) were easier to recognize than other types. In contrast, ADE is the most-difficult type to recognize (F1=55%). Other entity types with lower performances included Indication and Duration.</p>
      </sec>
      <sec>
        <title>Performance of Each Relation Type</title>
        <p><xref ref-type="table" rid="table4">Table 4</xref> shows the performance of each relation type. Medication-ADE relations are the most-difficult type to extract (F1=45.5%). Severity-ADE ranks second (F1=54.1%), followed by Duration-Medication (F1=59.5%). In contrast, Route-Medication and Dosage-Medication extraction are relatively easier, with F1&#62;80%.</p>
      </sec>
      <sec>
        <title>Comparison Between the Pipeline Model and MedEx System</title>
        <p>MedEx [<xref ref-type="bibr" rid="ref69">69</xref>] is an end-to-end system used to identify medications and their attributes such as routes and dosages. Therefore, the final results of MedEx correspond to our results for extracting 4 kinds of relations: Route-Medication, Dosage-Medication, Duration-Medication, Frequency-Medication. <xref ref-type="table" rid="table5">Table 5</xref> compares MedEx with our model. Our model significantly outperformed MedEx, which demonstrates that our model is a competitive system in this domain.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Comparison of our model with the existing systems in the Medication, Indication, and Adverse Drug Events dataset. The microaveraged F1s of relation extraction are shown according to the official evaluation report.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="300"/>
            <col width="300"/>
            <col width="300"/>
            <col width="100"/>
            <thead>
              <tr valign="top">
                <td>System</td>
                <td>Named entity recognition</td>
                <td>Relation extraction</td>
                <td>F1</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="bottom">
                <td>Chapman et al [<xref ref-type="bibr" rid="ref66">66</xref>]</td>
                <td>CRF<sup>a</sup></td>
                <td>Random forest</td>
                <td>59.2</td>
              </tr>
              <tr valign="bottom">
                <td>Xu et al [<xref ref-type="bibr" rid="ref67">67</xref>]</td>
                <td>BiLSTM<sup>b</sup>-CRF</td>
                <td>Support vector machine</td>
                <td>59.9</td>
              </tr>
              <tr valign="bottom">
                <td>Dandala et al [<xref ref-type="bibr" rid="ref68">68</xref>]</td>
                <td>BiLSTM-CRF</td>
                <td>BiLSTM-Attention</td>
                <td>61.7</td>
              </tr>
              <tr valign="bottom">
                <td>Our Best (HardMTL<sup>c</sup>)</td>
                <td>BiLSTM-CRF</td>
                <td>BiLSTM-Attention</td>
                <td>66.7</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>CRF: conditional random field</p>
            </fn>
            <fn id="table1fn2">
              <p><sup>b</sup>BiLSTM: bidirectional long short-term memory</p>
            </fn>
            <fn id="table1fn3">
              <p><sup>c</sup>HardMTL: multi-task learning model for hard parameter sharing</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Performances (%) of the pipeline and multi-task learning models. The values presented are the means of 5 runs of each model. The microaveraged P, R, and F1s of all entity or relation types are shown.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="280"/>
            <col width="120"/>
            <col width="120"/>
            <col width="120"/>
            <col width="120"/>
            <col width="120"/>
            <col width="120"/>
            <thead>
              <tr valign="top">
                <td>Method</td>
                <td colspan="3">Entity recognition</td>
                <td colspan="3">Relation extraction</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>P</td>
                <td>R</td>
                <td>F1</td>
                <td>P</td>
                <td>R</td>
                <td>F1</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="bottom">
                <td>Pipeline</td>
                <td>85.0</td>
                <td>83.2</td>
                <td>84.1</td>
                <td>69.8</td>
                <td>62.4</td>
                <td>65.9</td>
              </tr>
              <tr valign="bottom">
                <td>HardMTL<sup>a</sup></td>
                <td>85.0</td>
                <td>84.1</td>
                <td>84.5</td>
                <td>70.2</td>
                <td>63.6</td>
                <td>66.7</td>
              </tr>
              <tr valign="bottom">
                <td>RegMTL<sup>b</sup></td>
                <td>84.5</td>
                <td>84.5</td>
                <td>84.5</td>
                <td>66.7</td>
                <td>63.6</td>
                <td>65.1</td>
              </tr>
              <tr valign="bottom">
                <td>LearnMTL<sup>c</sup></td>
                <td>84.5</td>
                <td>82.8</td>
                <td>83.6</td>
                <td>67.2</td>
                <td>61.5</td>
                <td>64.2</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>HardMTL: multi-task learning model for hard parameter sharing</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>RegMTL: multi-task learning model for soft parameter sharing based on regularization</p>
            </fn>
            <fn id="table2fn3">
              <p><sup>c</sup>LearnMTL: multi-task learning model for soft parameter sharing based on task relation learning</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Performance (%) of each entity type.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="300"/>
            <col width="250"/>
            <col width="250"/>
            <col width="200"/>
            <thead>
              <tr valign="top">
                <td>Entity type</td>
                <td>P</td>
                <td>R</td>
                <td>F1</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Medication</td>
                <td>91.1</td>
                <td>92.0</td>
                <td>91.3</td>
              </tr>
              <tr valign="top">
                <td>Indication</td>
                <td>65.4</td>
                <td>64.8</td>
                <td>64.8</td>
              </tr>
              <tr valign="top">
                <td>Frequency</td>
                <td>87.1</td>
                <td>86.5</td>
                <td>86.3</td>
              </tr>
              <tr valign="top">
                <td>Severity</td>
                <td>84.6</td>
                <td>84.7</td>
                <td>84.7</td>
              </tr>
              <tr valign="top">
                <td>Dosage</td>
                <td>87.9</td>
                <td>86.4</td>
                <td>88.0</td>
              </tr>
              <tr valign="top">
                <td>Duration</td>
                <td>75.3</td>
                <td>76.6</td>
                <td>77.6</td>
              </tr>
              <tr valign="top">
                <td>Route</td>
                <td>91.6</td>
                <td>91.9</td>
                <td>91.9</td>
              </tr>
              <tr valign="top">
                <td>Adverse drug events</td>
                <td>59.5</td>
                <td>57.6</td>
                <td>55.4</td>
              </tr>
              <tr valign="bottom">
                <td>SSLIF<sup>a</sup></td>
                <td>83.9</td>
                <td>84.8</td>
                <td>84.9</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>SSLIF: any sign, symptom, and disease that is not an ADE or Indication</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>Performance (%) of each relation type.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="300"/>
            <col width="250"/>
            <col width="250"/>
            <col width="200"/>
            <thead>
              <tr valign="top">
                <td>Relation type</td>
                <td>P</td>
                <td>R</td>
                <td>F1</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Severity-Adverse drug events</td>
                <td>55.0</td>
                <td>54.4</td>
                <td>54.1</td>
              </tr>
              <tr valign="top">
                <td>Route-Medication</td>
                <td>81.0</td>
                <td>82.5</td>
                <td>82.1</td>
              </tr>
              <tr valign="top">
                <td>Medication-Indication</td>
                <td>53.9</td>
                <td>52.5</td>
                <td>52.9</td>
              </tr>
              <tr valign="top">
                <td>Dosage-Medication</td>
                <td>80.9</td>
                <td>79.8</td>
                <td>81.0</td>
              </tr>
              <tr valign="top">
                <td>Duration-Medication</td>
                <td>60.3</td>
                <td>63.7</td>
                <td>59.5</td>
              </tr>
              <tr valign="top">
                <td>Frequency-Medication</td>
                <td>77.7</td>
                <td>78.6</td>
                <td>78.4</td>
              </tr>
              <tr valign="top">
                <td>Medication-Adverse drug events</td>
                <td>50.4</td>
                <td>47.6</td>
                <td>45.5</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <table-wrap position="float" id="table5">
          <label>Table 5</label>
          <caption>
            <p>Results (%) of comparisons between our pipeline model and the MedEx system.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="280"/>
            <col width="120"/>
            <col width="120"/>
            <col width="120"/>
            <col width="120"/>
            <col width="120"/>
            <col width="120"/>
            <thead>
              <tr valign="top">
                <td>Entity type</td>
                <td colspan="3">MedEx system</td>
                <td colspan="3">Pipeline model</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>P</td>
                <td>R</td>
                <td>F1</td>
                <td>P</td>
                <td>R</td>
                <td>F1</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Route-Medication</td>
                <td>71.9</td>
                <td>47.9</td>
                <td>57.5</td>
                <td>81.0</td>
                <td>82.5</td>
                <td>82.1</td>
              </tr>
              <tr valign="top">
                <td>Dosage-Medication</td>
                <td>29.7</td>
                <td>3.5</td>
                <td>6.2</td>
                <td>80.9</td>
                <td>79.8</td>
                <td>81.0</td>
              </tr>
              <tr valign="top">
                <td>Duration-Medication</td>
                <td>25.5</td>
                <td>15.6</td>
                <td>19.4</td>
                <td>60.3</td>
                <td>63.7</td>
                <td>59.5</td>
              </tr>
              <tr valign="top">
                <td>Frequency-Medication</td>
                <td>52.5</td>
                <td>36.2</td>
                <td>42.8</td>
                <td>77.7</td>
                <td>78.6</td>
                <td>78.4</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>Existing systems usually selected a two-step pipeline to address ADE-related information extraction: recognizing entities and extracting relations. BiLSTM-CRF is the most-popular model for NER, whereas the selections of RE models are mixed. All our models outperformed the existing systems in the MADE1.0 challenge, which may be because of the following reasons: First, our models benefited from deep learning that is able to learn better from the data. Second, we enriched the features of deep learning models; therefore, our model outperformed the system [<xref ref-type="bibr" rid="ref68">68</xref>] that used similar deep learning models as ours.</p>
        <p>For MTL, we found that the model using hard parameter sharing (HardMTL) performed better than the other two models using soft parameter sharing (RegMTL and LearnMTL) and that the most complex MTL model, LearnMTL, performed the worst in our data. Our results are not surprising, as different MTL methods depend on different tasks and data [<xref ref-type="bibr" rid="ref54">54</xref>,<xref ref-type="bibr" rid="ref56">56</xref>,<xref ref-type="bibr" rid="ref59">59</xref>]. Overall, MTL more difficult between heterogeneous and loosely related tasks such as NER and RE.</p>
        <p>In our experiments, the entity type “ADE” and relation type “Medication-ADE” were the most difficult information to be extracted. Based on our analysis, this is not only due to a lack of training data, but also the intrinsic character of ADEs. ADEs are often implicit in the context without any obvious pattern, which negatively affects the model (Example 1 in <xref ref-type="app" rid="app5">Multimedia Appendix 5</xref>). In contrast, some entity or relation types with obvious patterns (eg, Medication-Dosage) are easier to identify (Example 2 in <xref ref-type="app" rid="app5">Multimedia Appendix 5</xref>).</p>
        <p>Finally, we found that the performance improved when we used the pretrained word embeddings in the biomedical domain [<xref ref-type="bibr" rid="ref70">70</xref>] rather than those in the general domain. Furthermore, if the pretrained word embeddings were not tuned, our models would perform better. One likely reason for this is that such a method can alleviate the overfitting problem.</p>
      </sec>
      <sec>
        <title>Error Analysis</title>
        <p>We randomly sampled hundreds of error instances of NER and RE. Through the manual analyses, we found several sources of errors. For NER, the major false-negative errors are due to long expressions of entities (Examples 3 and 4 in <xref ref-type="app" rid="app5">Multimedia Appendix 5</xref>). These entities (eg, IgG kappa monoclonal protein) include multiple words; therefore, it is difficult to detect their boundaries. Moreover, the major false-positive errors for NER occur because some entity types are incorrectly recognized as SSLIF (Examples 5 and 6 in <xref ref-type="app" rid="app5">Multimedia Appendix 5</xref>). This may be because the training instances of SSLIF are ≥10 times those of other entity types such as ADE. Thus, imbalanced data distribution may lead to certain bias of our models.</p>
        <p>With respect to RE, the major false-negative errors are due to long distances between target entities (Example 9 in <xref ref-type="app" rid="app5">Multimedia Appendix 5</xref>). The relation of two entities can be expressed through ≥6 sentences in EHRs; therefore, our model may miss such relations in a long context. In addition, the major false-positive errors for RE occur because relation expressions exist in the instance, but are not related to the target entities (Examples 7 and 8 in <xref ref-type="app" rid="app5">Multimedia Appendix 5</xref>). For instance, in Example 7 of <xref ref-type="app" rid="app5">Multimedia Appendix 5</xref>, “His current therapy includes [thalidomide]<sub>Entity1</sub> 50 mg a day for 2 weeks out of the month. He had been on Velcade, which was stopped secondary to increasing [peripheral neuropathy]<sub><italic>Entity2</italic> </sub><italic>,</italic> ” “peripheral neuropathy,” and “thalidomide” have no Medication-ADE relation, but the model incorrectly predicts their relation due to the words “secondary to.”</p>
      </sec>
      <sec>
        <title>Contributions</title>
        <p>﻿</p>
        <p>The main contributions of this work are as follows: (1) We proposed an up-to-date deep learning model to perform ADE-related information extraction in an end-to-end manner. Our model achieved new state-of-the-art performance, improving the F1 by 4.2% (absolute value). (2) To our knowledge, this is the first attempt to investigate the impact of MTL on two heterogeneous and loosely related tasks (ie, NER and RE). One of our MTL models further improved the F1 by 0.8% (absolute value). (3) ﻿Our manually annotated dataset—Medication, Indication, and Adverse Drug Events (MADE) [<xref ref-type="bibr" rid="ref65">65</xref>]—will be publicly available to support the research on extraction of ADE-related information.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>We proposed a deep learning model to detect ADEs and related information. We also investigated MTL on two ADE-related tasks, NER and RE. Our models achieved state-of-the-art performance in an ADE-detection dataset. MTL can improve performance, but it depends on the methods and data used. In the future, we plan to evaluate our models with more related datasets.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <app id="app1">
        <title>Multimedia Appendix 1</title>
        <p>BiLSTM-CRF submodel for NER. BiLSTM: bidirectional long short-term-memory. CRF: conditional random field. NER: named entity recognition.</p>
        <media xlink:href="medinform_v6i4e12159_app1.pdf" xlink:title="PDF File (Adobe PDF File), 75KB"/>
      </app>
      <app id="app2">
        <title>Multimedia Appendix 2</title>
        <p>BiLSTM-Attention submodel for RE. BiLSTM: bidirectional long short-term-memory. RE: relation extraction.</p>
        <media xlink:href="medinform_v6i4e12159_app2.pdf" xlink:title="PDF File (Adobe PDF File), 69KB"/>
      </app>
      <app id="app3">
        <title>Multimedia Appendix 3</title>
        <p>MTL models. MTL: multi-task learning.</p>
        <media xlink:href="medinform_v6i4e12159_app3.pdf" xlink:title="PDF File (Adobe PDF File), 181KB"/>
      </app>
      <app id="app4">
        <title>Multimedia Appendix 4</title>
        <p>Experimental settings.</p>
        <media xlink:href="medinform_v6i4e12159_app4.pdf" xlink:title="PDF File (Adobe PDF File), 73KB"/>
      </app>
      <app id="app5">
        <title>Multimedia Appendix 5</title>
        <p>Examples.</p>
        <media xlink:href="medinform_v6i4e12159_app5.pdf" xlink:title="PDF File (Adobe PDF File), 22KB"/>
      </app>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb2">ADE</term>
          <def>
            <p>adverse drug event</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">BiLSTM</term>
          <def>
            <p>bidirectional long short-term-memory</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">CRF</term>
          <def>
            <p>conditional random field</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">EHR</term>
          <def>
            <p>electronic health record</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">FAERS</term>
          <def>
            <p>Food and Drug Administration Adverse Event Reporting System</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">LSTM</term>
          <def>
            <p>long short-term-memory</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">MADE</term>
          <def>
            <p>Medication, Indication, and Adverse Drug Events</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">MTL</term>
          <def>
            <p>multi-task learning</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">NER</term>
          <def>
            <p>named entity recognition</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">NLP</term>
          <def>
            <p>natural language processing</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb12">RE</term>
          <def>
            <p>relation extraction</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb13">POS</term>
          <def>
            <p>part of speech</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb14">SVM</term>
          <def>
            <p>support vector machine</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>﻿This work was supported by a grant (5R01HL125089) from the National Institutes of Health and the Investigator Initiated Research grant (1I01HX001457-01) from the Health Services Research &#38; Development Program of the US Department of Veterans Affairs.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Bates</surname>
            <given-names>DW</given-names>
          </name>
          <name name-style="western">
            <surname>Cullen</surname>
            <given-names>DJ</given-names>
          </name>
          <name name-style="western">
            <surname>Laird</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Petersen</surname>
            <given-names>LA</given-names>
          </name>
          <name name-style="western">
            <surname>Small</surname>
            <given-names>SD</given-names>
          </name>
          <name name-style="western">
            <surname>Servi</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Laffel</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Sweitzer</surname>
            <given-names>BJ</given-names>
          </name>
          <name name-style="western">
            <surname>Shea</surname>
            <given-names>BF</given-names>
          </name>
          <name name-style="western">
            <surname>Hallisey</surname>
            <given-names>R</given-names>
          </name>
        </person-group>
        <article-title>Incidence of adverse drug events and potential adverse drug events. Implications for prevention. ADE Prevention Study Group</article-title>
        <source>JAMA</source>  
        <year>1995</year>  
        <month>07</month>  
        <day>05</day>  
        <volume>274</volume>  
        <issue>1</issue>  
        <fpage>29</fpage>  
        <lpage>34</lpage>  
        <pub-id pub-id-type="medline">7791255</pub-id></nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Nebeker</surname>
            <given-names>JR</given-names>
          </name>
          <name name-style="western">
            <surname>Hoffman</surname>
            <given-names>JM</given-names>
          </name>
          <name name-style="western">
            <surname>Weir</surname>
            <given-names>CR</given-names>
          </name>
          <name name-style="western">
            <surname>Bennett</surname>
            <given-names>CL</given-names>
          </name>
          <name name-style="western">
            <surname>Hurdle</surname>
            <given-names>JF</given-names>
          </name>
        </person-group>
        <article-title>High rates of adverse drug events in a highly computerized hospital</article-title>
        <source>Arch Intern Med</source>  
        <year>2005</year>  
        <month>05</month>  
        <day>23</day>  
        <volume>165</volume>  
        <issue>10</issue>  
        <fpage>1111</fpage>  
        <lpage>6</lpage>  
        <pub-id pub-id-type="doi">10.1001/archinte.165.10.1111</pub-id>
        <pub-id pub-id-type="medline">15911723</pub-id>
        <pub-id pub-id-type="pii">165/10/1111</pub-id></nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Fattinger</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Roos</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Vergères</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Holenstein</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Kind</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Masche</surname>
            <given-names>U</given-names>
          </name>
          <name name-style="western">
            <surname>Stocker</surname>
            <given-names>DN</given-names>
          </name>
          <name name-style="western">
            <surname>Braunschweig</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Kullak-Ublick</surname>
            <given-names>GA</given-names>
          </name>
          <name name-style="western">
            <surname>Galeazzi</surname>
            <given-names>RL</given-names>
          </name>
          <name name-style="western">
            <surname>Follath</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Gasser</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Meier</surname>
            <given-names>PJ</given-names>
          </name>
        </person-group>
        <article-title>Epidemiology of drug exposure and adverse drug reactions in two swiss departments of internal medicine</article-title>
        <source>Br J Clin Pharmacol</source>  
        <year>2000</year>  
        <month>02</month>  
        <volume>49</volume>  
        <issue>2</issue>  
        <fpage>158</fpage>  
        <lpage>67</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://onlinelibrary.wiley.com/resolve/openurl?genre=article&#38;sid=nlm:pubmed&#38;issn=0306-5251&#38;date=2000&#38;volume=49&#38;issue=2&#38;spage=158"/>
        </comment>  
        <pub-id pub-id-type="medline">10671911</pub-id>
        <pub-id pub-id-type="pii">bcp132</pub-id>
        <pub-id pub-id-type="pmcid">PMC2014906</pub-id></nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Classen</surname>
            <given-names>DC</given-names>
          </name>
          <name name-style="western">
            <surname>Pestotnik</surname>
            <given-names>SL</given-names>
          </name>
          <name name-style="western">
            <surname>Evans</surname>
            <given-names>RS</given-names>
          </name>
          <name name-style="western">
            <surname>Lloyd</surname>
            <given-names>JF</given-names>
          </name>
          <name name-style="western">
            <surname>Burke</surname>
            <given-names>JP</given-names>
          </name>
        </person-group>
        <article-title>Adverse drug events in hospitalized patients. Excess length of stay, extra costs, and attributable mortality</article-title>
        <source>JAMA</source>  
        <year>1997</year>  
        <volume>277</volume>  
        <issue>4</issue>  
        <fpage>301</fpage>  
        <lpage>6</lpage>  
        <pub-id pub-id-type="medline">9002492</pub-id></nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Bates</surname>
            <given-names>DW</given-names>
          </name>
          <name name-style="western">
            <surname>Spell</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Cullen</surname>
            <given-names>DJ</given-names>
          </name>
          <name name-style="western">
            <surname>Burdick</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Laird</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Petersen</surname>
            <given-names>LA</given-names>
          </name>
          <name name-style="western">
            <surname>Small</surname>
            <given-names>SD</given-names>
          </name>
          <name name-style="western">
            <surname>Sweitzer</surname>
            <given-names>BJ</given-names>
          </name>
          <name name-style="western">
            <surname>Leape</surname>
            <given-names>LL</given-names>
          </name>
        </person-group>
        <article-title>The costs of adverse drug events in hospitalized patients. Adverse Drug Events Prevention Study Group</article-title>
        <source>JAMA</source>  
        <year>1997</year>  
        <volume>277</volume>  
        <issue>4</issue>  
        <fpage>307</fpage>  
        <lpage>11</lpage>  
        <pub-id pub-id-type="medline">9002493</pub-id></nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Null</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Dean</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Feldman</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Rasio</surname>
            <given-names>D</given-names>
          </name>
        </person-group>
        <article-title>Death by Medicine</article-title>
        <source>Journal of Orthomolecular Medicine</source>  
        <year>2005</year>  
        <volume>20</volume>  
        <issue>1</issue>  
        <fpage>34</fpage>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://www.orthomolecular.org/library/jom/2005/pdf/2005-v20n01-p021.pdf"/>
        </comment></nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Makary</surname>
            <given-names>MA</given-names>
          </name>
          <name name-style="western">
            <surname>Daniel</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Medical error-the third leading cause of death in the US</article-title>
        <source>BMJ</source>  
        <year>2016</year>  
        <month>12</month>  
        <day>03</day>  
        <pub-id pub-id-type="medline">27143499</pub-id></nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Handler</surname>
            <given-names>SM</given-names>
          </name>
          <name name-style="western">
            <surname>Altman</surname>
            <given-names>RL</given-names>
          </name>
          <name name-style="western">
            <surname>Perera</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Hanlon</surname>
            <given-names>JT</given-names>
          </name>
          <name name-style="western">
            <surname>Studenski</surname>
            <given-names>SA</given-names>
          </name>
          <name name-style="western">
            <surname>Bost</surname>
            <given-names>JE</given-names>
          </name>
          <name name-style="western">
            <surname>Saul</surname>
            <given-names>MI</given-names>
          </name>
          <name name-style="western">
            <surname>Fridsma</surname>
            <given-names>DB</given-names>
          </name>
        </person-group>
        <article-title>A systematic review of the performance characteristics of clinical event monitor signals used to detect adverse drug events in the hospital setting</article-title>
        <source>J Am Med Inform Assoc</source>  
        <year>2007</year>  
        <volume>14</volume>  
        <issue>4</issue>  
        <fpage>451</fpage>  
        <lpage>8</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/17460130"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1197/jamia.M2369</pub-id>
        <pub-id pub-id-type="medline">17460130</pub-id>
        <pub-id pub-id-type="pii">M2369</pub-id>
        <pub-id pub-id-type="pmcid">PMC2244905</pub-id></nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Kaushal</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Jha</surname>
            <given-names>AK</given-names>
          </name>
          <name name-style="western">
            <surname>Franz</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Glaser</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Shetty</surname>
            <given-names>KD</given-names>
          </name>
          <name name-style="western">
            <surname>Jaggi</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Middleton</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Kuperman</surname>
            <given-names>GJ</given-names>
          </name>
          <name name-style="western">
            <surname>Khorasani</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Tanasijevic</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Bates</surname>
            <given-names>DW</given-names>
          </name>
          <collab>BrighamWomen's Hospital CPOE Working Group</collab>
        </person-group>
        <article-title>Return on investment for a computerized physician order entry system</article-title>
        <source>J Am Med Inform Assoc</source>  
        <year>2006</year>  
        <month>05</month>  
        <volume>13</volume>  
        <issue>3</issue>  
        <fpage>261</fpage>  
        <lpage>6</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/16501178"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1197/jamia.M1984</pub-id>
        <pub-id pub-id-type="medline">16501178</pub-id>
        <pub-id pub-id-type="pii">M1984</pub-id>
        <pub-id pub-id-type="pmcid">PMC1513660</pub-id></nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Haas</surname>
            <given-names>JS</given-names>
          </name>
          <name name-style="western">
            <surname>Iyer</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Orav</surname>
            <given-names>EJ</given-names>
          </name>
          <name name-style="western">
            <surname>Schiff</surname>
            <given-names>GD</given-names>
          </name>
          <name name-style="western">
            <surname>Bates</surname>
            <given-names>DW</given-names>
          </name>
        </person-group>
        <article-title>Participation in an ambulatory e-pharmacovigilance system</article-title>
        <source>Pharmacoepidemiol Drug Saf</source>  
        <year>2010</year>  
        <month>09</month>  
        <volume>19</volume>  
        <issue>9</issue>  
        <fpage>961</fpage>  
        <lpage>9</lpage>  
        <pub-id pub-id-type="doi">10.1002/pds.2006</pub-id>
        <pub-id pub-id-type="medline">20623512</pub-id></nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Edlavitch</surname>
            <given-names>SA</given-names>
          </name>
        </person-group>
        <article-title>Adverse Drug Event Reporting</article-title>
        <source>Arch Intern Med</source>  
        <year>1988</year>  
        <month>07</month>  
        <day>01</day>  
        <volume>148</volume>  
        <issue>7</issue>  
        <fpage>1499</fpage>  
        <pub-id pub-id-type="doi">10.1001/archinte.1988.00380070017005</pub-id></nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Begaud</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Moride</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Tubert-Bitter</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Chaslerie</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Haramburu</surname>
            <given-names>F</given-names>
          </name>
        </person-group>
        <article-title>False-positives in spontaneous reporting: should we worry about them?</article-title>
        <source>British Journal of Clinical Pharmacology</source>  
        <year>2012</year>  
        <month>07</month>  
        <day>05</day>  
        <volume>38</volume>  
        <issue>5</issue>  
        <fpage>401</fpage>  
        <lpage>404</lpage>  
        <pub-id pub-id-type="doi">10.1111/j.1365-2125.1994.tb04373.x</pub-id></nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="web">
        <source>ProPublica</source>  
        <access-date>2018-10-28</access-date>
        <comment>Dollars for Docs 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://projects.propublica.org/docdollars/">https://projects.propublica.org/docdollars/</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="73UddA54z"/></comment> </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Kumar</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <article-title>The Newly Available FAERS Public Dashboard: Implications for Health Care Professionals</article-title>
        <source>Hospital Pharmacy</source>  
        <year>2018</year>  
        <month>08</month>  
        <day>23</day>  
        <pub-id pub-id-type="doi">10.1177/0018578718795271</pub-id></nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Wei</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Peng</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Leaman</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Davis</surname>
            <given-names>AP</given-names>
          </name>
          <name name-style="western">
            <surname>Mattingly</surname>
            <given-names>CJ</given-names>
          </name>
          <name name-style="western">
            <surname>Li</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Wiegers</surname>
            <given-names>TC</given-names>
          </name>
          <name name-style="western">
            <surname>Lu</surname>
            <given-names>Z</given-names>
          </name>
        </person-group>
        <article-title>Assessing the state of the art in biomedical relation extraction: overview of the BioCreative V chemical-disease relation (CDR) task</article-title>
        <source>Database (Oxford)</source>  
        <year>2016</year>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/26994911"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1093/database/baw032</pub-id>
        <pub-id pub-id-type="medline">26994911</pub-id></nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Gurulingappa</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Rajput</surname>
            <given-names>AM</given-names>
          </name>
          <name name-style="western">
            <surname>Roberts</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Fluck</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Hofmann-Apitius</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Toldo</surname>
            <given-names>L</given-names>
          </name>
        </person-group>
        <article-title>Development of a benchmark corpus to support the automatic extraction of drug-related adverse effects from medical case reports</article-title>
        <source>J Biomed Inform</source>  
        <year>2012</year>  
        <month>10</month>  
        <volume>45</volume>  
        <issue>5</issue>  
        <fpage>885</fpage>  
        <lpage>92</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(12)00061-5"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1016/j.jbi.2012.04.008</pub-id>
        <pub-id pub-id-type="medline">22554702</pub-id>
        <pub-id pub-id-type="pii">S1532-0464(12)00061-5</pub-id></nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Lardon</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Abdellaoui</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Bellet</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Asfari</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Souvignet</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Texier</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Jaulent</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Beyens</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Burgun</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Bousquet</surname>
            <given-names>C</given-names>
          </name>
        </person-group>
        <article-title>Adverse Drug Reaction Identification and Extraction in Social Media: A Scoping Review</article-title>
        <source>J Med Internet Res</source>  
        <year>2015</year>  
        <month>07</month>  
        <day>10</day>  
        <volume>17</volume>  
        <issue>7</issue>  
        <fpage>e171</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://www.jmir.org/2015/7/e171/"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2196/jmir.4304</pub-id>
        <pub-id pub-id-type="medline">26163365</pub-id>
        <pub-id pub-id-type="pii">v17i7e171</pub-id>
        <pub-id pub-id-type="pmcid">PMC4526988</pub-id></nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Abdellaoui</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Schück</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Texier</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Burgun</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <article-title>Filtering Entities to Optimize Identification of Adverse Drug Reaction From Social Media: How Can the Number of Words Between Entities in the Messages Help?</article-title>
        <source>JMIR Public Health Surveill</source>  
        <year>2017</year>  
        <month>06</month>  
        <day>22</day>  
        <volume>3</volume>  
        <issue>2</issue>  
        <fpage>e36</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://publichealth.jmir.org/2017/2/e36/"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2196/publichealth.6577</pub-id>
        <pub-id pub-id-type="medline">28642212</pub-id>
        <pub-id pub-id-type="pii">v3i2e36</pub-id>
        <pub-id pub-id-type="pmcid">PMC5500778</pub-id></nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Gurwitz</surname>
            <given-names>JH</given-names>
          </name>
        </person-group>
        <article-title>Incidence and Preventability of Adverse Drug Events Among Older Persons in the Ambulatory Setting</article-title>
        <source>JAMA</source>  
        <year>2003</year>  
        <month>03</month>  
        <day>05</day>  
        <volume>289</volume>  
        <issue>9</issue>  
        <fpage>1107</fpage>  
        <pub-id pub-id-type="doi">10.1001/jama.289.9.1107</pub-id></nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Jagannatha</surname>
            <given-names>AN</given-names>
          </name>
          <name name-style="western">
            <surname>Yu</surname>
            <given-names>H</given-names>
          </name>
        </person-group>
        <article-title>Bidirectional RNN for Medical Event Detection in Electronic Health Records</article-title>
        <source>Proc Conf</source>  
        <year>2016</year>  
        <month>06</month>  
        <volume>2016</volume>  
        <fpage>473</fpage>  
        <lpage>482</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/27885364"/>
        </comment>  
        <pub-id pub-id-type="medline">27885364</pub-id>
        <pub-id pub-id-type="pmcid">PMC5119627</pub-id></nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Munkhdalai</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Yu</surname>
            <given-names>H</given-names>
          </name>
        </person-group>
        <article-title>Clinical Relation Extraction Toward Drug Safety Surveillance Using Electronic Health Record Narratives: Classical Learning Versus Deep Learning</article-title>
        <source>JMIR Public Health Surveill</source>  
        <year>2018</year>  
        <month>04</month>  
        <day>25</day>  
        <volume>4</volume>  
        <issue>2</issue>  
        <fpage>e29</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://publichealth.jmir.org/2018/2/e29/"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2196/publichealth.9361</pub-id>
        <pub-id pub-id-type="medline">29695376</pub-id>
        <pub-id pub-id-type="pii">v4i2e29</pub-id>
        <pub-id pub-id-type="pmcid">PMC5943628</pub-id></nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Hurdle</surname>
            <given-names>JF</given-names>
          </name>
          <name name-style="western">
            <surname>Weir</surname>
            <given-names>CR</given-names>
          </name>
          <name name-style="western">
            <surname>Roth</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Hoffman</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Nebeker</surname>
            <given-names>JR</given-names>
          </name>
        </person-group>
        <article-title>Critical gaps in the world's largest electronic medical record: Ad Hoc nursing narratives and invisible adverse drug events</article-title>
        <source>AMIA Annu Symp Proc</source>  
        <year>2003</year>  
        <fpage>309</fpage>  
        <lpage>12</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/14728184"/>
        </comment>  
        <pub-id pub-id-type="medline">14728184</pub-id>
        <pub-id pub-id-type="pii">D030003423</pub-id>
        <pub-id pub-id-type="pmcid">PMC1480185</pub-id></nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Xu</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Wu</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Lee</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Xu</surname>
            <given-names>H</given-names>
          </name>
        </person-group>
        <article-title>CD-REST: a system for extracting chemical-induced disease relation in literature</article-title>
        <source>Database (Oxford)</source>  
        <year>2016</year>  
        <month>05</month>  
        <day>25</day>  
        <pub-id pub-id-type="doi">10.1093/database/baw036</pub-id>
        <pub-id pub-id-type="medline">27016700</pub-id></nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Finkel</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Dingare</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Manning</surname>
            <given-names>CD</given-names>
          </name>
          <name name-style="western">
            <surname>Nissim</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Alex</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Grover</surname>
            <given-names>C</given-names>
          </name>
        </person-group>
        <article-title>Exploring the boundaries: gene and protein identification in biomedical text</article-title>
        <source>BMC Bioinformatics</source>  
        <year>2005</year>  
        <volume>6 Suppl 1</volume>  
        <fpage>S5</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcbioinformatics.biomedcentral.com/articles/10.1186/1471-2105-6-S1-S5"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1186/1471-2105-6-S1-S5</pub-id>
        <pub-id pub-id-type="medline">15960839</pub-id>
        <pub-id pub-id-type="pii">1471-2105-6-S1-S5</pub-id>
        <pub-id pub-id-type="pmcid">PMC1869019</pub-id></nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Lafferty</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>McCallum</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Pereira</surname>
            <given-names>F</given-names>
          </name>
        </person-group>
        <article-title>Conditional Random Fields: Probabilistic Models for Segmenting and Labeling Sequence Data</article-title>
        <year>2001</year>  
        <conf-name>The Eighteenth International Conference on Machine Learning</conf-name>
        <conf-date>2001</conf-date>
        <conf-loc>San Francisco, CA, USA</conf-loc>
        <fpage>282</fpage>  
        <lpage>289</lpage>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://repository.upenn.edu/cgi/viewcontent.cgi?article=1162&#38;context=cis_papers"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Vapnik</surname>
            <given-names>VN</given-names>
          </name>
        </person-group>
        <source>The Nature of Statistical Learning Theory</source>  
        <year>2009</year>  
        <publisher-loc>New York</publisher-loc>
        <publisher-name>Springer-Verlag, LLC</publisher-name></nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>LeCun</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Bengio</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Hinton</surname>
            <given-names>G</given-names>
          </name>
        </person-group>
        <article-title>Deep learning</article-title>
        <source>Nature</source>  
        <year>2015</year>  
        <month>05</month>  
        <day>28</day>  
        <volume>521</volume>  
        <issue>7553</issue>  
        <fpage>436</fpage>  
        <lpage>44</lpage>  
        <pub-id pub-id-type="doi">10.1038/nature14539</pub-id>
        <pub-id pub-id-type="medline">26017442</pub-id>
        <pub-id pub-id-type="pii">nature14539</pub-id></nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Rajkomar</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Oren</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Chen</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Dai</surname>
            <given-names>AM</given-names>
          </name>
          <name name-style="western">
            <surname>Hajaj</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Hardt</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>PJ</given-names>
          </name>
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>X</given-names>
          </name>
          <name name-style="western">
            <surname>Marcus</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Sun</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Sundberg</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Yee</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Flores</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Duggan</surname>
            <given-names>GE</given-names>
          </name>
          <name name-style="western">
            <surname>Irvine</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Le</surname>
            <given-names>Q</given-names>
          </name>
          <name name-style="western">
            <surname>Litsch</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Mossin</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Tansuwan</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Wexler</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Wilson</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Ludwig</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Volchenboum</surname>
            <given-names>SL</given-names>
          </name>
          <name name-style="western">
            <surname>Chou</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Pearson</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Madabushi</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Shah</surname>
            <given-names>NH</given-names>
          </name>
          <name name-style="western">
            <surname>Butte</surname>
            <given-names>AJ</given-names>
          </name>
          <name name-style="western">
            <surname>Howell</surname>
            <given-names>MD</given-names>
          </name>
          <name name-style="western">
            <surname>Cui</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Corrado</surname>
            <given-names>GS</given-names>
          </name>
          <name name-style="western">
            <surname>Dean</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <article-title>Scalable and accurate deep learning with electronic health records</article-title>
        <source>Nature</source>  
        <year>2018</year>  
        <pub-id pub-id-type="doi">10.1038/s41746-018-0029-1</pub-id></nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Caruana</surname>
            <given-names>R</given-names>
          </name>
        </person-group>
        <article-title>Multitask Learning</article-title>
        <source>Machine Learning</source>  
        <year>1997</year>  
        <month>07</month>  
        <volume>28</volume>  
        <issue>1</issue>  
        <fpage>41</fpage>  
        <lpage>75</lpage>  
        <pub-id pub-id-type="doi">10.1023/A:1007379606734</pub-id></nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Davis</surname>
            <given-names>AP</given-names>
          </name>
          <name name-style="western">
            <surname>Grondin</surname>
            <given-names>CJ</given-names>
          </name>
          <name name-style="western">
            <surname>Lennon-Hopkins</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Saraceni-Richards</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Sciaky</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>King</surname>
            <given-names>BL</given-names>
          </name>
          <name name-style="western">
            <surname>Wiegers</surname>
            <given-names>TC</given-names>
          </name>
          <name name-style="western">
            <surname>Mattingly</surname>
            <given-names>CJ</given-names>
          </name>
        </person-group>
        <article-title>The Comparative Toxicogenomics Database's 10th year anniversary: update 2015</article-title>
        <source>Nucleic Acids Res</source>  
        <year>2015</year>  
        <month>01</month>  
        <volume>43</volume>  
        <issue>Database issue</issue>  
        <fpage>D914</fpage>  
        <lpage>20</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/25326323"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1093/nar/gku935</pub-id>
        <pub-id pub-id-type="medline">25326323</pub-id>
        <pub-id pub-id-type="pii">gku935</pub-id>
        <pub-id pub-id-type="pmcid">PMC4384013</pub-id></nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Kuhn</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Campillos</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Letunic</surname>
            <given-names>I</given-names>
          </name>
          <name name-style="western">
            <surname>Jensen</surname>
            <given-names>LJ</given-names>
          </name>
          <name name-style="western">
            <surname>Bork</surname>
            <given-names>P</given-names>
          </name>
        </person-group>
        <article-title>A side effect resource to capture phenotypic effects of drugs</article-title>
        <source>Mol Syst Biol</source>  
        <year>2010</year>  
        <volume>6</volume>  
        <fpage>343</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://MSB.embopress.org/cgi/pmidlookup?view=long&#38;pmid=20087340"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1038/msb.2009.98</pub-id>
        <pub-id pub-id-type="medline">20087340</pub-id>
        <pub-id pub-id-type="pii">msb200998</pub-id>
        <pub-id pub-id-type="pmcid">PMC2824526</pub-id></nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Polepalli</surname>
            <given-names>RB</given-names>
          </name>
          <name name-style="western">
            <surname>Belknap</surname>
            <given-names>SM</given-names>
          </name>
          <name name-style="western">
            <surname>Li</surname>
            <given-names>Z</given-names>
          </name>
          <name name-style="western">
            <surname>Frid</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>West</surname>
            <given-names>DP</given-names>
          </name>
          <name name-style="western">
            <surname>Yu</surname>
            <given-names>H</given-names>
          </name>
        </person-group>
        <article-title>Automatically Recognizing Medication and Adverse Event Information From Food and Drug Administration's Adverse Event Reporting System Narratives</article-title>
        <source>JMIR Med Inform</source>  
        <year>2014</year>  
        <month>06</month>  
        <day>27</day>  
        <volume>2</volume>  
        <issue>1</issue>  
        <fpage>e10</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://medinform.jmir.org/2014/1/e10/"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2196/medinform.3022</pub-id>
        <pub-id pub-id-type="medline">25600332</pub-id>
        <pub-id pub-id-type="pii">v2i1e10</pub-id>
        <pub-id pub-id-type="pmcid">PMC4288072</pub-id></nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Xu</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>Q</given-names>
          </name>
        </person-group>
        <article-title>Automatic construction of a large-scale and accurate drug-side-effect association knowledge base from biomedical literature</article-title>
        <source>J Biomed Inform</source>  
        <year>2014</year>  
        <month>10</month>  
        <volume>51</volume>  
        <fpage>191</fpage>  
        <lpage>9</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(14)00138-5"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1016/j.jbi.2014.05.013</pub-id>
        <pub-id pub-id-type="medline">24928448</pub-id>
        <pub-id pub-id-type="pii">S1532-0464(14)00138-5</pub-id>
        <pub-id pub-id-type="pmcid">PMC4589180</pub-id></nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Cai</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Hu</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Matheny</surname>
            <given-names>ME</given-names>
          </name>
          <name name-style="western">
            <surname>Sun</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Hu</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Xu</surname>
            <given-names>H</given-names>
          </name>
        </person-group>
        <article-title>Determining molecular predictors of adverse drug reactions with causality analysis based on structure learning</article-title>
        <source>J Am Med Inform Assoc</source>  
        <year>2014</year>  
        <month>03</month>  
        <volume>21</volume>  
        <issue>2</issue>  
        <fpage>245</fpage>  
        <lpage>51</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/24334612"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1136/amiajnl-2013-002051</pub-id>
        <pub-id pub-id-type="medline">24334612</pub-id>
        <pub-id pub-id-type="pii">amiajnl-2013-002051</pub-id>
        <pub-id pub-id-type="pmcid">PMC3932464</pub-id></nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Yildirim</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Majnarić</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Ekmekci</surname>
            <given-names>O</given-names>
          </name>
          <name name-style="western">
            <surname>Holzinger</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <article-title>Knowledge discovery of drug data on the example of adverse reaction prediction</article-title>
        <source>BMC Bioinformatics</source>  
        <year>2014</year>  
        <volume>15 Suppl 6</volume>  
        <fpage>S7</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/25079450"/>
        </comment>  
        <pub-id pub-id-type="medline">25079450</pub-id>
        <pub-id pub-id-type="pmcid">PMC4158658</pub-id></nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Kim</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Ohta</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Tateisi</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Tsujii</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <article-title>GENIA corpus--semantically annotated corpus for bio-textmining</article-title>
        <source>Bioinformatics</source>  
        <year>2003</year>  
        <volume>19 Suppl 1</volume>  
        <fpage>i180</fpage>  
        <lpage>2</lpage>  
        <pub-id pub-id-type="medline">12855455</pub-id></nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Doğan</surname>
            <given-names>RI</given-names>
          </name>
          <name name-style="western">
            <surname>Leaman</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Lu</surname>
            <given-names>Z</given-names>
          </name>
        </person-group>
        <article-title>NCBI disease corpus: a resource for disease name recognition and concept normalization</article-title>
        <source>J Biomed Inform</source>  
        <year>2014</year>  
        <month>02</month>  
        <volume>47</volume>  
        <fpage>1</fpage>  
        <lpage>10</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(13)00197-4"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1016/j.jbi.2013.12.006</pub-id>
        <pub-id pub-id-type="medline">24393765</pub-id>
        <pub-id pub-id-type="pii">S1532-0464(13)00197-4</pub-id>
        <pub-id pub-id-type="pmcid">PMC3951655</pub-id></nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Suominen</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Salanterä</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Velupillai</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Chapman</surname>
            <given-names>W</given-names>
          </name>
          <name name-style="western">
            <surname>Savova</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Elhadad</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Pradhan</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>South</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Mowery</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Jones</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Leveling</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Kelly</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Goeuriot</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Martinez</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Zuccon</surname>
            <given-names>G</given-names>
          </name>
        </person-group>
        <article-title>Overview of the ShARe/CLEF eHealth Evaluation Lab</article-title>
        <year>2013</year>  
        <conf-name>International Conference of the Cross-Language Evaluation Forum for European Languages</conf-name>
        <conf-date>2013</conf-date>
        <conf-loc>Berlin</conf-loc>
        <pub-id pub-id-type="doi">10.1007/978-3-642-40802-1_24</pub-id></nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Hanisch</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Fundel</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Mevissen</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Zimmer</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Fluck</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <article-title>ProMiner: rule-based protein and gene entity recognition</article-title>
        <source>BMC Bioinformatics</source>  
        <year>2005</year>  
        <volume>6 Suppl 1</volume>  
        <fpage>S14</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcbioinformatics.biomedcentral.com/articles/10.1186/1471-2105-6-S1-S14"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1186/1471-2105-6-S1-S14</pub-id>
        <pub-id pub-id-type="medline">15960826</pub-id>
        <pub-id pub-id-type="pii">1471-2105-6-S1-S14</pub-id>
        <pub-id pub-id-type="pmcid">PMC1869006</pub-id></nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Campos</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Matos</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Oliveira</surname>
            <given-names>JL</given-names>
          </name>
        </person-group>
        <article-title>Gimli: open source and high-performance biomedical name recognition</article-title>
        <source>BMC Bioinformatics</source>  
        <year>2013</year>  
        <month>02</month>  
        <day>15</day>  
        <volume>14</volume>  
        <fpage>54</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcbioinformatics.biomedcentral.com/articles/10.1186/1471-2105-14-54"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1186/1471-2105-14-54</pub-id>
        <pub-id pub-id-type="medline">23413997</pub-id>
        <pub-id pub-id-type="pii">1471-2105-14-54</pub-id>
        <pub-id pub-id-type="pmcid">PMC3651325</pub-id></nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Hsu</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Chang</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Kuo</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Lin</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Huang</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Chung</surname>
            <given-names>I</given-names>
          </name>
        </person-group>
        <article-title>Integrating high dimensional bi-directional parsing models for gene mention tagging</article-title>
        <source>Bioinformatics</source>  
        <year>2008</year>  
        <month>07</month>  
        <day>01</day>  
        <volume>24</volume>  
        <issue>13</issue>  
        <fpage>i286</fpage>  
        <lpage>94</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/18586726"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1093/bioinformatics/btn183</pub-id>
        <pub-id pub-id-type="medline">18586726</pub-id>
        <pub-id pub-id-type="pii">btn183</pub-id>
        <pub-id pub-id-type="pmcid">PMC2718659</pub-id></nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Zhou</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Su</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Shen</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Tan</surname>
            <given-names>C</given-names>
          </name>
        </person-group>
        <article-title>Recognizing names in biomedical texts: a machine learning approach</article-title>
        <source>Bioinformatics</source>  
        <year>2004</year>  
        <month>05</month>  
        <day>01</day>  
        <volume>20</volume>  
        <issue>7</issue>  
        <fpage>1178</fpage>  
        <lpage>90</lpage>  
        <pub-id pub-id-type="doi">10.1093/bioinformatics/bth060</pub-id>
        <pub-id pub-id-type="medline">14871877</pub-id>
        <pub-id pub-id-type="pii">bth060</pub-id></nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Tang</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Chen</surname>
            <given-names>Q</given-names>
          </name>
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>X</given-names>
          </name>
          <name name-style="western">
            <surname>Wu</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Jiang</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Xu</surname>
            <given-names>H</given-names>
          </name>
        </person-group>
        <article-title>Recognizing Disjoint Clinical Concepts in Clinical Text Using Machine Learning-based Methods</article-title>
        <source>AMIA Annu Symp Proc</source>  
        <year>2015</year>  
        <volume>2015</volume>  
        <fpage>1184</fpage>  
        <lpage>93</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/26958258"/>
        </comment>  
        <pub-id pub-id-type="medline">26958258</pub-id>
        <pub-id pub-id-type="pmcid">PMC4765674</pub-id></nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Lample</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Ballesteros</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Subramanian</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Kawakami</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Dyer</surname>
            <given-names>C</given-names>
          </name>
        </person-group>
        <article-title>Neural Architectures for Named Entity Recognition</article-title>
        <year>2016</year>  
        <conf-name>the 2016 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies</conf-name>
        <conf-date>2016</conf-date>
        <conf-loc>San Diego, California</conf-loc>
        <publisher-name>Association for Computational Linguistics</publisher-name>
        <pub-id pub-id-type="doi">10.18653/v1/N16-1030</pub-id></nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Yang</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Liang</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>Y</given-names>
          </name>
        </person-group>
        <article-title>Design Challenges and Misconceptions in Neural Sequence Labeling</article-title>
        <year>2018</year>  
        <conf-name>Proceedings of the 27th International Conference on Computational Linguistics</conf-name>
        <conf-date>2018</conf-date>
        <conf-loc>Santa Fe, New Mexico, USA</conf-loc>
        <fpage>3879</fpage>  
        <lpage>3889</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://aclweb.org/anthology/C18-1327"/>
        </comment></nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Uzuner</surname>
            <given-names>Ö</given-names>
          </name>
          <name name-style="western">
            <surname>South</surname>
            <given-names>BR</given-names>
          </name>
          <name name-style="western">
            <surname>Shen</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>DuVall</surname>
            <given-names>SL</given-names>
          </name>
        </person-group>
        <article-title>2010 i2b2/VA challenge on concepts, assertions, and relations in clinical text</article-title>
        <source>J Am Med Inform Assoc</source>  
        <year>2011</year>  
        <volume>18</volume>  
        <issue>5</issue>  
        <fpage>552</fpage>  
        <lpage>6</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/21685143"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1136/amiajnl-2011-000203</pub-id>
        <pub-id pub-id-type="medline">21685143</pub-id>
        <pub-id pub-id-type="pii">amiajnl-2011-000203</pub-id>
        <pub-id pub-id-type="pmcid">PMC3168320</pub-id></nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Fundel</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Küffner</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Zimmer</surname>
            <given-names>R</given-names>
          </name>
        </person-group>
        <article-title>RelEx--relation extraction using dependency parse trees</article-title>
        <source>Bioinformatics</source>  
        <year>2007</year>  
        <month>02</month>  
        <day>01</day>  
        <volume>23</volume>  
        <issue>3</issue>  
        <fpage>365</fpage>  
        <lpage>71</lpage>  
        <pub-id pub-id-type="doi">10.1093/bioinformatics/btl616</pub-id>
        <pub-id pub-id-type="medline">17142812</pub-id>
        <pub-id pub-id-type="pii">btl616</pub-id></nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Kilicoglu</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Rosemblat</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Fiszman</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Rindflesch</surname>
            <given-names>TC</given-names>
          </name>
        </person-group>
        <article-title>Sortal anaphora resolution to enhance relation extraction from biomedical literature</article-title>
        <source>BMC Bioinformatics</source>  
        <year>2016</year>  
        <month>4</month>  
        <day>14</day>  
        <volume>17</volume>  
        <issue>1</issue>  
        <pub-id pub-id-type="doi">10.1186/s12859-016-1009-6</pub-id>
        <pub-id pub-id-type="medline">27080229</pub-id></nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Lavergne</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Grouin</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Zweigenbaum</surname>
            <given-names>P</given-names>
          </name>
        </person-group>
        <article-title>The contribution of co-reference resolution to supervised relation detection between bacteria and biotopes entities</article-title>
        <source>BMC Bioinformatics</source>  
        <year>2015</year>  
        <volume>16 Suppl 10</volume>  
        <fpage>S6</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcbioinformatics.biomedcentral.com/articles/10.1186/1471-2105-16-S10-S6"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1186/1471-2105-16-S10-S6</pub-id>
        <pub-id pub-id-type="medline">26201352</pub-id>
        <pub-id pub-id-type="pii">1471-2105-16-S10-S6</pub-id>
        <pub-id pub-id-type="pmcid">PMC4511182</pub-id></nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Airola</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Pyysalo</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Björne</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Pahikkala</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Ginter</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Salakoski</surname>
            <given-names>T</given-names>
          </name>
        </person-group>
        <article-title>All-paths graph kernel for protein-protein interaction extraction with evaluation of cross-corpus learning</article-title>
        <source>BMC Bioinformatics</source>  
        <year>2008</year>  
        <month>11</month>  
        <day>19</day>  
        <volume>9 Suppl 11</volume>  
        <fpage>S2</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcbioinformatics.biomedcentral.com/articles/10.1186/1471-2105-9-S11-S2"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1186/1471-2105-9-S11-S2</pub-id>
        <pub-id pub-id-type="medline">19025688</pub-id>
        <pub-id pub-id-type="pii">1471-2105-9-S11-S2</pub-id>
        <pub-id pub-id-type="pmcid">PMC2586751</pub-id></nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Kordjamshidi</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Roth</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Moens</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Structured learning for spatial information extraction from biomedical text: bacteria biotopes</article-title>
        <source>BMC Bioinformatics</source>  
        <year>2015</year>  
        <month>04</month>  
        <day>25</day>  
        <volume>16</volume>  
        <fpage>129</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcbioinformatics.biomedcentral.com/articles/10.1186/s12859-015-0542-z"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1186/s12859-015-0542-z</pub-id>
        <pub-id pub-id-type="medline">25909637</pub-id>
        <pub-id pub-id-type="pii">10.1186/s12859-015-0542-z</pub-id>
        <pub-id pub-id-type="pmcid">PMC4426185</pub-id></nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Luo</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Cheng</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Uzuner</surname>
            <given-names>Ö</given-names>
          </name>
          <name name-style="western">
            <surname>Szolovits</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Starren</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <article-title>Segment convolutional neural networks (Seg-CNNs) for classifying relations in clinical notes</article-title>
        <source>J Am Med Inform Assoc</source>  
        <year>2018</year>  
        <month>01</month>  
        <day>01</day>  
        <volume>25</volume>  
        <issue>1</issue>  
        <fpage>93</fpage>  
        <lpage>98</lpage>  
        <pub-id pub-id-type="doi">10.1093/jamia/ocx090</pub-id>
        <pub-id pub-id-type="medline">29025149</pub-id>
        <pub-id pub-id-type="pii">4101223</pub-id></nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Verga</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Strubell</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>McCallum</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <article-title>Simultaneously Self-Attending to All Mentions for Full-Abstract Biological Relation Extraction</article-title>
        <year>2018</year>  
        <conf-name>Proceedings of the Conference of the North American Chapter of the Association for Computational Linguistics</conf-name>
        <conf-date>2018</conf-date>
        <conf-loc>New Orleans, Louisiana</conf-loc>
        <fpage>872</fpage>  
        <lpage>884</lpage>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://aclweb.org/anthology/N18-1080"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Miwa</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Bansal</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>End-to-end Relation Extraction using LSTMs on Sequences and Tree Structures</article-title>
        <year>2016</year>  
        <conf-name>Proceedings of the 54th Annual Meeting of the Association for Computational Linguistics</conf-name>
        <conf-date>2016</conf-date>
        <conf-loc>Berlin, Germany</conf-loc>
        <fpage>1105</fpage>  
        <lpage>1116</lpage>  
        <pub-id pub-id-type="doi">10.18653/v1/P16-1105</pub-id></nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Mehryary</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Hakala</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Kaewphan</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Björne</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Salakoski</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Ginter</surname>
            <given-names>F</given-names>
          </name>
        </person-group>
        <article-title>End-to-End System for Bacteria Habitat Extraction</article-title>
        <year>2017</year>  
        <conf-name>BioNLP</conf-name>
        <conf-date>2017</conf-date>
        <conf-loc>Vancouver, Canada</conf-loc>
        <fpage>80</fpage>  
        <lpage>90</lpage>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://www.aclweb.org/anthology/W17-2310"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Misra</surname>
            <given-names>I</given-names>
          </name>
          <name name-style="western">
            <surname>Shrivastava</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Gupta</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Hebert</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Cross-Stitch Networks for Multi-task Learning</article-title>
        <year>2016</year>  
        <conf-name>IEEE Conference on Computer Vision and Pattern Recognition (CVPR)</conf-name>
        <conf-date>2016</conf-date>
        <conf-loc>Las Vegas, Nevada</conf-loc>
        <fpage>3994</fpage>  
        <lpage>4003</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://openaccess.thecvf.com/content_cvpr_2016/papers/Misra_Cross-Stitch_Networks_for_CVPR_2016_paper.pdf"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1109/CVPR.2016.433</pub-id></nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Collobert</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Weston</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Bottou</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Karlen</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Kavukcuoglu</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Kuksa</surname>
            <given-names>P</given-names>
          </name>
        </person-group>
        <article-title>Natural language processing (almost) from scratch</article-title>
        <source>The Journal of Machine Learning Research</source>  
        <year>2011</year>  
        <volume>12</volume>  
        <fpage>2537</fpage>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://www.jmlr.org/papers/volume12/collobert11a/collobert11a.pdf"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Ruder</surname>
            <given-names>S</given-names>
          </name>
        </person-group>
        <source>arXiv</source>  
        <year>2017</year>  
        <access-date>2018-11-15</access-date>
        <comment>An Overview of Multi-Task Learning in Deep Neural Networks 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1706.05098">https://arxiv.org/abs/1706.05098</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="73wxJmB0m"/></comment> </nlm-citation>
      </ref>
      <ref id="ref59">
        <label>59</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Duong</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Cohn</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Bird</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Cook</surname>
            <given-names>P</given-names>
          </name>
        </person-group>
        <article-title>Low Resource Dependency Parsing: Cross-lingual Parameter Sharing in a Neural Network Parser</article-title>
        <year>2015</year>  
        <conf-name>Proceedings of the 53rd Annual Meeting of the Association for Computational Linguistics</conf-name>
        <conf-date>2015</conf-date>
        <conf-loc>Beijing, China</conf-loc>
        <fpage>845</fpage>  
        <lpage>850</lpage>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://anthology.aclweb.org/P/P15/P15-2139.pdf"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref60">
        <label>60</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Argyriou</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Evgeniou</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Pontil</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Multi-task Feature Learning</article-title>
        <year>2006</year>  
        <conf-name>Proceedings of the 19th International Conference on Neural Information Processing Systems</conf-name>
        <conf-date>2006</conf-date>
        <conf-loc>Cambridge, MA</conf-loc>
        <fpage>41</fpage>  
        <lpage>48</lpage>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://papers.nips.cc/paper/3143-multi-task-feature-learning.pdf"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref61">
        <label>61</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Hochreiter</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Schmidhuber</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <article-title>Long Short-Term Memory</article-title>
        <source>Neural Computation</source>  
        <year>1997</year>  
        <month>11</month>  
        <volume>9</volume>  
        <issue>8</issue>  
        <fpage>1735</fpage>  
        <lpage>1780</lpage>  
        <pub-id pub-id-type="doi">10.1162/neco.1997.9.8.1735</pub-id></nlm-citation>
      </ref>
      <ref id="ref62">
        <label>62</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Luong</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Pham</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Manning</surname>
            <given-names>C</given-names>
          </name>
        </person-group>
        <article-title>Effective Approaches to Attention-based Neural Machine Translation</article-title>
        <year>2015</year>  
        <conf-name>Proceedings of the Conference on Empirical Methods in Natural Language Processing</conf-name>
        <conf-date>2015</conf-date>
        <conf-loc>Lisbon, Portugal</conf-loc>
        <fpage>1412</fpage>  
        <lpage>1421</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://aclweb.org/anthology/D15-1166"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref63">
        <label>63</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Zeng</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Lai</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Zhou</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Zhao</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <article-title>Relation Classification via Convolutional Deep Neural Network</article-title>
        <year>2014</year>  
        <conf-name>Proceedings of the 25th International Conference on Computational Linguistics</conf-name>
        <conf-date>2014</conf-date>
        <conf-loc>Dublin, Ireland</conf-loc>
        <fpage>2335</fpage>  
        <lpage>2344</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://www.aclweb.org/anthology/C14-1220"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref64">
        <label>64</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Chen</surname>
            <given-names>X</given-names>
          </name>
          <name name-style="western">
            <surname>Cardie</surname>
            <given-names>C</given-names>
          </name>
        </person-group>
        <article-title>Multinomial Adversarial Networks for Multi-Domain Text Classification</article-title>
        <year>2018</year>  
        <conf-name>Proceedings of the Conference of the North American Chapter of the Association for Computational Linguistics</conf-name>
        <conf-date>2018</conf-date>
        <conf-loc>New Orleans, Louisiana</conf-loc>
        <fpage>1226</fpage>  
        <lpage>1240</lpage>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://www.aclweb.org/anthology/N18-1111"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref65">
        <label>65</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Jagannatha</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>W</given-names>
          </name>
          <name name-style="western">
            <surname>Yu</surname>
            <given-names>H</given-names>
          </name>
        </person-group>
        <article-title>Overview of the First Natural Language Processing Challenge for Extracting Medication, Indication and Adverse Drug Events from Electronic Health Record Notes (MADE1.0)</article-title>
        <source>Drug Safety</source>  
        <year>2018</year>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://bio-nlp.org/index.php/announcements/39-nlp-challenges"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref66">
        <label>66</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Chapman</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Peterson</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Alba</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>DuVall</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Patterson</surname>
            <given-names>O</given-names>
          </name>
        </person-group>
        <article-title>Hybrid system for adverse drug event detection</article-title>
        <year>2018</year>  
        <conf-name>International Workshop on Medication and Adverse Drug Event Detection</conf-name>
        <conf-date>2018</conf-date>
        <conf-loc>Worcester, MA, United States</conf-loc>
        <fpage>16</fpage>  
        <lpage>24</lpage>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://proceedings.mlr.press/v90/chapman18a/chapman18a.pdf"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref67">
        <label>67</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Xu</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Yadav</surname>
            <given-names>V</given-names>
          </name>
          <name name-style="western">
            <surname>Bethard</surname>
            <given-names>S</given-names>
          </name>
        </person-group>
        <article-title>UArizona at the MADE1.0 NLP Challenge</article-title>
        <year>2018</year>  
        <conf-name>International Workshop on Medication and Adverse Drug Event Detection</conf-name>
        <conf-date>2018</conf-date>
        <conf-loc>Worcester, MA, United States</conf-loc>
        <fpage>57</fpage>  
        <lpage>65</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://proceedings.mlr.press/v90/xu18a/xu18a.pdf"/>
        </comment></nlm-citation>
      </ref>
      <ref id="ref68">
        <label>68</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Dandala</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Joopudi</surname>
            <given-names>V</given-names>
          </name>
          <name name-style="western">
            <surname>Devarakonda</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>IBM Research System at MADE 2018: Detecting Adverse Drug Events from Electronic Health Records</article-title>
        <year>2018</year>  
        <conf-name>International Workshop on Medication and Adverse Drug Event Detection</conf-name>
        <conf-date>2018</conf-date>
        <conf-loc>Worcester, MA, United States</conf-loc>
        <fpage>39</fpage>  
        <lpage>47</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://proceedings.mlr.press/v90/dandala18a/dandala18a.pdf"/>
        </comment></nlm-citation>
      </ref>
      <ref id="ref69">
        <label>69</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Xu</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Stenner</surname>
            <given-names>SP</given-names>
          </name>
          <name name-style="western">
            <surname>Doan</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Johnson</surname>
            <given-names>KB</given-names>
          </name>
          <name name-style="western">
            <surname>Waitman</surname>
            <given-names>LR</given-names>
          </name>
          <name name-style="western">
            <surname>Denny</surname>
            <given-names>JC</given-names>
          </name>
        </person-group>
        <article-title>MedEx: a medication information extraction system for clinical narratives</article-title>
        <source>J Am Med Inform Assoc</source>  
        <year>2010</year>  
        <volume>17</volume>  
        <issue>1</issue>  
        <fpage>19</fpage>  
        <lpage>24</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://jamia.oxfordjournals.org/cgi/pmidlookup?view=long&#38;pmid=20064797"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1197/jamia.M3378</pub-id>
        <pub-id pub-id-type="medline">20064797</pub-id>
        <pub-id pub-id-type="pii">17/1/19</pub-id>
        <pub-id pub-id-type="pmcid">PMC2995636</pub-id></nlm-citation>
      </ref>
      <ref id="ref70">
        <label>70</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Pyysalo</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Ginter</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Moen</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Salakoski</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Ananiadou</surname>
            <given-names>S</given-names>
          </name>
        </person-group>
        <article-title>Distributional semantics resources for biomedical text processing</article-title>
        <year>2013</year>  
        <conf-name>the 5th International Symposium on Languages in Biology and Medicine</conf-name>
        <conf-date>2013</conf-date>
        <conf-loc>Tokyo, Japan</conf-loc>
        <fpage>39</fpage>  
        <lpage>43</lpage>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://bio.nlplab.org/pdf/pyysalo13literature.pdf"/>
        </comment> </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
