<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id>
      <journal-title>JMIR Medical Informatics</journal-title>
      <issn pub-type="epub">2291-9694</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v8i7e18417</article-id>
      <article-id pub-id-type="pmid">32459650</article-id>
      <article-id pub-id-type="doi">10.2196/18417</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Extraction of Information Related to Drug Safety Surveillance From Electronic Health Record Notes: Joint Modeling of Entities and Relations Using Knowledge-Aware Neural Attentive Models</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Lovis</surname>
            <given-names>Christian</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Muto</surname>
            <given-names>Tomoyasu </given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Doan</surname>
            <given-names>Son</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Dandala</surname>
            <given-names>Bharath</given-names>
          </name>
          <degrees>BTECH, MS, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>IBM Research</institution>
            <addr-line>1101 Kitchawan Rd</addr-line>
            <addr-line>Yorktown Heights, NY, 10598</addr-line>
            <country>United States</country>
            <phone>1 9403673972</phone>
            <email>bdand@us.ibm.com</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9643-991X</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Joopudi</surname>
            <given-names>Venkata</given-names>
          </name>
          <degrees>BTECH, MS</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8426-3219</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Tsou</surname>
            <given-names>Ching-Huei</given-names>
          </name>
          <degrees>BS, MEng, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-1273-5904</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Liang</surname>
            <given-names>Jennifer J</given-names>
          </name>
          <degrees>SB, MD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-5197-1590</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Suryanarayanan</surname>
            <given-names>Parthasarathy</given-names>
          </name>
          <degrees>BSc, BTECH</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-8619-2976</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>IBM Research</institution>
        <addr-line>Yorktown Heights, NY</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Bharath Dandala <email>bdand@us.ibm.com</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>7</month>
        <year>2020</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>10</day>
        <month>7</month>
        <year>2020</year>
      </pub-date>
      <volume>8</volume>
      <issue>7</issue>
      <elocation-id>e18417</elocation-id>
      <history>
        <date date-type="received">
          <day>25</day>
          <month>2</month>
          <year>2020</year>
        </date>
        <date date-type="rev-request">
          <day>28</day>
          <month>4</month>
          <year>2020</year>
        </date>
        <date date-type="rev-recd">
          <day>12</day>
          <month>5</month>
          <year>2020</year>
        </date>
        <date date-type="accepted">
          <day>13</day>
          <month>5</month>
          <year>2020</year>
        </date>
      </history>
      <copyright-statement>©Bharath Dandala, Venkata Joopudi, Ching-Huei Tsou, Jennifer J Liang, Parthasarathy Suryanarayanan. Originally published in JMIR Medical Informatics (http://medinform.jmir.org), 10.07.2020.</copyright-statement>
      <copyright-year>2020</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on http://medinform.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://medinform.jmir.org/2020/7/e18417" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>An adverse drug event (ADE) is commonly defined as “an injury resulting from medical intervention related to a drug.” Providing information related to ADEs and alerting caregivers at the point of care can reduce the risk of prescription and diagnostic errors and improve health outcomes. ADEs captured in structured data in electronic health records (EHRs) as either coded problems or allergies are often incomplete, leading to underreporting. Therefore, it is important to develop capabilities to process unstructured EHR data in the form of clinical notes, which contain a richer documentation of a patient’s ADE. Several natural language processing (NLP) systems have been proposed to automatically extract information related to ADEs. However, the results from these systems showed that significant improvement is still required for the automatic extraction of ADEs from clinical notes.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study aims to improve the automatic extraction of ADEs and related information such as drugs, their attributes, and reason for administration from the clinical notes of patients.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>This research was conducted using discharge summaries from the Medical Information Mart for Intensive Care III (MIMIC-III) database obtained through the 2018 National NLP Clinical Challenges (n2c2) annotated with drugs, drug attributes (ie, strength, form, frequency, route, dosage, duration), ADEs, reasons, and relations between drugs and other entities. We developed a deep learning–based system for extracting these drug-centric concepts and relations simultaneously using a joint method enhanced with contextualized embeddings, a position-attention mechanism, and knowledge representations. The joint method generated different sentence representations for each drug, which were then used to extract related concepts and relations simultaneously. Contextualized representations trained on the MIMIC-III database were used to capture context-sensitive meanings of words. The position-attention mechanism amplified the benefits of the joint method by generating sentence representations that capture long-distance relations. Knowledge representations were obtained from graph embeddings created using the US Food and Drug Administration Adverse Event Reporting System database to improve relation extraction, especially when contextual clues were insufficient.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Our system achieved new state-of-the-art results on the n2c2 data set, with significant improvements in recognizing crucial drug−reason (F1=0.650 versus F1=0.579) and drug−ADE (F1=0.490 versus F1=0.476) relations.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>This study presents a system for extracting drug-centric concepts and relations that outperformed current state-of-the-art results and shows that contextualized embeddings, position-attention mechanisms, and knowledge graph embeddings effectively improve deep learning–based concepts and relation extraction. This study demonstrates the potential for deep learning–based methods to help extract real-world evidence from unstructured patient data for drug safety surveillance.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>electronic health records</kwd>
        <kwd>adverse drug events</kwd>
        <kwd>natural language processing</kwd>
        <kwd>deep learning</kwd>
        <kwd>information extraction</kwd>
        <kwd>adverse drug reaction reporting systems</kwd>
        <kwd>named entity recognition</kwd>
        <kwd>relation extraction</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>An electronic health record (EHR) is the systematized collection of electronically stored health information of patients and the general population in a digital format [<xref ref-type="bibr" rid="ref1">1</xref>]. Clinical notes in EHRs summarize interactions that occur between patients and health care providers [<xref ref-type="bibr" rid="ref2">2</xref>]. These notes include observations, impressions, treatments, drug use, adverse drug events (ADEs), and other activities arising from each interaction between the patient and the health care system. Extracting useful information such as ADEs from these notes and alerting caregivers at the point of care has the potential to improve patient health outcomes.</p>
        <p>An ADE is commonly defined as “an injury resulting from medical intervention related to a drug” [<xref ref-type="bibr" rid="ref3">3</xref>]. ADEs are a major public health concern and one of the leading causes of morbidity and mortality [<xref ref-type="bibr" rid="ref4">4</xref>]. Studies have shown the substantial economic burden of these undesired effects [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref6">6</xref>]. Although drug safety and efficacy are tested during premarketing randomized clinical trials, these trials may not detect all ADEs because such studies are often small, short, and biased by the exclusion of patients with comorbid diseases. With the limited information available when a drug is marketed, postmarketing surveillance has become increasingly important. Spontaneous reporting systems, such as the US Food and Drug Administration Adverse Event Reporting System (FAERS) [<xref ref-type="bibr" rid="ref7">7</xref>], are monitoring mechanisms for postmarketing surveillance that enable both physicians and patients to report ADEs. However, previous studies [<xref ref-type="bibr" rid="ref8">8</xref>-<xref ref-type="bibr" rid="ref10">10</xref>] have exposed various inadequacies with such systems, including underreporting, reporting biases, and incomplete information, prompting researchers to explore additional sources to detect ADEs from real-world data.</p>
        <p>Several efforts have been made to extract ADEs automatically from disparate information sources, including EHRs [<xref ref-type="bibr" rid="ref11">11</xref>-<xref ref-type="bibr" rid="ref13">13</xref>], spontaneous reporting systems [<xref ref-type="bibr" rid="ref14">14</xref>-<xref ref-type="bibr" rid="ref16">16</xref>], social media [<xref ref-type="bibr" rid="ref17">17</xref>-<xref ref-type="bibr" rid="ref20">20</xref>], search queries on the web via search engine logs [<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref22">22</xref>], and biology and chemistry knowledge bases [<xref ref-type="bibr" rid="ref23">23</xref>-<xref ref-type="bibr" rid="ref25">25</xref>]. Furthermore, the clinical natural language processing (NLP) community has organized several open challenges such as the 2010 Informatics for Integrating Biology &#38; the Bedside/Veterans Affairs NLP Challenge [<xref ref-type="bibr" rid="ref26">26</xref>], Text Analysis Conference 2017 Adverse Drug Reactions Track [<xref ref-type="bibr" rid="ref27">27</xref>], and BioCreative V Chemical Disease Relation task [<xref ref-type="bibr" rid="ref28">28</xref>]. Recently, 2 such challenges, Medication and Adverse Drug Events from Electronic Health Records (MADE 1.0) [<xref ref-type="bibr" rid="ref29">29</xref>] and the 2018 National NLP Clinical Challenges (n2c2) Shared Task Track 2 [<xref ref-type="bibr" rid="ref30">30</xref>], were organized to extract <italic>drugs</italic>, drug attributes, <italic>ADEs</italic>, <italic>reasons</italic> for prescribing drugs, and their relations from clinical notes. The results from these 2 challenges showed that deep learning techniques outperform traditional machine learning techniques for this task, and significant improvement is still required for <italic>drug−{ADE, reason}</italic> relation extraction. Specifically, the organizers of these challenges hypothesized that models that can effectively incorporate the larger context to capture long-distance relations or leverage knowledge to capture implicit relations will likely improve the performance of future systems.</p>
        <p>Considering these conclusions, we developed a joint deep learning–based relation extraction system that helps in extracting long-distance relations through a position-attention mechanism and implicit relations through external knowledge from the FAERS. To the best of our knowledge, no previous research has been conducted on using the position-attention mechanism and domain-specific knowledge graph embeddings in ADE detection.</p>
      </sec>
      <sec>
        <title>Relevant Literature</title>
        <sec>
          <title>Adverse Drug Event Detection</title>
          <p>From the viewpoint of NLP, effective techniques for entity and relation extraction are fundamental requirements in automatic ADE extraction. Entity and relation extraction from text has traditionally been treated as a pipeline of 2 separate subtasks: named entity recognition (NER) and relation classification. Previous studies employed traditional machine learning techniques [<xref ref-type="bibr" rid="ref31">31</xref>-<xref ref-type="bibr" rid="ref34">34</xref>], such as conditional random fields (CRF) [<xref ref-type="bibr" rid="ref35">35</xref>] for NER and support vector machines [<xref ref-type="bibr" rid="ref36">36</xref>] for relation classification. Several recent approaches [<xref ref-type="bibr" rid="ref37">37</xref>-<xref ref-type="bibr" rid="ref44">44</xref>], developed on MADE 1.0 [<xref ref-type="bibr" rid="ref29">29</xref>] and 2018 n2c2 Shared Task Track 2 [<xref ref-type="bibr" rid="ref30">30</xref>] data sets, employed deep learning techniques, such as bidirectional, long short-term memory–conditional random fields (BiLSTM-CRFs) [<xref ref-type="bibr" rid="ref45">45</xref>], for NER and convolutional neural network (CNN) [<xref ref-type="bibr" rid="ref46">46</xref>] for relation classification, and showed numerous advantages resulting in better performance and less feature engineering. However, there is an inevitable error propagation issue with pipeline-based methods because of the following:</p>
          <list list-type="order">
            <list-item>
              <p>NER relying on sequence-labeling techniques suffers from lossy representation when there are overlapping annotations on entities. For example, in “she was on <italic>furosemide</italic> and became <italic>hypotensive</italic> requiring <italic>norepinephrine</italic>,” <italic>hypotensive</italic> is an <italic>ADE</italic> with respect to <italic>furosemide</italic> but a <italic>reason</italic> with respect to <italic>norepinephrine</italic>.</p>
            </list-item>
            <list-item>
              <p>NER approaches usually take an input context window that may not contain the necessary information to determine the appropriate label (ie, <italic>ADE, reason,</italic> no label). For example, in “Patient reports <italic>nausea</italic>. Started on <italic>ondansetron,</italic>” the identification of <italic>nausea</italic> as a <italic>reason</italic> requires information from both sentences.</p>
            </list-item>
            <list-item>
              <p>Signs or symptoms are only labeled as <italic>ADE</italic> or <italic>reason</italic> if they are related to a drug (ie, not all signs or symptoms in the clinical note are annotated). This makes the corpus less suitable to train an effective relation classification model as it misses negative candidate pairs for <italic>drug</italic>−{<italic>ADE, reason</italic>} relations.</p>
            </list-item>
          </list>
          <p>To address the first 2 issues, we previously proposed a joint method that outperformed the pipeline method for concept and relation extraction on a similar data set (MADE 1.0) [<xref ref-type="bibr" rid="ref37">37</xref>]. In a separate study, Li et al [<xref ref-type="bibr" rid="ref47">47</xref>] proposed a joint method using multitask learning [<xref ref-type="bibr" rid="ref48">48</xref>] and made similar observations. To address the third issue, which was introduced with the n2c2 data set, Wei et al [<xref ref-type="bibr" rid="ref38">38</xref>] proposed a novel label-encoding scheme to jointly extract <italic>ADE</italic>, <italic>reason</italic>, drug attributes, and their relations.</p>
        </sec>
        <sec>
          <title>Attention-Based Relation Extraction</title>
          <p>The attention mechanism allows neural networks to selectively focus on specific information [<xref ref-type="bibr" rid="ref49">49</xref>-<xref ref-type="bibr" rid="ref51">51</xref>]. This has proven to be effective for NLP problems with long-distance dependencies such as NER and relation extraction. Zhou et al [<xref ref-type="bibr" rid="ref52">52</xref>] proposed an attention-based BiLSTM network and demonstrated its effectiveness in selectively focusing on words that have decisive effects on relation classification. Next, Zhang et al [<xref ref-type="bibr" rid="ref53">53</xref>] extended the attention mechanism to help networks not only focus on words based on the semantic information of the sentence but also the global positions of entities within the sentence. Recently Dai et al [<xref ref-type="bibr" rid="ref54">54</xref>] introduced a position-attention mechanism for joint extraction of entities and overlapping relations. The position-attention mechanism builds on self-attention by focusing on both the global dependencies of the input and tokens of the target entities of interest for relation extraction. Recent research [<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref55">55</xref>] on ADE extraction showed the benefits of self-attention mechanisms in pipeline-based methods, specifically for relation classification. However, to the best of our knowledge, no previous work has focused on using self-attention or position-attention mechanisms for joint extraction of entities and relations for ADE extraction.</p>
        </sec>
        <sec>
          <title>Knowledge-Aware Relation Extraction</title>
          <p>Several approaches [<xref ref-type="bibr" rid="ref56">56</xref>-<xref ref-type="bibr" rid="ref59">59</xref>] in the open domain have shown that incorporating embeddings learned from knowledge bases benefit deep learning–based relation classification. These embeddings are typically learned using translation-based methods such as TransE [<xref ref-type="bibr" rid="ref60">60</xref>], TransH [<xref ref-type="bibr" rid="ref61">61</xref>], and TransR [<xref ref-type="bibr" rid="ref62">62</xref>]; walk-based methods such as DeepWalk [<xref ref-type="bibr" rid="ref63">63</xref>] and node2vec [<xref ref-type="bibr" rid="ref64">64</xref>]; or neural network–based methods such as large-scale information network embedding (LINE) [<xref ref-type="bibr" rid="ref65">65</xref>] and bipartite network embedding [<xref ref-type="bibr" rid="ref66">66</xref>].</p>
          <p>Clinical notes are typically written for medical professionals. Hence, a certain degree of medical knowledge is assumed by the authors, which is not explicitly expressed in the text. This is especially true for relations between clinical findings and drugs, where a drug could either cause (<italic>ADE</italic>) or treat (<italic>reason</italic>) a clinical finding. In our previous study [<xref ref-type="bibr" rid="ref37">37</xref>], we showed that augmenting knowledge base features such as proportional report ratio and reporting odds ratio calculated from the FAERS into deep learning models can benefit relation classification. Recently, Chen et al [<xref ref-type="bibr" rid="ref67">67</xref>] proposed a hybrid clinical NLP system by combining a general knowledge-based system using the Unified Medical Language System (UMLS) and BiLSTM-CRF for concept extraction and attention-BiLSTM for relation classification. However, to the best of our knowledge, no previous work has focused on using knowledge graph embeddings generated from the FAERS for joint extraction of entities and relations for ADE extraction.</p>
        </sec>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Data Set</title>
        <p>The n2c2 data set consists of 505 deidentified clinical narratives, of which 303 and 202 narratives were released as train and test data sets, respectively. Each narrative was manually annotated with drug-centric entities, including <italic>drugs</italic>, their attributes (<italic>strength</italic>, <italic>form</italic>, <italic>frequency</italic>, <italic>route</italic>, <italic>dosage</italic>, and <italic>duration</italic>), <italic>ADEs</italic>, <italic>reasons</italic>, and relations between drugs and other entities (<italic>drug−</italic>{attributes, <italic>ADE</italic>, <italic>reason</italic>}). <italic>Drug−</italic>{attributes} represent 6 different types of relations: <italic>drug−</italic>{<italic>strength</italic>, <italic>form</italic>, <italic>frequency</italic>, <italic>route</italic>, <italic>dosage</italic>, <italic>duration</italic>}. <xref rid="figure1" ref-type="fig">Figure 1</xref> presents an example with annotations. <xref ref-type="table" rid="table1">Tables 1</xref> and <xref ref-type="table" rid="table2">2</xref> present the statistical overview of the annotated entities and relations.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>An illustration with annotations for entities and relations. ADE: adverse drug event; HTN: hypertension; QHS: every night at bedtime.</p>
          </caption>
          <graphic xlink:href="medinform_v8i7e18417_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Entities in the data set.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="90"/>
            <col width="130"/>
            <col width="130"/>
            <col width="110"/>
            <col width="540"/>
            <thead>
              <tr valign="top">
                <td>Entity type</td>
                <td colspan="2">Number of annotations</td>
                <td>Example</td>
                <td>Description</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Train, n (%)</td>
                <td>Test, n (%)</td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Drug</td>
                <td>16,225 (31.84)</td>
                <td>10,575 (32.13)</td>
                <td>Coumadin</td>
                <td>Name of the drug</td>
              </tr>
              <tr valign="top">
                <td>Strength</td>
                <td>6691 (13.13)</td>
                <td>4230 (12.85)</td>
                <td>5 mg</td>
                <td>Strength of the drug</td>
              </tr>
              <tr valign="top">
                <td>Form</td>
                <td>6651 (13.05)</td>
                <td>4359 (13.24)</td>
                <td>Tablet</td>
                <td>Form of the drug</td>
              </tr>
              <tr valign="top">
                <td>Frequency</td>
                <td>6281 (12.32)</td>
                <td>4012 (12.19)</td>
                <td>Daily</td>
                <td>Frequency of the drug</td>
              </tr>
              <tr valign="top">
                <td>Route</td>
                <td>5476 (10.75)</td>
                <td>3513 (10.67)</td>
                <td>By mouth</td>
                <td>Route in which the drug is administered</td>
              </tr>
              <tr valign="top">
                <td>Dosage</td>
                <td>4221 (8.28)</td>
                <td>2681 (8.14)</td>
                <td>1</td>
                <td>Dosage of the drug</td>
              </tr>
              <tr valign="top">
                <td>Duration</td>
                <td>592 (1.16)</td>
                <td>378 (1.15)</td>
                <td>For 5 days</td>
                <td>Duration of the drug</td>
              </tr>
              <tr valign="top">
                <td>ADE<sup>a</sup></td>
                <td>959 (1.88)</td>
                <td>625 (1.90)</td>
                <td>Rash</td>
                <td>Adverse reaction of the drug</td>
              </tr>
              <tr valign="top">
                <td>Reason</td>
                <td>3855 (7.57)</td>
                <td>2545 (7.73)</td>
                <td>Constipation</td>
                <td>Indication if it is an affliction that a physician is actively treating with a drug</td>
              </tr>
              <tr valign="top">
                <td>Total</td>
                <td>50,951 (100.00)</td>
                <td>32,918 (100.00)</td>
                <td>N/A<sup>b</sup></td>
                <td>N/A</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>ADE: adverse drug event.</p>
            </fn>
            <fn id="table1fn2">
              <p><sup>b</sup>Not applicable.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Relations in the data set.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="120"/>
            <col width="100"/>
            <col width="100"/>
            <col width="100"/>
            <col width="100"/>
            <col width="480"/>
            <thead>
              <tr valign="top">
                <td>Relation type</td>
                <td colspan="2">Relations</td>
                <td colspan="2">Intersentential relations</td>
                <td>Example<sup>a</sup></td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Train, n (%)</td>
                <td>Test, n (%)</td>
                <td>Train, n (%)</td>
                <td>Test, n (%)</td>
                <td>
                  <break/>
                </td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Drug−strength</td>
                <td>6702 (18.44)</td>
                <td>4244 (18.09)</td>
                <td>80 (1.19)</td>
                <td>59 (1.39)</td>
                <td><italic>Lisinopril</italic> 1×<italic>5 mg</italic> tablet orally daily for 7 days</td>
              </tr>
              <tr valign="top">
                <td>Drug−form</td>
                <td>6654 (18.31)</td>
                <td>4374 (18.64)</td>
                <td>259 (3.89)</td>
                <td>144 (3.29)</td>
                <td><italic>Lisinopril</italic> 1×5 mg <italic>tablet</italic> orally daily for 7 days</td>
              </tr>
              <tr valign="top">
                <td>Drug−frequency</td>
                <td>6310 (17.36)</td>
                <td>4034 (17.19)</td>
                <td>372 (5.90)</td>
                <td>238 (5.90)</td>
                <td><italic>Lisinopril</italic> 1×5 mg tablet orally <italic>daily</italic> for 7 days</td>
              </tr>
              <tr valign="top">
                <td>Drug−route</td>
                <td>5538 (15.24)</td>
                <td>3546 (15.11)</td>
                <td>199 (3.59)</td>
                <td>149 (4.20)</td>
                <td><italic>Lisinopril</italic> 1×5 mg tablet <italic>orally</italic> daily for 7 days</td>
              </tr>
              <tr valign="top">
                <td>Drug−dosage</td>
                <td>4225 (11.62)</td>
                <td>2695 (11.49)</td>
                <td>135 (3.20)</td>
                <td>102 (3.78)</td>
                <td><italic>Lisinopril</italic><italic>1</italic>×5 mg tablet orally daily for 7 days</td>
              </tr>
              <tr valign="top">
                <td>Drug−duration</td>
                <td>643 (1.80)</td>
                <td>426 (1.80)</td>
                <td>34 (5.4)</td>
                <td>43 (10.0)</td>
                <td><italic>Lisinopril</italic> 1×5 mg tablet orally daily for <italic>7 days</italic></td>
              </tr>
              <tr valign="top">
                <td>Drug−ADE<sup>b</sup></td>
                <td>1107 (3.05)</td>
                <td>733 (3.10)</td>
                <td>254 (22.94)</td>
                <td>139 (18.9)</td>
                <td>Patient is experiencing <italic>muscle pain</italic>, secondary to <italic>statin</italic> therapy for coronary artery disease</td>
              </tr>
              <tr valign="top">
                <td>Drug−reason</td>
                <td>5169 (14.22)</td>
                <td>3410 (14.53)</td>
                <td>1638 (31.69)</td>
                <td>1088 (31.91)</td>
                <td>Patient is experiencing muscle pain, secondary to <italic>statin</italic> therapy for <italic>coronary artery disease</italic></td>
              </tr>
              <tr valign="top">
                <td>Total</td>
                <td>36,348 (100.00)</td>
                <td>23,462 (100.00)</td>
                <td>2971 (8.17)</td>
                <td>1947 (8.30)</td>
                <td>N/A<sup>c</sup></td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>Italics indicate entities participating in the specified relation type.</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>ADE: adverse drug event.</p>
            </fn>
            <fn id="table2fn3">
              <p><sup>c</sup>Not applicable.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Preprocessing</title>
        <p>Sentence boundary detection (SBD) and tokenization are often treated as solved problems in NLP and carried out using off-the-shelf toolkits such as Apache Natural Language Toolkit [<xref ref-type="bibr" rid="ref68">68</xref>], Explosion AI spaCy [<xref ref-type="bibr" rid="ref69">69</xref>] or the Stanford CoreNLP toolkit [<xref ref-type="bibr" rid="ref70">70</xref>]. However, these are still difficult and critical problems [<xref ref-type="bibr" rid="ref71">71</xref>] in the clinical domain because (1) sentence ends are frequently indicated by layout and not by punctuation and (2) white space is not always present to indicate token boundaries (eg, <italic>50 mg</italic>). To address these issues, we incorporated domain-specific rules sensitive to low-level features such as capitalization, text-wrap properties, indentation, and punctuation into the spaCy tokenizer and SBD models. These custom rules are provided in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p>
      </sec>
      <sec>
        <title>Representation Learning</title>
        <sec>
          <title>Static Word Representations</title>
          <p>Word embedding is a text vectorization technique that transforms words or subwords into vectors of real numbers. Pretrained word embeddings created using Word2Vec [<xref ref-type="bibr" rid="ref72">72</xref>], Glove [<xref ref-type="bibr" rid="ref73">73</xref>], and fastText [<xref ref-type="bibr" rid="ref74">74</xref>] have been broadly used to initialize deep learning architectures for NLP tasks and have shown substantial improvement over random initialization. Recent research [<xref ref-type="bibr" rid="ref75">75</xref>] showed that NER performance is significantly affected by the overlap between the pretrained word embedding vocabulary and the vocabulary of the target NER data set. Thus, we used Word2Vec with skip-gram to pretrain word embeddings over the Medical Information Mart for Intensive Care III (MIMIC-III) [<xref ref-type="bibr" rid="ref76">76</xref>] with the default parameters provided in a study by Mikolov et al [<xref ref-type="bibr" rid="ref72">72</xref>].</p>
        </sec>
        <sec>
          <title>Contextualized Word Representations</title>
          <p>A well-known limitation of word embedding methods is that they produce a single representation of all possible meanings of a word. To tackle these deficiencies, advanced approaches have attempted to model the word’s context into a vector representation. Embeddings from Language Models (ELMo) [<xref ref-type="bibr" rid="ref77">77</xref>] is a prominent model that generates contextualized word representations by combining the internal states of different layers in a neural language model. Bidirectional Enconder Representations from Transformers (BERT) [<xref ref-type="bibr" rid="ref78">78</xref>] furthered this idea by training bidirectional transformers [<xref ref-type="bibr" rid="ref50">50</xref>] using subwords. Contextualized embeddings are particularly useful for clinical NER as entities (eg, <italic>cold</italic> as low temperature versus infection) have different meanings in different contexts. Recent research [<xref ref-type="bibr" rid="ref79">79</xref>] showed that deep learning architectures with contextualized embeddings pretrained on a large clinical corpus achieve state-of-the-art performance on several clinical NER data sets. Inspired by these, we trained contextualized representations using ELMo on MIMIC-III. Detailed explanations of ELMo and training parameters are provided in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>.</p>
        </sec>
        <sec>
          <title>Knowledge Representations</title>
          <p>To introduce medical knowledge, we built knowledge representations on the FAERS, a database for postmarketing drug safety monitoring. Specifically, we used 2 tables from Adverse Event Open Learning through Universal Standardization (AEOLUS) [<xref ref-type="bibr" rid="ref14">14</xref>], a curated and standardized FAERS resource, to generate 2 separate graph embeddings. As shown in <xref rid="figure2" ref-type="fig">Figure 2</xref>, <italic>standard drug_outcome count</italic> contains case frequencies for drug outcomes, including <italic>ADEs</italic>, and <italic>standard drug indication count</italic> contains case frequencies for drug indications (ie, <italic>reasons)</italic>.</p>
          <p>Let <italic>G=(D,O,E)</italic> be a weighted bipartite network, where <italic>D</italic> and <italic>O</italic> denote the set of <italic>drug concept id</italic> and <italic>outcome concept id</italic> in <italic>standard drug outcome count,</italic> and <inline-graphic xlink:href="medinform_v8i7e18417_fig6.png" xlink:type="simple" mimetype="image"/> defines the interset edges. <italic>D<sub>i</sub></italic> and <italic>O<sub>j</sub></italic> denote the <italic>i<sup>th</sup></italic> and <italic>j<sup>th</sup></italic> vertex in <italic>D</italic> and <italic>O</italic> respectively, where <italic>i</italic>={1,2, … ,&#124;<italic>D</italic>&#124;} and <italic>j</italic>={1,2, … ,&#124;<italic>O</italic>&#124;}. Each edge <inline-graphic xlink:href="medinform_v8i7e18417_fig7.png" xlink:type="simple" mimetype="image"/> carries a frequency <italic>f<sub>ij</sub></italic> provided by the <italic>drug outcome pair count</italic> field in <italic>standard drug outcome count</italic>, indicating the strength between the connected vertices <italic>D<sub>i</sub></italic> and <italic>O<sub>j</sub></italic>; if <italic>D<sub>i</sub></italic> and <italic>O<sub>j</sub></italic> are not connected, <italic>f<sub>ij</sub></italic> is set to zero. To integrate this knowledge into our proposed architecture, we computed token-level embeddings by transforming <italic>G</italic> to <italic>G’</italic> as follows:</p>
          <p>Given a <italic>drug concept id</italic> (RxNorm) or <italic>outcome concept id</italic> (Medical Dictionary for Regulatory Activities) from AEOLUS, we mapped it to its concept unique identifiers (CUIs) in UMLS [<xref ref-type="bibr" rid="ref80">80</xref>] and obtained a set of tokens from all CUI variants. Let <italic>d</italic>={<italic>d<sub>1</sub>, d<sub>2</sub>, …., d<sub>L</sub></italic>} and <italic>o</italic>={<italic>o<sub>1,</sub> o<sub>2</sub>, …., o<sub>M</sub></italic>} represent all unique drug and outcome tokens obtained from mapping all <inline-graphic xlink:href="medinform_v8i7e18417_fig8.png" xlink:type="simple" mimetype="image"/> and <inline-graphic xlink:href="medinform_v8i7e18417_fig9.png" xlink:type="simple" mimetype="image"/>. Let <inline-graphic xlink:href="medinform_v8i7e18417_fig10.png" xlink:type="simple" mimetype="image"/> and <inline-graphic xlink:href="medinform_v8i7e18417_fig11.png" xlink:type="simple" mimetype="image"/> represent 2 multivalued functions that associate each element in the set of <italic>drug concept id</italic> and <italic>outcome concept id</italic> to a set of tokens. Let <italic>G’=(d,o,e)</italic> be a weighted bipartite graph and each edge <inline-graphic xlink:href="medinform_v8i7e18417_fig12.png" xlink:type="simple" mimetype="image"/> of <italic>G’</italic> is associated with a nonnegative weight <italic>w<sub>lm</sub></italic> indicating the strength between the drug token <italic>d<sub>l</sub></italic> and the outcome token <italic>o<sub>m</sub></italic>. We calculated <italic>w<sub>lm</sub></italic> as token-level co-occurrence between <italic>d<sub>l</sub></italic> and <italic>o<sub>m</sub></italic> normalized for the drug token <italic>d<sub>l</sub></italic>:</p>
          <p>
            <graphic xlink:href="medinform_v8i7e18417_fig13.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </p>
          <p>In <italic>w<sub>lm,</sub></italic> the numerator represents the sum of frequencies of all <italic>drug concept id</italic> and <italic>outcome concept id</italic> pairs that contain drug token <italic>d<sub>l</sub></italic> and outcome token <italic>o<sub>m</sub></italic> and the denominator represents the sum of frequencies of all pairs whose <italic>drug concept id</italic> contains the drug token <italic>d<sub>l</sub></italic>.</p>
          <p>From the generated bipartite weighted graph <italic>G’</italic>=(<italic>d,o,e</italic>), we used the LINE approach to generate <italic>drug-adverse</italic> knowledge embeddings. We used LINE because (1) relations between drugs and other concepts in the FAERS form a weighted bipartite graph with a long-tail distribution of vertex degrees and (2) it helps in embedding implicit connectivity relations between vertices of the same type. Similarly, we generated <italic>drug-reason</italic> knowledge embeddings from the <italic>standard drug indication count</italic> table. Detailed explanations of LINE and training parameters are provided in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>.</p>
          <fig id="figure2" position="float">
            <label>Figure 2</label>
            <caption>
              <p>Excerpts from the standard drug outcome count and standard drug indication count tables from adverse event open learning through universal standardization.</p>
            </caption>
            <graphic xlink:href="medinform_v8i7e18417_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
      </sec>
      <sec>
        <title>Architecture</title>
        <p>In the following sections, we present our system, illustrated in <xref rid="figure3" ref-type="fig">Figure 3</xref>, in an incremental fashion: <italic>joint method</italic>, <italic>contextual-joint</italic>, <italic>positional-joint</italic>, and <italic>knowledge-joint</italic>. A detailed explanation of the deep learning architecture, BiLSTM-CRF [<xref ref-type="bibr" rid="ref81">81</xref>], and input embeddings used in this system is included in the <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>.</p>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Canonical architecture of the proposed system. ADE: adverse drug event; BReason: beginning of reason annotation; CRF: conditional random field; ELMo: Embeddings from Language Models; KB: knowledge base; LSTM: long short-term memory; POS: part-of-speech.</p>
          </caption>
          <graphic xlink:href="medinform_v8i7e18417_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <sec>
          <title>Joint Method</title>
          <p>We developed a <italic>drug recognition model</italic> followed by 2 joint <italic>drug-centric relation extraction models</italic> (<italic>drug−</italic>{attributes} and <italic>drug−</italic>{<italic>ADE</italic>, <italic>reason</italic>}), as explained in the following sections.</p>
        </sec>
        <sec>
          <title>Drug Recognition Model</title>
          <p>We modeled drug recognition as a sequence-labeling task using BiLSTM-CRF and a beginning, inside, and outside of a drug mention (BIO) tagging scheme. The input layer of the BiLSTM-CRF takes word, character, and part-of-speech embeddings. The word embeddings were obtained using Word2Vec representations generated using MIMIC-III. The character and part-of-speech embeddings were initialized randomly. We used CNNs [<xref ref-type="bibr" rid="ref46">46</xref>] to encode a character-level representation for a word.</p>
        </sec>
        <sec>
          <title>Drug-Centric Relation Extraction Models</title>
          <p>To extract entities and relations jointly, we used the encoding scheme proposed in [<xref ref-type="bibr" rid="ref38">38</xref>], which takes annotated sentences and produces drug-centric sequences for a specified <italic>target-drug</italic>. For sentences containing multiple identified drugs, 1 drug-centric sequence was generated for each <italic>target-drug</italic>. For example, for the sentence in <xref rid="figure4" ref-type="fig">Figure 4</xref>, the encoding scheme produced 2 labeled sequences: one with <italic>lisinopril</italic> as the <italic>target-drug</italic> and the other with <italic>mirtazapine</italic>. In each sequence, associated entities with the <italic>target-drug</italic> were labeled using a BIO scheme enhanced with their types. Hence, for the sequence generated with <italic>lisinopril</italic> as the <italic>target-drug</italic>, only <italic>30 mg</italic> and the first <italic>QHS</italic> were labeled using B and I tags, and other entities (eg, <italic>15 mg</italic>, <italic>PO</italic>, and the second <italic>QHS</italic>) were labeled as <italic>O.</italic></p>
          <p>We trained 2 separate models with the BiLSTM-CRF to jointly recognize (1) drug attributes and <italic>drug−</italic>{attributes} relations and (2) <italic>ADE, reason</italic>, and their corresponding relations (<italic>drug−</italic>{<italic>ADE</italic>, <italic>reason</italic>}). Similar to the <italic>drug recognition model</italic>, the input layer of these models takes word, character, and part-of-speech representations, with additional positional and semantic-tag embeddings. We used the positional embedding technique introduced in [<xref ref-type="bibr" rid="ref82">82</xref>] to represent the positional distance from <italic>target-drug</italic> to each word in the input context. We used 3 different semantic tags, <italic>target-drug, duplicate-target-drug,</italic> and <italic>nontarget-drugs</italic>, to represent tokens of the current <italic>target-drug</italic>, other mentions of the same <italic>target-drug</italic>, and other drugs in the input context, respectively.</p>
          <p>To handle intersentential relations, we provided adjacent sentences as an input context to the sentence containing the <italic>target-drug</italic>. We used training data to determine the optimal input context for the 2 models empirically. For the <italic>drug−</italic>{attributes} model, we determined the optimal context as the current sentence with the <italic>target-drug</italic> and the sentences preceding and following it. For the <italic>drug−</italic>{<italic>ADE, reason</italic>} model, the optimal context was the current sentence and the 4 sentences preceding and following it.</p>
          <fig id="figure4" position="float">
            <label>Figure 4</label>
            <caption>
              <p>Label-encoding scheme used in drug-centric relation extraction models. B: beginning; I: inside; PO: orally; QHS: every night at bedtime.</p>
            </caption>
            <graphic xlink:href="medinform_v8i7e18417_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Contextual-Joint Model</title>
          <p>We obtained domain-specific contextualized representations for input contexts by pretraining ELMo on MIMIC-III. These contextualized representations were used to augment the representations used in the input layers of the models in the <italic>joint method</italic>. With the augmented input representations, we trained (1) a <italic>drug recognition </italic> <italic>model</italic> and (2) 2 <italic>drug-centric relation extraction </italic> <italic>models</italic> (<italic>drug−</italic>{attributes} and <italic>drug−</italic>{<italic>ADE, reason</italic>}).</p>
        </sec>
        <sec>
          <title>Positional-Joint Model</title>
          <p>As the task involves extraction of drug-centric entities and relations, we used the position-attention mechanism to extract entities and relations jointly with respect to an entity of interest (<italic>target-drug</italic>).</p>
          <p>Let <inline-graphic xlink:href="medinform_v8i7e18417_fig14.png" xlink:type="simple" mimetype="image"/> represent the hidden representations of an input sequence obtained from the BiLSTM layer of the <italic>contextual-joint model</italic>. Positional representations <inline-graphic xlink:href="medinform_v8i7e18417_fig15.png" xlink:type="simple" mimetype="image"/> were generated as follows:</p>
          <p>
            <graphic xlink:href="medinform_v8i7e18417_fig16.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </p>
          <p>
            <graphic xlink:href="medinform_v8i7e18417_fig17.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </p>
          <p>
            <graphic xlink:href="medinform_v8i7e18417_fig18.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </p>
          <p>where <italic>v, W<sup>p</sup>, W<sup>t</sup>, W<sup>j</sup></italic> are parameters to be learned, and <italic>s<sub>tj</sub></italic> is the score obtained through additive attention. Position-attention computes dependencies among the hidden states: (1) <italic>h<sub>p</sub></italic> at <italic>target-drug</italic> position <italic>p</italic>, (2) <italic>h<sub>j</sub></italic> at <italic>j<sup>th</sup></italic> token in the input sequence, and (3) <italic>h<sub>t</sub></italic> at current token <italic>t</italic>. For each token <italic>j, s<sub>tj</sub></italic> is computed by (1) comparing <italic>h<sub>p</sub></italic> with <italic>h<sub>j</sub></italic> and (2) comparing <italic>h<sub>t</sub></italic> with <italic>h<sub>j</sub></italic> The comparison of <italic>h<sub>p</sub></italic> and <italic>h<sub>j</sub></italic> helps to encode <italic>target-drug</italic> (positional) information, whereas the comparison of <italic>h<sub>t</sub></italic> and <italic>h<sub>j</sub></italic> is useful for matching sentence representations against itself (self-matching) to collect contextual information. <italic>a<sub>tj</sub></italic> is the attention weight produced by the normalization of <italic>s<sub>tj</sub></italic> and is used in computing the positional representation <italic>p<sub>t</sub></italic> of the current token <italic>t</italic>. Finally, we concatenated this positional representation <italic>p<sub>t</sub></italic> with its hidden representation <italic>h<sub>t</sub></italic> to obtain <italic>u<sub>t</sub>:</italic></p>
          <p>
            <graphic xlink:href="medinform_v8i7e18417_fig19.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </p>
          <p>We trained the 2 <italic>drug-centric relation extraction </italic> <italic>models</italic> (<italic>drug−</italic>{attributes} and <italic>drug−</italic>{<italic>ADE, reason</italic>}) by feeding these concatenated representations to a CRF layer. During the test phase, we used the <italic>drug recognition model</italic> from the <italic>contextual-joint</italic> for predicting <italic>drugs</italic> and the trained <italic>drug-centric relation extraction </italic> <italic>models</italic> for predicting <italic>drug−</italic>{attributes} and <italic>drug−</italic>{<italic>ADE, reason</italic>} relations.</p>
        </sec>
        <sec>
          <title>Knowledge-Joint Model</title>
          <p>As introduced earlier, background knowledge and hidden relations beyond the contextual and positional information play a crucial role in extracting <italic>drug−</italic>{<italic>ADE, reason</italic>} relations. To address this, we propose the <italic>knowledge-joint</italic> model by enhancing the <italic>positional-joint</italic> model with knowledge embeddings created using the FAERS database.</p>
          <p>Let <inline-graphic xlink:href="medinform_v8i7e18417_fig20.png" xlink:type="simple" mimetype="image"/>, <inline-graphic xlink:href="medinform_v8i7e18417_fig21.png" xlink:type="simple" mimetype="image"/> denote representations of the input sequence tokens obtained from the <italic>drug-reason</italic> and <italic>drug-adverse</italic> knowledge embeddings, respectively. Let <italic>l</italic> and <italic>m</italic> be the beginning and end indices of <italic>target-drug</italic> in the input sequence. The <italic>target-drug</italic> <italic> D<sub>r</sub></italic> and <italic>D<sub>a</sub>,</italic> corresponding to <italic>drug-reason</italic> and <italic>drug-adverse</italic> knowledge embeddings, were computed by averaging the representations of <italic>target-drug</italic> tokens:</p>
          <p>
            <graphic xlink:href="medinform_v8i7e18417_fig22.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </p>
          <p>
            <graphic xlink:href="medinform_v8i7e18417_fig23.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </p>
          <p>The <italic>target-drug</italic>–centric representations <inline-graphic xlink:href="medinform_v8i7e18417_fig24.png" xlink:type="simple" mimetype="image"/> and <inline-graphic xlink:href="medinform_v8i7e18417_fig25.png" xlink:type="simple" mimetype="image"/> were obtained by computing similarities between input sequence tokens and the <italic>target-drug</italic>:</p>
          <p>
            <graphic xlink:href="medinform_v8i7e18417_fig26.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </p>
          <p>
            <graphic xlink:href="medinform_v8i7e18417_fig27.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </p>
          <p>where <italic>w<sub>r</sub></italic> and <italic>w<sub>a</sub></italic> represent the scalar weights corresponding to <italic>drug-reason,</italic> and <italic>drug-adverse</italic> knowledge embeddings learned during training. Finally, for a token at position <italic>t</italic>, we concatenated its <italic>target-drug</italic>–centric similarities <inline-graphic xlink:href="medinform_v8i7e18417_fig28.png" xlink:type="simple" mimetype="image"/> with positional and hidden representations <italic>u<sub>t</sub></italic> to produce <italic>k<sub>t</sub></italic>:</p>
          <p>
            <graphic xlink:href="medinform_v8i7e18417_fig29.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </p>
          <p>We trained a <italic>drug-centric relation extraction </italic> <italic>model</italic> (<italic>drug−</italic>{<italic>ADE, reason</italic>}) by feeding these concatenated representations to a CRF layer. During the test phase, we used the <italic>drug recognition model</italic> from the <italic>contextual-joint</italic> model for predicting <italic>drugs</italic> and the trained <italic>drug−</italic>{<italic>ADE, reason</italic>} <italic>model</italic> for predicting <italic>drug−ADE</italic> and <italic>drug−reason</italic> relations.</p>
        </sec>
      </sec>
      <sec>
        <title>Evaluation Metrics and Significance Tests</title>
        <p>We evaluated the proposed system using the evaluation script released by the organizers of the n2c2 challenge to measure the lenient precision, recall, and F<sub>1</sub> scores, explained as follows. For NER, a predicted entity is considered as a true-positive if its span overlaps with a gold annotation and is the correct entity type. For relation extraction, a predicted relation is considered as a true-positive if both entities in the relation are true-positives and the relation type matches the gold annotation. We also report statistical significance on these results with 50,000 shuffles and a significance level set to .05 by using a test script released by the n2c2 organizers based on the approximate randomization test [<xref ref-type="bibr" rid="ref83">83</xref>].</p>
        <p>In the following sections, we present the results of our system. The experimental settings used to achieve these results are provided in <xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Named Entity Recognition</title>
        <p><xref ref-type="table" rid="table3">Table 3</xref> presents the results for each proposed incremental approach for NER. Compared with the <italic>joint method</italic>, incorporating contextualized embeddings (<italic>contextual-joint model</italic>) improved the overall microaveraged F<sub>1</sub> score by 0.3 percentage points. The improvement was mainly observed in recognizing <italic>drugs</italic> (0.6 points), with some improvements in recognizing <italic>strength</italic> and <italic>reason</italic>. Compared with the <italic>contextual-joint model</italic>, the <italic>positional-joint model</italic> improved the overall micro-F<sub>1</sub> score by 0.2 points, with significant improvements observed in identifying <italic>reason</italic> (2.1 points) and <italic>ADE</italic> (6.8 points). Compared with the <italic>positional-joint model</italic>, the <italic>knowledge-joint model</italic> further improved the overall micro-F<sub>1</sub> score by 0.1 points, with significant improvements observed in accurately determining <italic>reason</italic> (1.9 points) and <italic>ADE</italic> (1.7 points). Note that the overall improvement between the <italic>positional-joint</italic> and <italic>knowledge-joint models</italic> is relatively small due to the biased distribution of annotations, as <italic>ADE</italic> and <italic>reason</italic> together constitute less than 10% of the entities.</p>
        <p>Significance tests showed that the improvements in micro-F<sub>1</sub> score observed with each incremental approach are statistically significant with <italic>P</italic> values of .001, &#60;.001, and &#60;.001 for the <italic>contextual-joint</italic>, <italic>positional-joint,</italic> and <italic>knowledge-joint</italic> models, respectively. As the <italic>contextual-joint</italic> and <italic>positional-joint models</italic> share the same <italic>drug recognition model</italic>, we ignored drug predictions when performing significance tests. Similarly, the <italic>positional-joint</italic> and <italic>knowledge-joint</italic> models share the same <italic>drug recognition model</italic> and <italic>drug−</italic>{attributes} <italic>model;</italic> therefore, we considered only <italic>ADE</italic> and <italic>reason</italic> predictions when performing significance tests.</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Lenient precision, recall, and F1 score of the proposed approaches for named entity recognition.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="120"/>
            <col width="80"/>
            <col width="70"/>
            <col width="70"/>
            <col width="80"/>
            <col width="70"/>
            <col width="70"/>
            <col width="80"/>
            <col width="70"/>
            <col width="70"/>
            <col width="80"/>
            <col width="70"/>
            <col width="70"/>
            <thead>
              <tr valign="top">
                <td>Entity type</td>
                <td colspan="3">Joint</td>
                <td colspan="3">Contextual-joint</td>
                <td colspan="3">Positional-joint</td>
                <td colspan="3">Knowledge-joint</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Precision</td>
                <td>Recall</td>
                <td>F<sub>1</sub> score</td>
                <td>Precision</td>
                <td>Recall</td>
                <td>F<sub>1</sub> score</td>
                <td>Precision</td>
                <td>Recall</td>
                <td>F<sub>1</sub> score</td>
                <td>Precision</td>
                <td>Recall</td>
                <td>F<sub>1</sub> score</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Drug</td>
                <td>0.956</td>
                <td>0.952</td>
                <td>0.954</td>
                <td>0.956</td>
                <td>0.964</td>
                <td>0.960</td>
                <td>0.956</td>
                <td>0.964</td>
                <td>0.960</td>
                <td>0.956</td>
                <td>0.964</td>
                <td>0.960</td>
              </tr>
              <tr valign="top">
                <td>Strength</td>
                <td>0.980</td>
                <td>0.969</td>
                <td>0.974</td>
                <td>0.982</td>
                <td>0.971</td>
                <td>0.976</td>
                <td>0.985</td>
                <td>0.976</td>
                <td>0.980</td>
                <td>0.985</td>
                <td>0.976</td>
                <td>0.980</td>
              </tr>
              <tr valign="top">
                <td>Form</td>
                <td>0.974</td>
                <td>0.942</td>
                <td>0.958</td>
                <td>0.975</td>
                <td>0.939</td>
                <td>0.957</td>
                <td>0.972</td>
                <td>0.943</td>
                <td>0.958</td>
                <td>0.972</td>
                <td>0.943</td>
                <td>0.958</td>
              </tr>
              <tr valign="top">
                <td>Frequency</td>
                <td>0.981</td>
                <td>0.958</td>
                <td>0.970</td>
                <td>0.981</td>
                <td>0.958</td>
                <td>0.969</td>
                <td>0.979</td>
                <td>0.964</td>
                <td>0.971</td>
                <td>0.979</td>
                <td>0.964</td>
                <td>0.971</td>
              </tr>
              <tr valign="top">
                <td>Route</td>
                <td>0.964</td>
                <td>0.942</td>
                <td>0.953</td>
                <td>0.962</td>
                <td>0.943</td>
                <td>0.952</td>
                <td>0.950</td>
                <td>0.949</td>
                <td>0.949</td>
                <td>0.950</td>
                <td>0.949</td>
                <td>0.949</td>
              </tr>
              <tr valign="top">
                <td>Dosage</td>
                <td>0.943</td>
                <td>0.938</td>
                <td>0.941</td>
                <td>0.941</td>
                <td>0.937</td>
                <td>0.939</td>
                <td>0.936</td>
                <td>0.957</td>
                <td>0.946</td>
                <td>0.936</td>
                <td>0.957</td>
                <td>0.946</td>
              </tr>
              <tr valign="top">
                <td>Duration</td>
                <td>0.887</td>
                <td>0.788</td>
                <td>0.835</td>
                <td>0.914</td>
                <td>0.791</td>
                <td>0.848</td>
                <td>0.880</td>
                <td>0.815</td>
                <td>0.846</td>
                <td>0.880</td>
                <td>0.815</td>
                <td>0.846</td>
              </tr>
              <tr valign="top">
                <td>ADE<sup>a</sup></td>
                <td>0.649</td>
                <td>0.358</td>
                <td>0.462</td>
                <td>0.643</td>
                <td>0.346</td>
                <td>0.450</td>
                <td>0.660</td>
                <td>0.426</td>
                <td>0.518</td>
                <td>0.589</td>
                <td>0.490</td>
                <td>0.535</td>
              </tr>
              <tr valign="top">
                <td>Reason</td>
                <td>0.757</td>
                <td>0.611</td>
                <td>0.676</td>
                <td>0.747</td>
                <td>0.636</td>
                <td>0.687</td>
                <td>0.747</td>
                <td>0.672</td>
                <td>0.708</td>
                <td>0.753</td>
                <td>0.702</td>
                <td>0.727</td>
              </tr>
              <tr valign="top">
                <td>Overall (micro)</td>
                <td>0.948</td>
                <td>0.912</td>
                <td>0.929</td>
                <td>0.947</td>
                <td>0.917</td>
                <td>0.932</td>
                <td>0.943</td>
                <td>0.926</td>
                <td>0.934</td>
                <td>0.941</td>
                <td>0.930</td>
                <td>0.935</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>ADE: adverse drug event.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Relation Extraction</title>
        <p><xref ref-type="table" rid="table4">Table 4</xref> presents the results for each proposed incremental approach for relation extraction. Compared with the <italic>joint method</italic>, the <italic>contextual-joint</italic> model improved the overall micro-F1 score by 0.5 percentage points, with the majority of improvements observed in accurately recognizing <italic>drug−strength, drug−frequency, drug−reason,</italic> and <italic>drug−dosage relations</italic>. Compared with the <italic>contextual-joint model</italic>, the <italic>positional-joint model</italic> improved the F<sub>1</sub> score by 0.4 points with significant improvements observed in determining <italic>drug−ADE</italic> (5.6 points) and <italic>drug−reason</italic> (2.9 points) relations. <italic>The knowledge-joint model</italic> further improved the overall F<sub>1</sub> score by 0.1 points, with specific improvements in <italic>drug−ADE</italic> by 3.0 points and <italic>drug−reason</italic> by 1.7 points when compared with the <italic>positional-joint model</italic>. Similar to the NER significance results, significance testing for relation extraction showed that the improvements observed with each incremental approach are statistically significant with <italic>P</italic> values of &#60;.001, &#60;.001, and &#60;.001 for the <italic>contextual-joint</italic>, <italic>positional-joint</italic>, and <italic>knowledge-joint</italic> models, respectively.</p>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>Lenient precision, recall, and F1 score of the proposed approaches for relation extraction.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="130"/>
            <col width="80"/>
            <col width="70"/>
            <col width="70"/>
            <col width="0"/>
            <col width="80"/>
            <col width="70"/>
            <col width="70"/>
            <col width="0"/>
            <col width="80"/>
            <col width="70"/>
            <col width="70"/>
            <col width="0"/>
            <col width="80"/>
            <col width="60"/>
            <col width="70"/>
            <thead>
              <tr valign="top">
                <td>Relation type</td>
                <td colspan="4">Joint</td>
                <td colspan="4">Contextual-joint</td>
                <td colspan="4">Positional-joint</td>
                <td colspan="3">Knowledge-joint</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Precision</td>
                <td>Recall</td>
                <td>F<sub>1</sub> score</td>
                <td colspan="2">
                  Precision
                </td>
                <td>
                 Recall
                </td>
                <td>F<sub>1</sub> score</td>
                <td colspan="2">Precision</td>
                <td>Recall</td>
                <td>F<sub>1</sub> score</td>
                <td colspan="2">Precision</td>
                <td>Recall</td>
                <td>F<sub>1</sub> score</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Drug−strength</td>
                <td>0.966</td>
                <td>0.962</td>
                <td>0.964</td>
                <td colspan="2">0.977</td>
                <td>0.964</td>
                <td>0.971</td>
                <td colspan="2">0.978</td>
                <td>0.971</td>
                <td>0.975</td>
                <td colspan="2">0.978</td>
                <td>0.971</td>
                <td>0.975</td>
              </tr>
              <tr valign="top">
                <td>Drug−form</td>
                <td>0.963</td>
                <td>0.936</td>
                <td>0.949</td>
                <td colspan="2">0.972</td>
                <td>0.936</td>
                <td>0.953</td>
                <td colspan="2">0.969</td>
                <td>0.939</td>
                <td>0.954</td>
                <td colspan="2">0.969</td>
                <td>0.939</td>
                <td>0.954</td>
              </tr>
              <tr valign="top">
                <td>Drug−frequency</td>
                <td>0.961</td>
                <td>0.949</td>
                <td>0.955</td>
                <td colspan="2">0.972</td>
                <td>0.950</td>
                <td>0.961</td>
                <td colspan="2">0.969</td>
                <td>0.955</td>
                <td>0.962</td>
                <td colspan="2">0.969</td>
                <td>0.955</td>
                <td>0.962</td>
              </tr>
              <tr valign="top">
                <td>Drug−route</td>
                <td>0.943</td>
                <td>0.931</td>
                <td>0.937</td>
                <td colspan="2">0.954</td>
                <td>0.933</td>
                <td>0.943</td>
                <td colspan="2">0.936</td>
                <td>0.939</td>
                <td>0.937</td>
                <td colspan="2">0.936</td>
                <td>0.939</td>
                <td>0.937</td>
              </tr>
              <tr valign="top">
                <td>Drug−dosage</td>
                <td>0.921</td>
                <td>0.928</td>
                <td>0.924</td>
                <td colspan="2">0.933</td>
                <td>0.931</td>
                <td>0.932</td>
                <td colspan="2">0.925</td>
                <td>0.950</td>
                <td>0.937</td>
                <td colspan="2">0.925</td>
                <td>0.950</td>
                <td>0.937</td>
              </tr>
              <tr valign="top">
                <td>Drug−duration</td>
                <td>0.814</td>
                <td>0.718</td>
                <td>0.763</td>
                <td colspan="2">0.880</td>
                <td>0.723</td>
                <td>0.794</td>
                <td colspan="2">0.823</td>
                <td>0.739</td>
                <td>0.779</td>
                <td colspan="2">0.823</td>
                <td>0.739</td>
                <td>0.779</td>
              </tr>
              <tr valign="top">
                <td>Drug−ADE<sup>a</sup></td>
                <td>0.590</td>
                <td>0.322</td>
                <td>0.417</td>
                <td colspan="2">0.592</td>
                <td>0.307</td>
                <td>0.404</td>
                <td colspan="2">0.590</td>
                <td>0.377</td>
                <td>0.460</td>
                <td colspan="2">0.544</td>
                <td>0.446</td>
                <td>0.490</td>
              </tr>
              <tr valign="top">
                <td>Drug−reason</td>
                <td>0.682</td>
                <td>0.526</td>
                <td>0.594</td>
                <td colspan="2">0.676</td>
                <td>0.546</td>
                <td>0.604</td>
                <td colspan="2">0.680</td>
                <td>0.593</td>
                <td>0.633</td>
                <td colspan="2">0.673</td>
                <td>0.628</td>
                <td>0.650</td>
              </tr>
              <tr valign="top">
                <td>Overall (micro)</td>
                <td>0.912</td>
                <td>0.859</td>
                <td>0.885</td>
                <td colspan="2">0.920</td>
                <td>0.862</td>
                <td>0.890</td>
                <td colspan="2">0.912</td>
                <td>0.877</td>
                <td>0.894</td>
                <td colspan="2">0.906</td>
                <td>0.884</td>
                <td>0.895</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table4fn1">
              <p><sup>a</sup>ADE: adverse drug event.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>Contextualized representations (<italic>contextual-joint</italic>) are effective in differentiating between words and abbreviations that could have multiple meanings. For example, <italic>ensure</italic> and <italic>contrast</italic> can be understood as either a <italic>drug</italic> (“Ensure: 1 can PO three times daily” and “contrast-induced nephropathy”) or a verb, and terms such as <italic>blood</italic> could either refer to a drug (“transfused 1 unit of blood”), that is, substance given to a patient, a test for the drug (“blood alcohol concentration”), or a natural occurring substance in the body (“blood pressure”). Additionally, abbreviations such as <italic>PE</italic> (physical examination versus pulmonary embolism) and <italic>pcp</italic> (primary care physician versus pneumocystis pneumonia) can have multiple expansions. In all the examples above, the <italic>contextual-joint</italic> correctly identifies these entities.</p>
        <p>One prevailing challenge in ADE extraction is the presence of long-distance or intersentential relations. As shown in <xref ref-type="table" rid="table2">Table 2</xref>, a significant portion of <italic>drug</italic>−{<italic>ADE, reason</italic>} in the data set is intersentential (23% of <italic>drug</italic>−<italic>ADE</italic> and 31.7% of <italic>drug</italic>−<italic>reason</italic>). These relations typically span long distances, making them more difficult to capture. To study the effectiveness of the proposed approaches over long-distance relations, we calculated the F<sub>1</sub> scores on <italic>drug</italic>−{<italic>ADE, reason</italic>} with an increasing number of tokens between entities. As shown in <xref rid="figure5" ref-type="fig">Figure 5</xref>, we find that the positional<italic>-joint</italic> model performs significantly better than the <italic>contextual-joint</italic> model with increasing distance between entities, suggesting that the <italic>positional-joint</italic> can effectively model long-distance relations.</p>
        <p>Incorporating knowledge embeddings learned on the FAERS improved <italic>drug</italic>−{<italic>ADE, reason</italic>} relation extraction, especially in the case of long-distance relations or when contextual clues are insufficient. As shown in <xref rid="figure5" ref-type="fig">Figure 5</xref>, <italic>the knowledge-joint</italic> model further improved on the <italic>positional-joint</italic> model at all distances. The <italic>knowledge-joint</italic> model was also useful in cases of insufficient or ambiguous context in extracting the correct relation. For example, in the phrase “Wellbutrin - nausea and vomiting,” the relation is indicated only by an uninformative hyphen, with no contextual clues to indicate the type of relation. Similarly, in “Patient had history of depression and was on elavil previously,” it is unclear whether the <italic>history of depression</italic> was previously treated by <italic>drug</italic>−<italic>reason</italic> or caused by <italic>drug</italic>−<italic>ADE</italic> of the drug <italic>elavil</italic>. Furthermore, the <italic>knowledge-joint</italic> also helped to extract correct relations when multiple drugs and candidate <italic>ADEs</italic> and <italic>reasons</italic> are discussed in a given context. For example, in “Upon arrival, she was hypertensive and had a fever. She was given Tylenol<italic>,</italic>” based on sentence construction, 2 candidate <italic>reasons</italic> (<italic>hypertensive</italic> and <italic>fever</italic>) may be associated with the <italic>drug</italic> <italic>Tylenol</italic>. Knowledge is required to infer that of the two, only <italic>fever</italic> is related to <italic>Tylenol</italic>.</p>
        <fig id="figure5" position="float">
          <label>Figure 5</label>
          <caption>
            <p>F1 scores of approaches with increasing distance between entities for relation extraction. ADE: adverse drug event.</p>
          </caption>
          <graphic xlink:href="medinform_v8i7e18417_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Error Analysis</title>
        <p>We investigated the most common error categories by entity and relation type and present these in <xref ref-type="table" rid="table5">Table 5</xref>. Most of the errors in recognizing <italic>drug</italic>s were due to abbreviations, misspellings, generic terms, or linguistic shorthand. For <italic>strength</italic> and <italic>dosage</italic>, these entities were often mislabeled as each other—both are often numeric quantities and used in similar contexts. For <italic>duration</italic> and <italic>frequency</italic>, most of the errors resulted from these entities being expressed in colloquial language.</p>
        <p>Intersentential relations remain a major category of false-negative errors for all relations despite improvements from the position-attention mechanism. For <italic>drug−</italic>{attributes}, these errors were likely due to an insufficient number of such examples in the training data (approximately 4%). In addition to errors from intersentential relations, other important categories for false-negative <italic>drug−</italic>{<italic>ADE, reason</italic>} include (1) <italic>ADE</italic> or <italic>reasons</italic> expressed in generic terms, (2) <italic>reasons</italic> such as procedures and activities (eg, <italic>angioplasty/stenting</italic>) that occur infrequently in the training set<italic>,</italic> and (3) <italic>ADE</italic> or <italic>reasons</italic> expressed as abbreviations that are nonstandard or ambiguous<italic>.</italic></p>
        <p>False-positive errors in <italic>drug−</italic>{<italic>ADE</italic>, <italic>reason</italic>} mainly fall into 2 categories. In the first, one of the entities participating in the relation is negated, hypothetical, or conditional, such as when a drug is withheld to avoid an anticipated ADE (eg, contraindications). In the second, the same concept (<italic>drug</italic>, <italic>ADE</italic>, or <italic>reason</italic>) is mentioned multiple times in the same context, and the system associated the relation to one mention whereas the ground truth to the other. To add further complexity, these mentions may be synonyms, for example, “the pain medications (morphine, vicodin, codeine) worsened your mental status and made you delirious.” With multiple possible <italic>drug</italic>−<italic>ADE</italic> relations, some combinations were not captured in the ground truth, resulting in false-positives that may not be true errors.</p>
        <table-wrap position="float" id="table5">
          <label>Table 5</label>
          <caption>
            <p>Error analysis on our best-performing model (knowledge-joint).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="280"/>
            <col width="440"/>
            <col width="250"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Entity/relation, Error category</td>
                <td>Text<sup>a</sup></td>
                <td>Explanation</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="4">
                  <bold>Drug</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Abbreviation</td>
                <td>Hyponatremia due to <italic>HCTZ</italic><sup>b</sup></td>
                <td>HCTZ—abbreviated drug</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Misspelled words</td>
                <td>30 units of Lantus in addition to <italic>humalong</italic></td>
                <td>Humalog is incorrectly written as humalong</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Short forms</td>
                <td>She was given <italic>vanco</italic></td>
                <td>Vancomycin is expressed in shorthand</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Generic phrase</td>
                <td>He was advised to not take any of his <italic>blood pressure medications</italic></td>
                <td>Antihypertensives are expressed through generic terms</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>Strength</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Contextual ambiguity</td>
                <td>Patient received <italic>1 unit</italic> of <italic>blood</italic></td>
                <td><italic>Strength</italic> (<italic>1 unit</italic>) wrongly predicted as <italic>dosage</italic>; usually, the <italic>unit</italic> token is associated with <italic>dosage</italic></td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>Duration</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Colloquial language</td>
                <td>Only take <italic>Hydroxyzine</italic> <italic> as long as your rash is itching</italic></td>
                <td><italic>Duration</italic> is expressed colloquially</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>Drug</bold>
                  <bold>−</bold>
                  <bold>strength</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Intersentential</td>
                <td>Continued <italic>Carvedilol</italic>. INR<sup>c</sup> initially slightly supratherapeutic, but then his home regimen of <italic>4mg</italic> alternating with <italic>2mg</italic> daily was started</td>
                <td>Intersentential relation between carvedilol and 4 mg</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>Drug</bold>
                  <bold>−</bold>
                  <bold>ADE<sup>d</sup></bold>
                  <bold>; Drug</bold>
                  <bold>−</bold>
                  <bold>reason</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Intersentential</td>
                <td>He underwent <italic>coronary artery bypass</italic> x5, please see operative report for further details. He was transferred to the CSRU<sup>e</sup> on <italic>Neo</italic> with IABP<sup>f</sup></td>
                <td>Intersentential relation between neo and coronary artery bypass graft</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Generic terms</td>
                <td>Start a baby <italic>aspirin</italic> every day to <italic>protect the heart</italic></td>
                <td><italic>Reason</italic> is expressed in generic terms</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Abbreviation</td>
                <td><italic>Detrol</italic> was discontinued on suspicion that it might contribute to <italic>AMS</italic></td>
                <td><italic>AMS</italic> has multiple possible expansions</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Procedure</td>
                <td><italic>Angioplasty</italic> of the left tibial artery; had been on <italic>Plavix</italic> prior to NSTEMI<sup>g</sup></td>
                <td>Procedure angioplasty is annotated as <italic>reason</italic></td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Contraindication</td>
                <td>Avoiding <italic>NSAIDs</italic><sup>h</sup> to prevent <italic>gastrointestinal bleed</italic></td>
                <td><italic>Drug</italic> was not given to this patient</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Negated</td>
                <td><italic>Heparin</italic>-induced <italic>thrombocytopenia</italic> negative</td>
                <td><italic>ADE</italic> thrombocytopenia is negated</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table5fn1">
              <p><sup>a</sup>Italics indicate text that contributes to the specified error category.</p>
            </fn>
            <fn id="table5fn2">
              <p><sup>b</sup>HCTZ: hydrochlorothiazide.</p>
            </fn>
            <fn id="table5fn3">
              <p><sup>c</sup>INR: international normalized ratio.</p>
            </fn>
            <fn id="table5fn4">
              <p><sup>d</sup>ADE: adverse drug event.</p>
            </fn>
            <fn id="table5fn5">
              <p><sup>e</sup>CSRU: cardiac surgery recovery unit.</p>
            </fn>
            <fn id="table5fn6">
              <p><sup>f</sup>IABP: intra-aortic balloon pump.</p>
            </fn>
            <fn id="table5fn7">
              <p><sup>g</sup>NSTEMI: non–ST-elevation myocardial infarction.</p>
            </fn>
            <fn id="table5fn8">
              <p><sup>h</sup>NSAIDs: nonsteroidal anti-inflammatory drugs.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Document-Level Analysis</title>
        <p>From an end user perspective, the core information needed for patient care purposes is a patient-level summary of these relations, which is a unique set of extracted relations after normalization. To evaluate our system for this purpose, we measured <italic>drug−ADE</italic> and <italic>drug−reason</italic> F<sub>1</sub> scores by considering unique pairs of relation mentions at the document level, presented in <xref ref-type="table" rid="table6">Table 6</xref>. We observed scores at the document level to be 1 to 2 percentage points higher than the instance level.</p>
        <table-wrap position="float" id="table6">
          <label>Table 6</label>
          <caption>
            <p>Document-level analysis for drug−reason and drug−adverse drug event relations.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="100"/>
            <col width="90"/>
            <col width="70"/>
            <col width="80"/>
            <col width="90"/>
            <col width="60"/>
            <col width="80"/>
            <col width="80"/>
            <col width="60"/>
            <col width="70"/>
            <col width="80"/>
            <col width="60"/>
            <col width="80"/>
            <thead>
              <tr valign="top">
                <td>Model</td>
                <td colspan="6">Drug−reason</td>
                <td colspan="6">Drug−ADE<sup>a</sup></td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Instance level</td>
                <td colspan="3">Document level</td>
                <td colspan="3">Instance level</td>
                <td colspan="3">Document level</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Precision</td>
                <td>Recall</td>
                <td>F<sub>1</sub> score</td>
                <td>Precision</td>
                <td>Recall</td>
                <td>F<sub>1</sub> score</td>
                <td>Precision</td>
                <td>Recall</td>
                <td>F<sub>1</sub> score</td>
                <td>Precision</td>
                <td>Recall</td>
                <td>F<sub>1</sub> score</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Joint</td>
                <td>0.682</td>
                <td>0.526</td>
                <td>0.594</td>
                <td>0.691</td>
                <td>0.542</td>
                <td>0.607</td>
                <td>0.590</td>
                <td>0.322</td>
                <td>0.417</td>
                <td>0.631</td>
                <td>0.322</td>
                <td>0.426</td>
              </tr>
              <tr valign="top">
                <td>Contextual-joint</td>
                <td>0.675</td>
                <td>0.546</td>
                <td>0.604</td>
                <td>0.685</td>
                <td>0.560</td>
                <td>0.616</td>
                <td>0.592</td>
                <td>0.307</td>
                <td>0.404</td>
                <td>0.630</td>
                <td>0.308</td>
                <td>0.414</td>
              </tr>
              <tr valign="top">
                <td>Position-joint</td>
                <td>0.680</td>
                <td>0.593</td>
                <td>0.633</td>
                <td>0.692</td>
                <td>0.611</td>
                <td>0.649</td>
                <td>0.590</td>
                <td>0.376</td>
                <td>0.460</td>
                <td>0.647</td>
                <td>0.384</td>
                <td>0.482</td>
              </tr>
              <tr valign="top">
                <td>Knowledge-joint</td>
                <td>0.673</td>
                <td>0.628</td>
                <td>0.650</td>
                <td>0.687</td>
                <td>0.647</td>
                <td>0.666</td>
                <td>0.544</td>
                <td>0.446</td>
                <td>0.490</td>
                <td>0.579</td>
                <td>0.444</td>
                <td>0.503</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table6fn1">
              <p><sup>a</sup>ADE: adverse drug event.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Comparison With Previous Work</title>
        <p>For NER, the state-of-the-art system [<xref ref-type="bibr" rid="ref38">38</xref>] used an ensemble (committee) of 3 different methods: CRF, BiLSTM-CRF, and joint approach. They showed that the BiLSTM-CRF is the best among the single models. Thus, we compare our best model (<italic>knowledge-joint</italic>) with their best-performing single model and committee approach, as shown in <xref ref-type="table" rid="table7">Table 7</xref>. Overall, <italic>the knowledge-joint</italic> model outperformed the single model by 0.2 percentage points and achieved similar micro-F<sub>1</sub> to the committee approach. Notably, <italic>the knowledge-joint</italic> model significantly outperformed the committee approach in recognizing the crucial <italic>ADE</italic> (0.5 points) and <italic>reason</italic> (5.2 points) entities.</p>
        <p>For relation extraction, the state-of-the-art system used the committee approach for NER, convolutional neural network – recurrent neural network (CNN-RNN) for relation classification, and postprocessing rules. Although postprocessing rules are commonly used in competitions, they often do not generalize across data sets and therefore are of limited interest in this research. As shown in <xref ref-type="table" rid="table7">Table 7</xref>, <italic>the knowledge-joint model</italic> outperformed the state-of-the-art approach, both with (0.4 points) and without rules (1.6 points). Notably, <italic>the knowledge-joint</italic> model achieved the best results and outperformed the state-of-the-art in recognizing the most crucial and difficult to extract relations: <italic>drug−reason</italic> (7.1 points) and <italic>drug−ADE</italic> (1.4 points).</p>
        <table-wrap position="float" id="table7">
          <label>Table 7</label>
          <caption>
            <p>The lenient F1 scores for named entity recognition of single and state-of-the-art ensemble models compared with our best model. The lenient F1 scores for relation extraction of state-of-the-art ensemble models with and without rules, compared with our best model.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="100"/>
            <col width="130"/>
            <col width="140"/>
            <col width="130"/>
            <col width="0"/>
            <col width="160"/>
            <col width="110"/>
            <col width="110"/>
            <col width="120"/>
            <thead>
              <tr valign="top">
                <td colspan="5">NER<sup>a</sup></td>
                <td colspan="4">Relation extraction</td>
              </tr>
              <tr valign="top">
                <td>Entity type</td>
                <td>BiLSTM-CRF<sup>b</sup> [<xref ref-type="bibr" rid="ref38">38</xref>]</td>
                <td>Committee [<xref ref-type="bibr" rid="ref38">38</xref>]</td>
                <td>Knowledge-joint</td>
                <td colspan="2">Relation type</td>
                <td>Committee + CNN-RNN<sup>c</sup> [<xref ref-type="bibr" rid="ref38">38</xref>]</td>
                <td>Committee + CNN-RNN + Rules [<xref ref-type="bibr" rid="ref38">38</xref>]</td>
                <td>Knowledge-joint</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Drug</td>
                <td>0.955</td>
                <td>0.956</td>
                <td>0.960</td>
                <td colspan="2">N/A<sup>d</sup></td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
              </tr>
              <tr valign="top">
                <td>Strength</td>
                <td>0.982</td>
                <td>0.983</td>
                <td>0.980</td>
                <td colspan="2">Drug−strength</td>
                <td>0.964</td>
                <td>0.972</td>
                <td>0.975</td>
              </tr>
              <tr valign="top">
                <td>Form</td>
                <td>0.958</td>
                <td>0.958</td>
                <td>0.958</td>
                <td colspan="2">Drug−form</td>
                <td>0.940</td>
                <td>0.952</td>
                <td>0.954</td>
              </tr>
              <tr valign="top">
                <td>Frequency</td>
                <td>0.974</td>
                <td>0.975</td>
                <td>0.971</td>
                <td colspan="2">Drug−frequency</td>
                <td>0.941</td>
                <td>0.958</td>
                <td>0.962</td>
              </tr>
              <tr valign="top">
                <td>Route</td>
                <td>0.956</td>
                <td>0.956</td>
                <td>0.949</td>
                <td colspan="2">Drug−route</td>
                <td>0.930</td>
                <td>0.942</td>
                <td>0.937</td>
              </tr>
              <tr valign="top">
                <td>Dosage</td>
                <td>0.943</td>
                <td>0.948</td>
                <td>0.946</td>
                <td colspan="2">Drug−dosage</td>
                <td>0.923</td>
                <td>0.935</td>
                <td>0.937</td>
              </tr>
              <tr valign="top">
                <td>Duration</td>
                <td>0.856</td>
                <td>0.862</td>
                <td>0.846</td>
                <td colspan="2">Drug−duration</td>
                <td>0.740</td>
                <td>0.786</td>
                <td>0.779</td>
              </tr>
              <tr valign="top">
                <td>ADE<sup>e</sup></td>
                <td>0.422</td>
                <td>0.530</td>
                <td>0.535</td>
                <td colspan="2">Drug−ADE</td>
                <td>0.475</td>
                <td>0.476</td>
                <td>0.490</td>
              </tr>
              <tr valign="top">
                <td>Reason</td>
                <td>0.680</td>
                <td>0.675</td>
                <td>0.727</td>
                <td colspan="2">Drug−reason</td>
                <td>0.572</td>
                <td>0.579</td>
                <td>0.650</td>
              </tr>
              <tr valign="top">
                <td>Overall (micro)</td>
                <td>0.933</td>
                <td>0.935</td>
                <td>0.935</td>
                <td colspan="2">Overall (micro)</td>
                <td>0.879</td>
                <td>0.891</td>
                <td>0.895</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table7fn1">
              <p><sup>a</sup>NER: named entity recognition.</p>
            </fn>
            <fn id="table7fn2">
              <p><sup>b</sup>BiLSTM-CRF: bidirectional long short-term memory–conditional random field.</p>
            </fn>
            <fn id="table7fn3">
              <p><sup>c</sup>CNN-RNN: convolutional neural network–recurrent neural network.</p>
            </fn>
            <fn id="table7fn4">
              <p><sup>d</sup>Not applicable.</p>
            </fn>
            <fn id="table7fn5">
              <p><sup>e</sup>ADE: adverse drug event.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Limitations and Future Work</title>
        <p>We acknowledge several limitations of this study. First, these results are specific to the n2c2 data set, which contains only intensive care unit (ICU) discharge summaries from a single health care organization. Ground truth generation and evaluation on a more diverse data set is needed to better understand the effectiveness of these proposed approaches. Second, we observed some annotation errors in the ground truth, likely due to the complex nature of the task. Further investigation is needed to quantify the prevalence of such errors and their impact on the results.</p>
        <p>Despite achieving state-of-the-art results, the proposed system still has room for improvement, specifically in recognizing intersentential <italic>drug</italic>−{<italic>ADE</italic>, <italic>reason</italic>} relations. To further improve ADE extraction, we plan to explore the following research areas:</p>
        <list list-type="order">
          <list-item>
            <p>Although we incorporated knowledge graph embeddings, other advanced methods that use higher-order proximity and role-preserving network embedding techniques have shown promising results in the general domain. We plan to explore methods such as Edge Label Aware Network Embedding [<xref ref-type="bibr" rid="ref84">84</xref>] rather than training separate graph embeddings for <italic>drug−{ADE, reason}</italic> relations.</p>
          </list-item>
          <list-item>
            <p>The field of contextual embeddings has evolved quickly along with the release of newer language representation models trained on clinical text. We plan to explore BERT [<xref ref-type="bibr" rid="ref78">78</xref>,<xref ref-type="bibr" rid="ref85">85</xref>], which utilizes a transformer network to pretrain a language model for extracting better contextual word embeddings.</p>
          </list-item>
          <list-item>
            <p>To address some of the findings from the error analysis, we plan to leverage our clinical abbreviation expansion components [<xref ref-type="bibr" rid="ref86">86</xref>] to help resolve ambiguous mentions and also incorporate assertion recognition [<xref ref-type="bibr" rid="ref26">26</xref>] to capture the belief state of the physician on a concept (negated, hypothetical, conditional).</p>
          </list-item>
          <list-item>
            <p>As mentioned earlier, the proposed models performed poorly on intersentential relation extraction. To address this, we plan to explore N-ary relation extraction for cross-sentence relation extraction using graph long short-term memory networks [<xref ref-type="bibr" rid="ref87">87</xref>].</p>
          </list-item>
        </list>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>We presented a system for extracting drug-centric concepts and relations that outperformed current state-of-the-art results. Experimental results showed that contextualized embeddings, position-attention mechanisms, and knowledge embeddings effectively improve deep learning-based concepts and relation extraction. Specifically, we showed the effectiveness of a position-attention mechanism in extracting long-distance relations and knowledge embeddings from the FAERS in recognizing relations where contextual clues are insufficient.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Sentence segmentation and tokenization.</p>
        <media xlink:href="medinform_v8i7e18417_app1.pdf" xlink:title="PDF File  (Adobe PDF File), 392 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>Embeddings from Language Models contextualized embeddings and large-scale information network embedding graph embeddings.</p>
        <media xlink:href="medinform_v8i7e18417_app2.pdf" xlink:title="PDF File  (Adobe PDF File), 142 KB"/>
      </supplementary-material>
      <supplementary-material id="app3">
        <label>Multimedia Appendix 3</label>
        <p>Detailed explanation of bidirectional long short-term memory–conditional random fields and input embeddings.</p>
        <media xlink:href="medinform_v8i7e18417_app3.pdf" xlink:title="PDF File  (Adobe PDF File), 369 KB"/>
      </supplementary-material>
      <supplementary-material id="app4">
        <label>Multimedia Appendix 4</label>
        <p>Experimental settings used in the proposed system.</p>
        <media xlink:href="medinform_v8i7e18417_app4.pdf" xlink:title="PDF File  (Adobe PDF File), 106 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">ADE</term>
          <def>
            <p>adverse drug event</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">AEOLUS</term>
          <def>
            <p>adverse event open learning through universal standardization</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">BERT</term>
          <def>
            <p>Bidirectional Enconder Representations from Transformers</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">BiLSTM-CRF</term>
          <def>
            <p>bidirectional, long short-term memory–conditional random fields</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">BIO</term>
          <def>
            <p>beginning, inside, and outside</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">CNN</term>
          <def>
            <p>convolutional neural network</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">CRF</term>
          <def>
            <p>conditional random field</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">CUI</term>
          <def>
            <p>concept unique identifier</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">EHR</term>
          <def>
            <p>electronic health record</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">ELMo</term>
          <def>
            <p>Embeddings from Language Models</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">FAERS</term>
          <def>
            <p>Food and Drug Administration Adverse Event Reporting System</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb12">LINE</term>
          <def>
            <p>large-scale information network embedding</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb13">MADE 1.0</term>
          <def>
            <p>Medication and Adverse Drug Events from Electronic Health Records</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb14">MIMIC-III</term>
          <def>
            <p>Medical Information Mart for Intensive Care III</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb15">n2c2</term>
          <def>
            <p>2018 National NLP Clinical Challenges</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb16">NER</term>
          <def>
            <p>named entity recognition</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb17">NLP</term>
          <def>
            <p>natural language processing</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb18">SBD</term>
          <def>
            <p>sentence boundary detection</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb19">UMLS</term>
          <def>
            <p>Unified Medical Language System</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>The authors wish to thank Dr Kenneth J Barker for his assistance in providing valuable feedback on the manuscript.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gunter</surname>
              <given-names>TD</given-names>
            </name>
            <name name-style="western">
              <surname>Terry</surname>
              <given-names>NP</given-names>
            </name>
          </person-group>
          <article-title>The emergence of national electronic health record architectures in the United States and Australia: models, costs, and questions</article-title>
          <source>J Med Internet Res</source>
          <year>2005</year>
          <month>03</month>
          <day>14</day>
          <volume>7</volume>
          <issue>1</issue>
          <fpage>e3</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2005/1/e3/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.7.1.e3</pub-id>
          <pub-id pub-id-type="medline">15829475</pub-id>
          <pub-id pub-id-type="pii">v7e3</pub-id>
          <pub-id pub-id-type="pmcid">PMC1550638</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rosenbloom</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Stead</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Denny</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Giuse</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Lorenzi</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Brown</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Generating clinical notes for electronic health record systems</article-title>
          <source>Appl Clin Inform</source>
          <year>2010</year>
          <month>01</month>
          <day>1</day>
          <volume>1</volume>
          <issue>3</issue>
          <fpage>232</fpage>
          <lpage>43</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/21031148"/>
          </comment>
          <pub-id pub-id-type="doi">10.4338/ACI-2010-03-RA-0019</pub-id>
          <pub-id pub-id-type="medline">21031148</pub-id>
          <pub-id pub-id-type="pmcid">PMC2963994</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bates</surname>
              <given-names>DW</given-names>
            </name>
            <name name-style="western">
              <surname>Cullen</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Laird</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Petersen</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Small</surname>
              <given-names>SD</given-names>
            </name>
            <name name-style="western">
              <surname>Servi</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Laffel</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Sweitzer</surname>
              <given-names>BJ</given-names>
            </name>
            <name name-style="western">
              <surname>Shea</surname>
              <given-names>BF</given-names>
            </name>
            <name name-style="western">
              <surname>Hallisey</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Incidence of adverse drug events and potential adverse drug events. Implications for prevention. ADE prevention study group</article-title>
          <source>J Am Med Assoc</source>
          <year>1995</year>
          <month>07</month>
          <day>5</day>
          <volume>274</volume>
          <issue>1</issue>
          <fpage>29</fpage>
          <lpage>34</lpage>
          <pub-id pub-id-type="medline">7791255</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Bootman</surname>
              <given-names>JL</given-names>
            </name>
          </person-group>
          <article-title>Drug-related morbidity and mortality. A cost-of-illness model</article-title>
          <source>Arch Intern Med</source>
          <year>1995</year>
          <month>10</month>
          <day>9</day>
          <volume>155</volume>
          <issue>18</issue>
          <fpage>1949</fpage>
          <lpage>56</lpage>
          <pub-id pub-id-type="medline">7575048</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Classen</surname>
              <given-names>DC</given-names>
            </name>
            <name name-style="western">
              <surname>Pestotnik</surname>
              <given-names>SL</given-names>
            </name>
            <name name-style="western">
              <surname>Evans</surname>
              <given-names>RS</given-names>
            </name>
            <name name-style="western">
              <surname>Lloyd</surname>
              <given-names>JF</given-names>
            </name>
            <name name-style="western">
              <surname>Burke</surname>
              <given-names>JP</given-names>
            </name>
          </person-group>
          <article-title>Adverse drug events in hospitalized patients. Excess length of stay, extra costs, and attributable mortality</article-title>
          <source>J Am Med Assoc</source>
          <year>1997</year>
          <volume>277</volume>
          <issue>4</issue>
          <fpage>301</fpage>
          <lpage>6</lpage>
          <pub-id pub-id-type="medline">9002492</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chiatti</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Bustacchini</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Furneri</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Mantovani</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Cristiani</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Misuraca</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lattanzio</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>The economic burden of inappropriate drug prescribing, lack of adherence and compliance, adverse drug events in older people: a systematic review</article-title>
          <source>Drug Saf</source>
          <year>2012</year>
          <month>01</month>
          <volume>35</volume>
          <issue>Suppl 1</issue>
          <fpage>73</fpage>
          <lpage>87</lpage>
          <pub-id pub-id-type="doi">10.1007/BF03319105</pub-id>
          <pub-id pub-id-type="medline">23446788</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ahmad</surname>
              <given-names>SR</given-names>
            </name>
          </person-group>
          <article-title>Adverse drug event monitoring at the Food and Drug Administration</article-title>
          <source>J Gen Intern Med</source>
          <year>2003</year>
          <month>01</month>
          <volume>18</volume>
          <issue>1</issue>
          <fpage>57</fpage>
          <lpage>60</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://onlinelibrary.wiley.com/resolve/openurl?genre=article&#38;sid=nlm:pubmed&#38;issn=0884-8734&#38;date=2003&#38;volume=18&#38;issue=1&#38;spage=57"/>
          </comment>
          <pub-id pub-id-type="doi">10.1046/j.1525-1497.2003.20130.x</pub-id>
          <pub-id pub-id-type="medline">12534765</pub-id>
          <pub-id pub-id-type="pii">jgi20130</pub-id>
          <pub-id pub-id-type="pmcid">PMC1494803</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hazell</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Shakir</surname>
              <given-names>SA</given-names>
            </name>
          </person-group>
          <article-title>Under-reporting of adverse drug reactions: a systematic review</article-title>
          <source>Drug Saf</source>
          <year>2006</year>
          <volume>29</volume>
          <issue>5</issue>
          <fpage>385</fpage>
          <lpage>96</lpage>
          <pub-id pub-id-type="doi">10.2165/00002018-200629050-00003</pub-id>
          <pub-id pub-id-type="medline">16689555</pub-id>
          <pub-id pub-id-type="pii">2953</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tatonetti</surname>
              <given-names>NP</given-names>
            </name>
            <name name-style="western">
              <surname>Fernald</surname>
              <given-names>GH</given-names>
            </name>
            <name name-style="western">
              <surname>Altman</surname>
              <given-names>RB</given-names>
            </name>
          </person-group>
          <article-title>A novel signal detection algorithm for identifying hidden drug-drug interactions in adverse event reports</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2012</year>
          <volume>19</volume>
          <issue>1</issue>
          <fpage>79</fpage>
          <lpage>85</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/21676938"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/amiajnl-2011-000214</pub-id>
          <pub-id pub-id-type="medline">21676938</pub-id>
          <pub-id pub-id-type="pii">amiajnl-2011-000214</pub-id>
          <pub-id pub-id-type="pmcid">PMC3240755</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pirmohamed</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>James</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Meakin</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Green</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Scott</surname>
              <given-names>AK</given-names>
            </name>
            <name name-style="western">
              <surname>Walley</surname>
              <given-names>TJ</given-names>
            </name>
            <name name-style="western">
              <surname>Farrar</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>BK</given-names>
            </name>
            <name name-style="western">
              <surname>Breckenridge</surname>
              <given-names>AM</given-names>
            </name>
          </person-group>
          <article-title>Adverse drug reactions as cause of admission to hospital: prospective analysis of 18 820 patients</article-title>
          <source>Br Med J</source>
          <year>2004</year>
          <month>07</month>
          <day>3</day>
          <volume>329</volume>
          <issue>7456</issue>
          <fpage>15</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/15231615"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmj.329.7456.15</pub-id>
          <pub-id pub-id-type="medline">15231615</pub-id>
          <pub-id pub-id-type="pii">329/7456/15</pub-id>
          <pub-id pub-id-type="pmcid">PMC443443</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Haerian</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Varn</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Vaidya</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ena</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Chase</surname>
              <given-names>HS</given-names>
            </name>
            <name name-style="western">
              <surname>Friedman</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Detection of pharmacovigilance-related adverse events using electronic health records and automated methods</article-title>
          <source>Clin Pharmacol Ther</source>
          <year>2012</year>
          <month>08</month>
          <volume>92</volume>
          <issue>2</issue>
          <fpage>228</fpage>
          <lpage>34</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/22713699"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/clpt.2012.54</pub-id>
          <pub-id pub-id-type="medline">22713699</pub-id>
          <pub-id pub-id-type="pii">clpt201254</pub-id>
          <pub-id pub-id-type="pmcid">PMC3685297</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lependu</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Iyer</surname>
              <given-names>SV</given-names>
            </name>
            <name name-style="western">
              <surname>Fairon</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>NH</given-names>
            </name>
          </person-group>
          <article-title>Annotation analysis for testing drug safety signals using unstructured clinical notes</article-title>
          <source>J Biomed Semantics</source>
          <year>2012</year>
          <month>04</month>
          <day>24</day>
          <volume>3</volume>
          <issue>Suppl 1</issue>
          <fpage>S5</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://jbiomedsem.biomedcentral.com/articles/10.1186/2041-1480-3-S1-S5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/2041-1480-3-S1-S5</pub-id>
          <pub-id pub-id-type="medline">22541596</pub-id>
          <pub-id pub-id-type="pii">2041-1480-3-S1-S5</pub-id>
          <pub-id pub-id-type="pmcid">PMC3337270</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>LePendu</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Iyer</surname>
              <given-names>SV</given-names>
            </name>
            <name name-style="western">
              <surname>Bauer-Mehren</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Harpaz</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Mortensen</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Podchiyska</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ferris</surname>
              <given-names>TA</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>NH</given-names>
            </name>
          </person-group>
          <article-title>Pharmacovigilance using clinical notes</article-title>
          <source>Clin Pharmacol Ther</source>
          <year>2013</year>
          <month>06</month>
          <volume>93</volume>
          <issue>6</issue>
          <fpage>547</fpage>
          <lpage>55</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/23571773"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/clpt.2013.47</pub-id>
          <pub-id pub-id-type="medline">23571773</pub-id>
          <pub-id pub-id-type="pii">clpt201347</pub-id>
          <pub-id pub-id-type="pmcid">PMC3846296</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Banda</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Evans</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Vanguri</surname>
              <given-names>RS</given-names>
            </name>
            <name name-style="western">
              <surname>Tatonetti</surname>
              <given-names>NP</given-names>
            </name>
            <name name-style="western">
              <surname>Ryan</surname>
              <given-names>PB</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>NH</given-names>
            </name>
          </person-group>
          <article-title>A curated and standardized adverse drug event resource to accelerate drug safety research</article-title>
          <source>Sci Data</source>
          <year>2016</year>
          <month>05</month>
          <day>10</day>
          <volume>3</volume>
          <fpage>160026</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/27193236"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/sdata.2016.26</pub-id>
          <pub-id pub-id-type="medline">27193236</pub-id>
          <pub-id pub-id-type="pii">sdata201626</pub-id>
          <pub-id pub-id-type="pmcid">PMC4872271</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Harpaz</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>DuMouchel</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>NH</given-names>
            </name>
            <name name-style="western">
              <surname>Madigan</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Ryan</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Friedman</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Novel data-mining methodologies for adverse drug event discovery and analysis</article-title>
          <source>Clin Pharmacol Ther</source>
          <year>2012</year>
          <month>06</month>
          <volume>91</volume>
          <issue>6</issue>
          <fpage>1010</fpage>
          <lpage>21</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/22549283"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/clpt.2012.50</pub-id>
          <pub-id pub-id-type="medline">22549283</pub-id>
          <pub-id pub-id-type="pii">clpt201250</pub-id>
          <pub-id pub-id-type="pmcid">PMC3675775</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Stang</surname>
              <given-names>PE</given-names>
            </name>
            <name name-style="western">
              <surname>Ryan</surname>
              <given-names>PB</given-names>
            </name>
            <name name-style="western">
              <surname>Racoosin</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Overhage</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Hartzema</surname>
              <given-names>AG</given-names>
            </name>
            <name name-style="western">
              <surname>Reich</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Welebob</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Scarnecchia</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Woodcock</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Advancing the science for active surveillance: rationale and design for the observational medical outcomes partnership</article-title>
          <source>Ann Intern Med</source>
          <year>2010</year>
          <month>11</month>
          <day>2</day>
          <volume>153</volume>
          <issue>9</issue>
          <fpage>600</fpage>
          <lpage>6</lpage>
          <pub-id pub-id-type="doi">10.7326/0003-4819-153-9-201011020-00010</pub-id>
          <pub-id pub-id-type="medline">21041580</pub-id>
          <pub-id pub-id-type="pii">153/9/600</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sarker</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ginn</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Nikfarjam</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>O'Connor</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Jayaraman</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Upadhaya</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Gonzalez</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Utilizing social media data for pharmacovigilance: a review</article-title>
          <source>J Biomed Inform</source>
          <year>2015</year>
          <month>04</month>
          <volume>54</volume>
          <fpage>202</fpage>
          <lpage>12</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(15)00036-2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2015.02.004</pub-id>
          <pub-id pub-id-type="medline">25720841</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(15)00036-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC4408239</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nikfarjam</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sarker</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>O'Connor</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Ginn</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Gonzalez</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Pharmacovigilance from social media: mining adverse drug reaction mentions using sequence labeling with word embedding cluster features</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2015</year>
          <month>05</month>
          <volume>22</volume>
          <issue>3</issue>
          <fpage>671</fpage>
          <lpage>81</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/25755127"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocu041</pub-id>
          <pub-id pub-id-type="medline">25755127</pub-id>
          <pub-id pub-id-type="pii">ocu041</pub-id>
          <pub-id pub-id-type="pmcid">PMC4457113</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Freifeld</surname>
              <given-names>CC</given-names>
            </name>
            <name name-style="western">
              <surname>Brownstein</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Menone</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Bao</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Filice</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Kass-Hout</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Dasgupta</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Digital drug safety surveillance: monitoring pharmaceutical products in Twitter</article-title>
          <source>Drug Saf</source>
          <year>2014</year>
          <month>05</month>
          <volume>37</volume>
          <issue>5</issue>
          <fpage>343</fpage>
          <lpage>50</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/24777653"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s40264-014-0155-x</pub-id>
          <pub-id pub-id-type="medline">24777653</pub-id>
          <pub-id pub-id-type="pmcid">PMC4013443</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Harpaz</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Callahan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Tamang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Low</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Odgers</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Finlayson</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Jung</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>LePendu</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>NH</given-names>
            </name>
          </person-group>
          <article-title>Text mining for adverse drug events: the promise, challenges, and state of the art</article-title>
          <source>Drug Saf</source>
          <year>2014</year>
          <month>10</month>
          <volume>37</volume>
          <issue>10</issue>
          <fpage>777</fpage>
          <lpage>90</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/25151493"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s40264-014-0218-z</pub-id>
          <pub-id pub-id-type="medline">25151493</pub-id>
          <pub-id pub-id-type="pmcid">PMC4217510</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Odgers</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Harpaz</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Callahan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Stiglic</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Analyzing search behavior of healthcare professionals for drug safety surveillance</article-title>
          <source>Biocomputing</source>
          <year>2014</year>
          <issue>2014</issue>
          <fpage>306</fpage>
          <lpage>317</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC4299876/"/>
          </comment>
          <pub-id pub-id-type="doi">10.1142/9789814644730_0030</pub-id>
          <pub-id pub-id-type="pmcid">PMC4299876</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>White</surname>
              <given-names>RW</given-names>
            </name>
            <name name-style="western">
              <surname>Harpaz</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>NH</given-names>
            </name>
            <name name-style="western">
              <surname>DuMouchel</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Horvitz</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Toward enhanced pharmacovigilance using patient-generated data on the internet</article-title>
          <source>Clin Pharmacol Ther</source>
          <year>2014</year>
          <month>08</month>
          <volume>96</volume>
          <issue>2</issue>
          <fpage>239</fpage>
          <lpage>46</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/24713590"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/clpt.2014.77</pub-id>
          <pub-id pub-id-type="medline">24713590</pub-id>
          <pub-id pub-id-type="pii">clpt201477</pub-id>
          <pub-id pub-id-type="pmcid">PMC4111778</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Abernethy</surname>
              <given-names>DR</given-names>
            </name>
            <name name-style="western">
              <surname>Woodcock</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lesko</surname>
              <given-names>LJ</given-names>
            </name>
          </person-group>
          <article-title>Pharmacological mechanism-based drug safety assessment and prediction</article-title>
          <source>Clin Pharmacol Ther</source>
          <year>2011</year>
          <month>06</month>
          <volume>89</volume>
          <issue>6</issue>
          <fpage>793</fpage>
          <lpage>7</lpage>
          <pub-id pub-id-type="doi">10.1038/clpt.2011.55</pub-id>
          <pub-id pub-id-type="medline">21490594</pub-id>
          <pub-id pub-id-type="pii">clpt201155</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chiang</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Butte</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Data-driven methods to discover molecular determinants of serious adverse drug events</article-title>
          <source>Clin Pharmacol Ther</source>
          <year>2009</year>
          <month>03</month>
          <volume>85</volume>
          <issue>3</issue>
          <fpage>259</fpage>
          <lpage>68</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/19177064"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/clpt.2008.274</pub-id>
          <pub-id pub-id-type="medline">19177064</pub-id>
          <pub-id pub-id-type="pii">clpt2008274</pub-id>
          <pub-id pub-id-type="pmcid">PMC2726746</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vilar</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Harpaz</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Chase</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Costanzi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Rabadan</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Friedman</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Facilitating adverse drug event detection in pharmacovigilance databases using molecular structure similarity: application to rhabdomyolysis</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2011</year>
          <month>12</month>
          <volume>18</volume>
          <issue>Suppl 1</issue>
          <fpage>i73</fpage>
          <lpage>80</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/21946238"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/amiajnl-2011-000417</pub-id>
          <pub-id pub-id-type="medline">21946238</pub-id>
          <pub-id pub-id-type="pii">amiajnl-2011-000417</pub-id>
          <pub-id pub-id-type="pmcid">PMC3241177</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Uzuner</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>South</surname>
              <given-names>BR</given-names>
            </name>
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>DuVall</surname>
              <given-names>SL</given-names>
            </name>
          </person-group>
          <article-title>2010 i2b2/VA challenge on concepts, assertions, and relations in clinical text</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2011</year>
          <volume>18</volume>
          <issue>5</issue>
          <fpage>552</fpage>
          <lpage>6</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/21685143"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/amiajnl-2011-000203</pub-id>
          <pub-id pub-id-type="medline">21685143</pub-id>
          <pub-id pub-id-type="pii">amiajnl-2011-000203</pub-id>
          <pub-id pub-id-type="pmcid">PMC3168320</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Roberts</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Demner-Fushman</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Tonning</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>Overview of the TAC 2017 Adverse Reaction Extraction from Drug Labels Track</article-title>
          <source>Semantic Scholar</source>
          <year>2017</year>
          <access-date>2020-06-22</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://pdfs.semanticscholar.org/5b8a/7b11b987ddeb865dbf3aaa7b745a86ea5bf0.pdf">https://pdfs.semanticscholar.org/5b8a/7b11b987ddeb865dbf3aaa7b745a86ea5bf0.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Sciaky</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Leaman</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Davis</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mattingly</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wiegers</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>BioCreative V CDR task corpus: a resource for chemical disease relation extraction</article-title>
          <source>Database (Oxford)</source>
          <year>2016</year>
          <volume>2016</volume>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://academic.oup.com/database/article-lookup/doi/10.1093/database/baw068"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/database/baw068</pub-id>
          <pub-id pub-id-type="medline">27161011</pub-id>
          <pub-id pub-id-type="pii">baw068</pub-id>
          <pub-id pub-id-type="pmcid">PMC4860626</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jagannatha</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Overview of the first natural language processing challenge for extracting medication, indication, and adverse drug events from electronic health record notes (MADE 1.0)</article-title>
          <source>Drug Saf</source>
          <year>2019</year>
          <month>01</month>
          <volume>42</volume>
          <issue>1</issue>
          <fpage>99</fpage>
          <lpage>111</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30649735"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s40264-018-0762-z</pub-id>
          <pub-id pub-id-type="medline">30649735</pub-id>
          <pub-id pub-id-type="pii">10.1007/s40264-018-0762-z</pub-id>
          <pub-id pub-id-type="pmcid">PMC6860017</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Henry</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Buchan</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Filannino</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Stubbs</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Uzuner</surname>
              <given-names>O</given-names>
            </name>
          </person-group>
          <article-title>2018 n2c2 shared task on adverse drug events and medication extraction in electronic health records</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2020</year>
          <month>01</month>
          <day>1</day>
          <volume>27</volume>
          <issue>1</issue>
          <fpage>3</fpage>
          <lpage>12</lpage>
          <pub-id pub-id-type="doi">10.1093/jamia/ocz166</pub-id>
          <pub-id pub-id-type="pii">5581277</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>HJ</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>CD-REST: a system for extracting chemical-induced disease relation in literature</article-title>
          <source>Database (Oxford)</source>
          <year>2016</year>
          <volume>2016</volume>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://academic.oup.com/database/article-lookup/doi/10.1093/database/baw036"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/database/baw036</pub-id>
          <pub-id pub-id-type="medline">27016700</pub-id>
          <pub-id pub-id-type="pii">baw036</pub-id>
          <pub-id pub-id-type="pmcid">PMC4808251</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Finkel</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dingare</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Manning</surname>
              <given-names>CD</given-names>
            </name>
            <name name-style="western">
              <surname>Nissim</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Alex</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Grover</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Exploring the boundaries: gene and protein identification in biomedical text</article-title>
          <source>BMC Bioinformatics</source>
          <year>2005</year>
          <volume>6</volume>
          <issue>Suppl 1</issue>
          <fpage>S5</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcbioinformatics.biomedcentral.com/articles/10.1186/1471-2105-6-S1-S5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1471-2105-6-S1-S5</pub-id>
          <pub-id pub-id-type="medline">15960839</pub-id>
          <pub-id pub-id-type="pii">1471-2105-6-S1-S5</pub-id>
          <pub-id pub-id-type="pmcid">PMC1869019</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Leaman</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Davis</surname>
              <given-names>AP</given-names>
            </name>
            <name name-style="western">
              <surname>Mattingly</surname>
              <given-names>CJ</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wiegers</surname>
              <given-names>TC</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Assessing the state of the art in biomedical relation extraction: overview of the BioCreative V chemical-disease relation (CDR) task</article-title>
          <source>Database (Oxford)</source>
          <year>2016</year>
          <volume>2016</volume>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://academic.oup.com/database/article-lookup/doi/10.1093/database/baw032"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/database/baw032</pub-id>
          <pub-id pub-id-type="medline">26994911</pub-id>
          <pub-id pub-id-type="pii">baw032</pub-id>
          <pub-id pub-id-type="pmcid">PMC4799720</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gurulingappa</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Rajput</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Roberts</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Fluck</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hofmann-Apitius</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Toldo</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Development of a benchmark corpus to support the automatic extraction of drug-related adverse effects from medical case reports</article-title>
          <source>J Biomed Inform</source>
          <year>2012</year>
          <month>10</month>
          <volume>45</volume>
          <issue>5</issue>
          <fpage>885</fpage>
          <lpage>92</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(12)00061-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2012.04.008</pub-id>
          <pub-id pub-id-type="medline">22554702</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(12)00061-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sutton</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>An introduction to conditional random fields</article-title>
          <source>FNT in Mach Learn</source>
          <year>2012</year>
          <volume>4</volume>
          <issue>4</issue>
          <fpage>267</fpage>
          <lpage>373</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.nowpublishers.com/article/Details/MAL-013"/>
          </comment>
          <pub-id pub-id-type="doi">10.1561/2200000013</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Andrew</surname>
              <given-names>AM</given-names>
            </name>
          </person-group>
          <article-title>An introduction to support vector machines and other kernel‐based learning methods</article-title>
          <source>Kybernetes</source>
          <year>2001</year>
          <month>02</month>
          <volume>30</volume>
          <issue>1</issue>
          <fpage>103</fpage>
          <lpage>15</lpage>
          <pub-id pub-id-type="doi">10.1108/k.2001.30.1.103.6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dandala</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Joopudi</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Devarakonda</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Adverse drug events detection in clinical notes by jointly modeling entities and relations using neural networks</article-title>
          <source>Drug Saf</source>
          <year>2019</year>
          <month>01</month>
          <volume>42</volume>
          <issue>1</issue>
          <fpage>135</fpage>
          <lpage>46</lpage>
          <pub-id pub-id-type="doi">10.1007/s40264-018-0764-x</pub-id>
          <pub-id pub-id-type="medline">30649738</pub-id>
          <pub-id pub-id-type="pii">10.1007/s40264-018-0764-x</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Ji</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Du</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Xiang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Tiryaki</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Tao</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>A study of deep learning approaches for medication and adverse drug event extraction from clinical text</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2020</year>
          <month>01</month>
          <day>1</day>
          <volume>27</volume>
          <issue>1</issue>
          <fpage>13</fpage>
          <lpage>21</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/31135882"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocz063</pub-id>
          <pub-id pub-id-type="medline">31135882</pub-id>
          <pub-id pub-id-type="pii">5499225</pub-id>
          <pub-id pub-id-type="pmcid">PMC6913210</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Extraction of information related to adverse drug events from electronic health record notes: design of an end-to-end model based on deep learning</article-title>
          <source>JMIR Med Inform</source>
          <year>2018</year>
          <month>11</month>
          <day>26</day>
          <volume>6</volume>
          <issue>4</issue>
          <fpage>e12159</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2018/4/e12159/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/12159</pub-id>
          <pub-id pub-id-type="medline">30478023</pub-id>
          <pub-id pub-id-type="pii">v6i4e12159</pub-id>
          <pub-id pub-id-type="pmcid">PMC6288593</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ju</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Nguyen</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Miwa</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ananiadou</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>An ensemble of neural models for nested adverse drug events and medication extraction with subwords</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2020</year>
          <month>01</month>
          <day>1</day>
          <volume>27</volume>
          <issue>1</issue>
          <fpage>22</fpage>
          <lpage>30</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/31197355"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocz075</pub-id>
          <pub-id pub-id-type="medline">31197355</pub-id>
          <pub-id pub-id-type="pii">5518594</pub-id>
          <pub-id pub-id-type="pmcid">PMC6913208</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dai</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Su</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Adverse drug event and medication extraction in electronic health records via a cascading architecture with different sequence labeling models and word embeddings</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2020</year>
          <month>01</month>
          <day>1</day>
          <volume>27</volume>
          <issue>1</issue>
          <fpage>47</fpage>
          <lpage>55</lpage>
          <pub-id pub-id-type="doi">10.1093/jamia/ocz120</pub-id>
          <pub-id pub-id-type="medline">31334805</pub-id>
          <pub-id pub-id-type="pii">5537181</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wunnava</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Qin</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Kakar</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Sen</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Rundensteiner</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Kong</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>Adverse drug event detection from electronic health records using hierarchical recurrent neural networks with dual-level embedding</article-title>
          <source>Drug Saf</source>
          <year>2019</year>
          <month>01</month>
          <volume>42</volume>
          <issue>1</issue>
          <fpage>113</fpage>
          <lpage>22</lpage>
          <pub-id pub-id-type="doi">10.1007/s40264-018-0765-9</pub-id>
          <pub-id pub-id-type="medline">30649736</pub-id>
          <pub-id pub-id-type="pii">10.1007/s40264-018-0765-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chapman</surname>
              <given-names>AB</given-names>
            </name>
            <name name-style="western">
              <surname>Peterson</surname>
              <given-names>KS</given-names>
            </name>
            <name name-style="western">
              <surname>Alba</surname>
              <given-names>PR</given-names>
            </name>
            <name name-style="western">
              <surname>DuVall</surname>
              <given-names>SL</given-names>
            </name>
            <name name-style="western">
              <surname>Patterson</surname>
              <given-names>OV</given-names>
            </name>
          </person-group>
          <article-title>Detecting adverse drug events with rapidly trained classification models</article-title>
          <source>Drug Saf</source>
          <year>2019</year>
          <month>01</month>
          <volume>42</volume>
          <issue>1</issue>
          <fpage>147</fpage>
          <lpage>56</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30649737"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s40264-018-0763-y</pub-id>
          <pub-id pub-id-type="medline">30649737</pub-id>
          <pub-id pub-id-type="pii">10.1007/s40264-018-0763-y</pub-id>
          <pub-id pub-id-type="pmcid">PMC6373386</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Bian</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Fang</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Bjarnadottir</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Hogan</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Identifying relations of medications with adverse drug events using recurrent convolutional neural networks and gradient boosting</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2020</year>
          <month>01</month>
          <day>1</day>
          <volume>27</volume>
          <issue>1</issue>
          <fpage>65</fpage>
          <lpage>72</lpage>
          <pub-id pub-id-type="doi">10.1093/jamia/ocz144</pub-id>
          <pub-id pub-id-type="medline">31504605</pub-id>
          <pub-id pub-id-type="pii">5555856</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chalapathy</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Borzeshi</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Piccardi</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Bidirectional LSTM-CRF for Clinical Concept Extraction</article-title>
          <source>arXiv</source>
          <year>2016</year>
          <comment>epub ahead of print(1611.08373)<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1611.08373"/></comment>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Jernite</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Sontag</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Rush</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Character-Aware Neural Language Models</article-title>
          <source>Proceedings of the Thirtieth AAAI Conference on Artificial Intelligence</source>
          <year>2016</year>
          <conf-name>AAAI'16</conf-name>
          <conf-date>February 12-17, 2016</conf-date>
          <conf-loc>Phoenix, Arizona, USA</conf-loc>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.aaai.org/ocs/index.php/AAAI/AAAI16/paper/viewFile/12489/12017"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Fu</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Ji</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>A neural joint model for entity and relation extraction from biomedical text</article-title>
          <source>BMC Bioinformatics</source>
          <year>2017</year>
          <month>03</month>
          <day>31</day>
          <volume>18</volume>
          <issue>1</issue>
          <fpage>198</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcbioinformatics.biomedcentral.com/articles/10.1186/s12859-017-1609-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12859-017-1609-9</pub-id>
          <pub-id pub-id-type="medline">28359255</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12859-017-1609-9</pub-id>
          <pub-id pub-id-type="pmcid">PMC5374588</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Caruana</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Multitask learning</article-title>
          <source>Mach Learn</source>
          <year>1997</year>
          <volume>28</volume>
          <issue>1</issue>
          <fpage>41</fpage>
          <lpage>75</lpage>
          <pub-id pub-id-type="doi">10.1007/978-1-4615-5529-2_5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bahdanau</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Cho</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Bengio</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Neural Machine Translation by Jointly Learning to Align and Translate</article-title>
          <source>Proceedings of the 3rd International Conference for Learning Representations</source>
          <year>2015</year>
          <conf-name>ICLR'15</conf-name>
          <conf-date>May 7-9, 2015</conf-date>
          <conf-loc>San Diego, CA, USA</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vaswani</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Shazeer</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Parmar</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Uszkoreit</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Gomez</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kaiser</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Polosukhin</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Attention is all you need</article-title>
          <source>Adv Neural Inf Process Syst</source>
          <year>2017</year>
          <fpage>5998</fpage>
          <lpage>6008</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1706.03762"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Gated Self-Matching Networks for Reading Comprehension and Question Answering</article-title>
          <source>Proceedings of the 55th Annual Meeting of the Association for Computational Linguistics</source>
          <year>2017</year>
          <conf-name>ACL'17</conf-name>
          <conf-date>July 30-August 4, 2017</conf-date>
          <conf-loc>Vancouver, Canada</conf-loc>
          <pub-id pub-id-type="doi">10.18653/v1/p17-1018</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Shi</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Tian</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Qi</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Hao</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Attention-based bidirectional long short-term memory networks for relation classification</article-title>
          <source>54th Annu Meet Assoc Comput Linguist ACL</source>
          <year>2016</year>
          <volume>2</volume>
          <fpage>207</fpage>
          <lpage>12</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.aclweb.org/anthology/P16-2034.pdf"/>
          </comment>
          <pub-id pub-id-type="doi">10.18653/v1/p16-2034</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhong</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Angeli</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Manning</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Position-Aware Attention and Supervised Data Improve Slot Filling</article-title>
          <source>Proceedings of the 2017 Conference on Empirical Methods in Natural Language Processing</source>
          <year>2017</year>
          <conf-name>EMNLP'17</conf-name>
          <conf-date>September 7-11, 2017</conf-date>
          <conf-loc>Copenhagen, Denmark</conf-loc>
          <pub-id pub-id-type="doi">10.18653/v1/d17-1004</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dai</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Xiao</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Lyu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Dou</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>She</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Joint Extraction of Entities and Overlapping Relations Using Position-Attentive Sequence Labeling</article-title>
          <source>Proceedings of the AAAI Conference on Artificial Intelligence</source>
          <year>2019</year>
          <conf-name>Proc AAAI Conf Artif Intell ;33</conf-name>
          <conf-date>January 27-February 1, 2019</conf-date>
          <conf-loc>Honolulu, Hawaii, USA</conf-loc>
          <pub-id pub-id-type="doi">10.1609/aaai.v33i01.33016300</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Christopoulou</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Tran</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Sahu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Miwa</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ananiadou</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Adverse drug events and medication relation extraction in electronic health records with ensemble deep learning methods</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2020</year>
          <month>01</month>
          <day>1</day>
          <volume>27</volume>
          <issue>1</issue>
          <fpage>39</fpage>
          <lpage>46</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/31390003"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocz101</pub-id>
          <pub-id pub-id-type="medline">31390003</pub-id>
          <pub-id pub-id-type="pii">5544735</pub-id>
          <pub-id pub-id-type="pmcid">PMC6913215</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Lang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Ning</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Du</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Knowledge-guided convolutional networks for chemical-disease relation extraction</article-title>
          <source>BMC Bioinformatics</source>
          <year>2019</year>
          <month>05</month>
          <day>21</day>
          <volume>20</volume>
          <issue>1</issue>
          <fpage>260</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcbioinformatics.biomedcentral.com/articles/10.1186/s12859-019-2873-7"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12859-019-2873-7</pub-id>
          <pub-id pub-id-type="medline">31113357</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12859-019-2873-7</pub-id>
          <pub-id pub-id-type="pmcid">PMC6528333</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ding</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Si</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>A Neural Multi-digraph Model for Chinese NER with Gazetteers</article-title>
          <source>Proceedings of the 57th Annual Meeting of the Association for Computational Linguistics</source>
          <year>2019</year>
          <conf-name>ACL'19</conf-name>
          <conf-date>July 28-August 2, 2019</conf-date>
          <conf-loc>Florence, Italy</conf-loc>
          <pub-id pub-id-type="doi">10.18653/v1/P19-1141</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Deng</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Du</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Fan</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Lei</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Knowledge-Aware Attentive Neural Network for Ranking Question Answer Pairs</article-title>
          <source>The 41st International ACM SIGIR Conference on Research &#38; Development in Information Retrieval</source>
          <year>2018</year>
          <conf-name>SIGIR'18</conf-name>
          <conf-date>July 8-12, 2018</conf-date>
          <conf-loc>Ann Arbor, Michigan</conf-loc>
          <pub-id pub-id-type="doi">10.1145/3209978.3210081</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref59">
        <label>59</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Mao</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Q</given-names>
            </name>
          </person-group>
          <article-title>Improving Relation Extraction with Knowledge-Attention</article-title>
          <source>Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing and the 9th International Joint Conference on Natural Language Processing</source>
          <year>2019</year>
          <conf-name>EMNLP-IJCNLP'19</conf-name>
          <conf-date>November 3-7, 2019</conf-date>
          <conf-loc>Hong Kong, China</conf-loc>
          <pub-id pub-id-type="doi">10.18653/v1/D19-1022</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref60">
        <label>60</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bordes</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Usunier</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Garcia-Durán</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Weston</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Yakhnenko</surname>
              <given-names>O</given-names>
            </name>
          </person-group>
          <article-title>Translating Embeddings for Modeling Multi-Relational Data</article-title>
          <source>Proceedings of the 26th International Conference on Neural Information Processing Systems</source>
          <year>2013</year>
          <conf-name>NIPS'13</conf-name>
          <conf-date>December 5-10, 2013</conf-date>
          <conf-loc>Lake Tahoe, USA</conf-loc>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://papers.nips.cc/paper/5071-translating-embeddings-for-modeling-multi-relational-data"/>
          </comment>
          <pub-id pub-id-type="doi">10.5555/2999792.2999923</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref61">
        <label>61</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Feng</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Knowledge Graph Embedding by Translating on Hyperplanes</article-title>
          <source>Proceedings of the Twenty-Eighth AAAI Conference on Artificial Intelligence</source>
          <year>2014</year>
          <conf-name>AAAI'14</conf-name>
          <conf-date>July 27-31, 2014</conf-date>
          <conf-loc>Québec City, Québec, Canada</conf-loc>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://persagen.com/files/misc/wang2014knowledge.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref62">
        <label>62</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>Learning Entity and Relation Embeddings for Knowledge Graph Completion</article-title>
          <source>Proceedings of the Twenty-Ninth AAAI Conference on Artificial Intelligence</source>
          <year>2015</year>
          <conf-name>AAAI'15</conf-name>
          <conf-date>January 25-30, 2015</conf-date>
          <conf-loc>Austin, Texas, USA</conf-loc>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.aaai.org/ocs/index.php/AAAI/AAAI15/paper/viewFile/9571/9523"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref63">
        <label>63</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Perozzi</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Al-Rfou</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Skiena</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>DeepWalk: Online Learning of Social Representations</article-title>
          <source>Proceedings of the 20th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining</source>
          <year>2014</year>
          <conf-name>KDD'14</conf-name>
          <conf-date>August 24-27, 2014</conf-date>
          <conf-loc>New York, USA</conf-loc>
          <pub-id pub-id-type="doi">10.1145/2623330.2623732</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref64">
        <label>64</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Grover</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Leskovec</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>node2vec: Scalable Feature Learning for Networks</article-title>
          <source>Proceedings of the 22nd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining</source>
          <year>2016</year>
          <conf-name>KDD'18</conf-name>
          <conf-date>August 13-17, 2016</conf-date>
          <conf-loc>San Francisco, USA</conf-loc>
          <pub-id pub-id-type="doi">10.1145/2939672.2939754</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref65">
        <label>65</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Qu</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Yan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Mei</surname>
              <given-names>Q</given-names>
            </name>
          </person-group>
          <article-title>LINE: Large-Scale Information Network Embedding</article-title>
          <source>Proceedings of the 24th International Conference on World Wide Web</source>
          <year>2015</year>
          <conf-name>WWW'15</conf-name>
          <conf-date>May 18-22, 2015</conf-date>
          <conf-loc>Florence, Italy</conf-loc>
          <pub-id pub-id-type="doi">10.1145/2736277.2741093</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref66">
        <label>66</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>BiNE: Bipartite Network Embedding</article-title>
          <source>The 41st International ACM SIGIR Conference on Research &#38; Development in Information Retrieval</source>
          <year>2018</year>
          <conf-name>SIGIR'18</conf-name>
          <conf-date>July 8-12, 2018</conf-date>
          <conf-loc>Ann Arbor, Michigan</conf-loc>
          <pub-id pub-id-type="doi">10.1145/3209978.3209987</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref67">
        <label>67</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Gu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Ji</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Extracting medications and associated adverse drug events using a natural language processing system combining knowledge base and deep learning</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2020</year>
          <month>01</month>
          <day>1</day>
          <volume>27</volume>
          <issue>1</issue>
          <fpage>56</fpage>
          <lpage>64</lpage>
          <pub-id pub-id-type="doi">10.1093/jamia/ocz141</pub-id>
          <pub-id pub-id-type="medline">31591641</pub-id>
          <pub-id pub-id-type="pii">5582687</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref68">
        <label>68</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Loper</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Bird</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <source>NLTK: The Natural Language Toolkit</source>
          <year>2002</year>
          <access-date>2020-06-22</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.nltk.org/">https://www.nltk.org/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref69">
        <label>69</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Honnibal</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Montani</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>spaCy v2</article-title>
          <source>GitHub</source>
          <year>2017</year>
          <access-date>2020-06-22</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/explosion/spaCy/issues/1555">https://github.com/explosion/spaCy/issues/1555</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref70">
        <label>70</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Manning</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Surdeanu</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bauer</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Finkel</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bethard</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>McClosky</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>The Stanford coreNLP natural language processing toolkit</article-title>
          <source>Assoc Comput Linguist Syst Demonstr</source>
          <year>2014</year>
          <fpage>60</fpage>
          <pub-id pub-id-type="doi">10.3115/v1/p14-5010</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref71">
        <label>71</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Leaman</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Khare</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Challenges in clinical natural language processing for automated disorder normalization</article-title>
          <source>J Biomed Inform</source>
          <year>2015</year>
          <month>10</month>
          <volume>57</volume>
          <fpage>28</fpage>
          <lpage>37</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(15)00150-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2015.07.010</pub-id>
          <pub-id pub-id-type="medline">26187250</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(15)00150-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC4713367</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref72">
        <label>72</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mikolov</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Sutskever</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Corrado</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Dean</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Distributed Representations of Words and Phrases and their Compositionality</article-title>
          <source>NIPS Proceedings</source>
          <year>2013</year>
          <access-date>2020-06-22</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://papers.nips.cc/paper/5021-distributed-representations-of-words-and-phrases-and-their-compositionality.pdf">https://papers.nips.cc/paper/5021-distributed-representations-of-words-and-phrases-and-their-compositionality.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref73">
        <label>73</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pennington</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Socher</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Manning</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>GloVe: Global Vectors for Word Representation</article-title>
          <source>Proceedings of the 2014 Conference on Empirical Methods in Natural Language Processing</source>
          <year>2014</year>
          <conf-name>EMNLP'14</conf-name>
          <conf-date>October 25-29, 2014</conf-date>
          <conf-loc>Doha, Qatar</conf-loc>
          <pub-id pub-id-type="doi">10.3115/v1/d14-1162</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref74">
        <label>74</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Joulin</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Grave</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Bojanowski</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Mikolov</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Bag of Tricks for Efficient Text Classification</article-title>
          <source>Proceedings of the 15th Conference of the European Chapter of the Association for Computational Linguistics</source>
          <year>2017</year>
          <conf-name>EACL'17</conf-name>
          <conf-date>April 3-7, 2017</conf-date>
          <conf-loc>Valencia, Spain</conf-loc>
          <pub-id pub-id-type="doi">10.18653/v1/e17-2068</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref75">
        <label>75</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dai</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Karimi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hachey</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Paris</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Using Similarity Measures to Select Pretraining Data for NER</article-title>
          <source>Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies</source>
          <year>2019</year>
          <conf-name>NAACL'19</conf-name>
          <conf-date>July 5-10, 2019</conf-date>
          <conf-loc>Minneapolis, Minnesota</conf-loc>
          <fpage>1460</fpage>
          <lpage>70</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.aclweb.org/anthology/N19-1149/"/>
          </comment>
          <pub-id pub-id-type="doi">10.18653/v1/N19-1149</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref76">
        <label>76</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>AE</given-names>
            </name>
            <name name-style="western">
              <surname>Pollard</surname>
              <given-names>TJ</given-names>
            </name>
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Lehman</surname>
              <given-names>LH</given-names>
            </name>
            <name name-style="western">
              <surname>Feng</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ghassemi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Moody</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Szolovits</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Celi</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Mark</surname>
              <given-names>RG</given-names>
            </name>
          </person-group>
          <article-title>MIMIC-III, a freely accessible critical care database</article-title>
          <source>Sci Data</source>
          <year>2016</year>
          <month>05</month>
          <day>24</day>
          <volume>3</volume>
          <fpage>160035</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/27219127"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/sdata.2016.35</pub-id>
          <pub-id pub-id-type="medline">27219127</pub-id>
          <pub-id pub-id-type="pii">sdata201635</pub-id>
          <pub-id pub-id-type="pmcid">PMC4878278</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref77">
        <label>77</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Peters</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Neumann</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Iyyer</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gardner</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Clark</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Zettlemoyer</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Deep Contextualized Word Representations</article-title>
          <source>Proceedings of the 2018 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies</source>
          <year>2018</year>
          <conf-name>MAACL'18</conf-name>
          <conf-date>June 1-6, 2018</conf-date>
          <conf-loc>New Orleans, Louisiana</conf-loc>
          <pub-id pub-id-type="doi">10.18653/v1/n18-1202</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref78">
        <label>78</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Devlin</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Toutanova</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>BERT: Pre-Training of Deep Bidirectional Transformers for Language Understanding</article-title>
          <source>Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies</source>
          <year>2019</year>
          <conf-name>NAACL'19</conf-name>
          <conf-date>June 2-7, 2019</conf-date>
          <conf-loc>Minneapolis, Minnesota</conf-loc>
          <pub-id pub-id-type="doi">10.18653/v1/N19-1423</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref79">
        <label>79</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Si</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Roberts</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Enhancing clinical concept extraction with contextual embeddings</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2019</year>
          <month>11</month>
          <day>1</day>
          <volume>26</volume>
          <issue>11</issue>
          <fpage>1297</fpage>
          <lpage>304</lpage>
          <pub-id pub-id-type="doi">10.1093/jamia/ocz096</pub-id>
          <pub-id pub-id-type="medline">31265066</pub-id>
          <pub-id pub-id-type="pii">5527248</pub-id>
          <pub-id pub-id-type="pmcid">PMC6798561</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref80">
        <label>80</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bodenreider</surname>
              <given-names>O</given-names>
            </name>
          </person-group>
          <article-title>The unified medical language system (UMLS): integrating biomedical terminology</article-title>
          <source>Nucleic Acids Res</source>
          <year>2004</year>
          <month>01</month>
          <day>1</day>
          <volume>32</volume>
          <issue>Database issue</issue>
          <fpage>D267</fpage>
          <lpage>70</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/14681409"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/nar/gkh061</pub-id>
          <pub-id pub-id-type="medline">14681409</pub-id>
          <pub-id pub-id-type="pii">32/suppl_1/D267</pub-id>
          <pub-id pub-id-type="pmcid">PMC308795</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref81">
        <label>81</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Bidirectional LSTM-CRF models for sequence tagging</article-title>
          <source>arXiv</source>
          <year>2015</year>
          <comment>epub ahead of print(1508.01991)<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1508.01991"/></comment>
        </nlm-citation>
      </ref>
      <ref id="ref82">
        <label>82</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zeng</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Lai</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Relation Classification via Convolutional Deep Neural Network</article-title>
          <source>Proceedings of COLING 2014, the 25th International Conference on Computational Linguistics: Technical Papers</source>
          <year>2014</year>
          <conf-name>COLING'14</conf-name>
          <conf-date>August 23-29, 2014</conf-date>
          <conf-loc>Dublin, Ireland</conf-loc>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.aclweb.org/anthology/C14-1220/"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref83">
        <label>83</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Edgington</surname>
              <given-names>ES</given-names>
            </name>
          </person-group>
          <article-title>Approximate randomization tests</article-title>
          <source>J Psychol Interdiscip Appl</source>
          <year>1969</year>
          <month>07</month>
          <volume>72</volume>
          <issue>2</issue>
          <fpage>143</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1080/00223980.1969.10543491</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref84">
        <label>84</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Goyal</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Hosseinmardi</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Ferrara</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Galstyan</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Capturing edge attributes via network embedding</article-title>
          <source>IEEE Trans Comput Soc Syst</source>
          <year>2018</year>
          <month>12</month>
          <volume>5</volume>
          <issue>4</issue>
          <fpage>907</fpage>
          <lpage>17</lpage>
          <pub-id pub-id-type="doi">10.1109/tcss.2018.2877083</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref85">
        <label>85</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Yoon</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>So</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Kang</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>BioBERT: a pre-trained biomedical language representation model for biomedical text mining</article-title>
          <source>Bioinformatics</source>
          <year>2020</year>
          <month>02</month>
          <day>15</day>
          <volume>36</volume>
          <issue>4</issue>
          <fpage>1234</fpage>
          <lpage>40</lpage>
          <pub-id pub-id-type="doi">10.1093/bioinformatics/btz682</pub-id>
          <pub-id pub-id-type="medline">31501885</pub-id>
          <pub-id pub-id-type="pii">5566506</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref86">
        <label>86</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Joopudi</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Dandala</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Devarakonda</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>A convolutional route to abbreviation disambiguation in clinical text</article-title>
          <source>J Biomed Inform</source>
          <year>2018</year>
          <month>10</month>
          <volume>86</volume>
          <fpage>71</fpage>
          <lpage>8</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(18)30155-2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2018.07.025</pub-id>
          <pub-id pub-id-type="medline">30118854</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(18)30155-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref87">
        <label>87</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Poon</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Quirk</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Toutanova</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Yih</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Cross-sentence n-ary relation extraction with graph LSTMs</article-title>
          <source>Transact Assoc Comput Ling</source>
          <year>2017</year>
          <volume>-</volume>
          <fpage>101</fpage>
          <lpage>15</lpage>
          <pub-id pub-id-type="doi">10.1162/tacl_a_00049</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
