<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id>
      <journal-title>JMIR Medical Informatics</journal-title>
      <issn pub-type="epub">2291-9694</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v8i4e18323</article-id>
      <article-id pub-id-type="pmid">32343247</article-id>
      <article-id pub-id-type="doi">10.2196/18323</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>A Knowledge Graph of Combined Drug Therapies Using Semantic Predications From Biomedical Literature: Algorithm Development</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Eysenbach</surname>
            <given-names>Gunther</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Xing</surname>
            <given-names>Zhaopeng</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Su</surname>
            <given-names>Wu-Chen</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Du</surname>
            <given-names>Jian</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-7621-9995</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" corresp="yes" equal-contrib="yes">
          <name name-style="western">
            <surname>Li</surname>
            <given-names>Xiaoying</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <address>
            <institution>Institute of Medical Information</institution>
            <institution>Chinese Academy of Medical Sciences</institution>
            <addr-line>No 69, Dongdan North Street</addr-line>
            <addr-line>Dongcheng District</addr-line>
            <addr-line>Beijing, 100005</addr-line>
            <country>China</country>
            <phone>86 10 52328792</phone>
            <email>lixiaoying@imicams.ac.cn</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-4407-6616</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>National Institute of Health Data Science</institution>
        <institution>Peking University</institution>
        <addr-line>Beijing</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Institute of Medical Information</institution>
        <institution>Chinese Academy of Medical Sciences</institution>
        <addr-line>Beijing</addr-line>
        <country>China</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Xiaoying Li <email>lixiaoying@imicams.ac.cn</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>4</month>
        <year>2020</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>28</day>
        <month>4</month>
        <year>2020</year>
      </pub-date>
      <volume>8</volume>
      <issue>4</issue>
      <elocation-id>e18323</elocation-id>
      <history>
        <date date-type="received">
          <day>21</day>
          <month>2</month>
          <year>2020</year>
        </date>
        <date date-type="rev-request">
          <day>20</day>
          <month>3</month>
          <year>2020</year>
        </date>
        <date date-type="rev-recd">
          <day>26</day>
          <month>3</month>
          <year>2020</year>
        </date>
        <date date-type="accepted">
          <day>29</day>
          <month>3</month>
          <year>2020</year>
        </date>
      </history>
      <copyright-statement>©Jian Du, Xiaoying Li. Originally published in JMIR Medical Informatics (http://medinform.jmir.org), 28.04.2020.</copyright-statement>
      <copyright-year>2020</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on http://medinform.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="http://medinform.jmir.org/2020/4/e18323/" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Combination therapy plays an important role in the effective treatment of malignant neoplasms and precision medicine. Numerous clinical studies have been carried out to investigate combination drug therapies. Automated knowledge discovery of these combinations and their graphic representation in knowledge graphs will enable pattern recognition and identification of drug combinations used to treat a specific type of cancer, improve drug efficacy and treatment of human disorders.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This paper aims to develop an automated, visual approach to discover knowledge about combination therapies from biomedical literature, especially from those studies with high-level evidence such as clinical trial reports and clinical practice guidelines.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>Based on semantic predications, which consist of a triple structure of subject-predicate-object (SPO), we proposed an automated algorithm to discover knowledge of combination drug therapies using the following rules: 1) two or more semantic predications (S<sub>1</sub>-P-O and S<sub>i</sub>-P-O, i = 2, 3…) can be extracted from one conclusive claim (sentence) in the abstract of a given publication, and 2) these predications have an identical predicate (that closely relates to human disease treatment, eg, “treat”) and object (eg, disease name) but different subjects (eg, drug names). A customized knowledge graph organizes and visualizes these combinations, improving the traditional semantic triples. After automatic filtering of broad concepts such as “pharmacologic actions” and generic disease names, a set of combination drug therapies were identified and characterized through manual interpretation.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>We retrieved 22,263 clinical trial reports and 31 clinical practice guidelines from PubMed abstracts by searching “antineoplastic agents” for drug restriction (published between Jan 2009 and Oct 2019). There were 15,603 conclusive claims locally parsed using the search terms “conclusion*” and “conclude*” ready for semantic predications extraction by SemRep, and 325 candidate groups of semantic predications about combined medications were automatically discovered within 316 conclusive claims. Based on manual analysis, we determined that 255/316 claims (78.46%) were accurately identified as describing combination therapies and adopted these to construct the customized knowledge graph. We also identified two categories (and 4 subcategories) to characterize the inaccurate results: limitations of SemRep and limitations of proposal. We further learned the predominant patterns of drug combinations based on mechanism of action for new combined medication studies and discovered 4 obvious markers (“combin*,” “coadministration,” “co-administered,” and “regimen”) to identify potential combination therapies to enable development of a machine learning algorithm.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Semantic predications from conclusive claims in the biomedical literature can be used to support automated knowledge discovery and knowledge graph construction for combination therapies. A machine learning approach is warranted to take full advantage of the identified markers and other contextual features.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>combined drug therapy</kwd>
        <kwd>knowledge graph</kwd>
        <kwd>knowledge discovery</kwd>
        <kwd>semantic predications</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>Combination drug therapy is a therapeutic intervention in which multiple drugs are administered, particularly in patients with malignant neoplasms [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>]. Compared with single-agent therapy, the synergistic interaction of combined medications significantly improves drug efficacy, shortens disease course, delays or avoids drug resistance, and reduces both toxicity and other side effects without loss of efficacy. The combination of several existing drugs with compatible mechanisms of action has been reported as an alternative approach to advance the success of drug repositioning [<xref ref-type="bibr" rid="ref3">3</xref>]. The characteristics of combination therapies make them a practical alternative to standard approaches, with the potential to save billions of dollars on research and development of new drugs, particularly in the absence of effective monotherapies for many types of cancer and other diseases (such as autoimmune and psychiatric conditions), and more than 6700 rare diseases for which no therapies are available [<xref ref-type="bibr" rid="ref3">3</xref>].</p>
        <p>In recent decades, massive efforts have been made to employ combined therapeutic agents to improve treatment of human disorders such as specific cancers [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref4">4</xref>], malignancies such as lymphocytic leukemia [<xref ref-type="bibr" rid="ref1">1</xref>], and hypertension [<xref ref-type="bibr" rid="ref5">5</xref>]. PubMed houses over 175,000 publications found by searching the MeSH (Medical Subject Headings) heading “Drug Therapy, Combination” (Jan 2009 to Oct 2019). We used innovative information retrieval and semantic web technologies to discover knowledge about therapeutic drug combinations, then presented the findings in a visually intuitive knowledge graph. The resulting knowledge graph will not only support machine-understandable information for curing disease and drug efficacy screening, but also provide insights to quickly develop new therapies for untreated diseases.</p>
        <p>In this paper, we propose a systematic, automated approach to discover knowledge about combination drug therapies in the biomedical literature (especially clinical trial reports and clinical practice guidelines with high evidence levels), and integrate the findings into knowledge graphs with customized organization and visualization. This entails the following:</p>
        <list list-type="order">
          <list-item>
            <p>Propose an automated algorithm to discover knowledge about combination drug therapies based on semantic predications extracted from conclusive claims in biomedical literature</p>
          </list-item>
          <list-item>
            <p>Customize a knowledge graph to emphasize the specified drugs being combined rather than traditional triples (eg, one drug TREATS one disease)</p>
          </list-item>
          <list-item>
            <p>Retrieve published clinical trial reports and clinical practice guidelines for algorithm verification and validation, followed by manual identification of accurate knowledge about combination drug therapies, as well as interpretation of inaccurate findings</p>
          </list-item>
          <list-item>
            <p>Characterize the major patterns of combinations according to mechanism of action for new combined medication studies and identify potential markers as key features for machine learning-based drug combination discovery.</p>
          </list-item>
        </list>
        <p>In the following sections, we review related work on knowledge graphs and drug-disease knowledge discovery. We then present our methodology to develop an automated algorithm to discover knowledge about combination drug therapies. A large number of clinical trial reports and clinical practice guidelines were retrieved from PubMed for algorithm verification and validation, followed by manual biocuration to verify accurate results for knowledge graph construction and to interpret inaccurate results. In the discussion we characterize the main patterns of drug combinations according to their mechanisms of action to inform new combination studies and identify markers of potential combined drug therapies to inform machine learning–based algorithm development.</p>
      </sec>
      <sec>
        <title>Related Work</title>
        <sec>
          <title>Knowledge Graph</title>
          <p>A knowledge graph is a network-based representation of the semantic relationship between entities. Its principles have been developed by industry and academia, particularly by the semantic web community. In 1982, Hoede and Stokman used large graphs to represent knowledge extracted from medical and sociology texts [<xref ref-type="bibr" rid="ref6">6</xref>], resulting in an expert system for quick searching and decision support for automated queries. In 2012, Google formally introduced their knowledge graph after compiling over 3.5 billion facts and relationships among 500 million objects, which is essentially a semantic enhancement of the search engine to help search real-world objects quickly and easily. At the end of 2016, Microsoft announced a large graph of concepts harnessed from billions of web pages and search logs for short text understanding, called the Concept Graph. Other frequently mentioned applications are Yahoo Spark, Facebook’s entity graph, Wikidata, Freebase, Baidu’s Knowledge Graph, and Sogou’s Knowledge Cube. Although these products differ in their architecture, operational purpose, and supported technologies, they constitute a family of knowledge graphs and together represent the precursor to a new generation of semantic search and knowledge discovery.</p>
          <p>Many other studies on biomedical knowledge graphs have been performed since 2012, playing an indispensable role in biomedical knowledge services. Remarkable achievements encompass the organization of health information from heterogeneous textual [<xref ref-type="bibr" rid="ref7">7</xref>], disease-symptom association learning from electronic medical records [<xref ref-type="bibr" rid="ref8">8</xref>], presenting relationships between cells and cytokines [<xref ref-type="bibr" rid="ref9">9</xref>], extraction of human disorder biomarkers [<xref ref-type="bibr" rid="ref10">10</xref>], and predicting drug efficacy [<xref ref-type="bibr" rid="ref11">11</xref>]. However, knowledge graphs have not yet been applied to organize and manage biomedical information related to combination drug therapies, especially when such knowledge comes from the direct empirical evidence of clinical research.</p>
        </sec>
        <sec>
          <title>Biomedical Drug-Disease Knowledge Discovery</title>
          <p>Studies on biomedical knowledge discovery mainly focus on the semantic relationships, associations, and interactions between biomedical entities such as diseases, drugs, signs or symptoms, target organ, genes, biomarkers, and targets. One of the most important tasks is to identify the exact relationship between a drug and disease, especially for “treatment.” Many information retrieval techniques and methods have been used to approach this problem based on predefined rules [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>] or natural language processing [<xref ref-type="bibr" rid="ref14">14</xref>-<xref ref-type="bibr" rid="ref19">19</xref>] combined with machining learning [<xref ref-type="bibr" rid="ref17">17</xref>-<xref ref-type="bibr" rid="ref19">19</xref>]. Although predefined rules offer promising precision from biomedical texts, they are insufficient and perform poorly when parsing big data due to the noisy and variable syntactic structures within large-scale scientific texts. In comparison, natural language processing-based algorithms have generally been more successful and relatively flexible by virtue of features that parse context in literature.</p>
          <p>Semantic Knowledge Representation, or SemRep, is a natural language processing tool based on the Unified Medical Language System (UMLS) [<xref ref-type="bibr" rid="ref20">20</xref>]. This high-quality tool for extracted semantic predication has already been utilized for a broad range of applications such as the construction of a biomedical knowledge graph [<xref ref-type="bibr" rid="ref21">21</xref>], identification of apparent contradictions [<xref ref-type="bibr" rid="ref22">22</xref>], labeling for semantic relationships [<xref ref-type="bibr" rid="ref23">23</xref>], and detection of drug-drug interactions [<xref ref-type="bibr" rid="ref24">24</xref>] or drug-gene targets [<xref ref-type="bibr" rid="ref25">25</xref>]. Here, we extend the application scope of SemRep by using semantic predications from conclusive sentences (eg, the conclusion section) of abstracts in biomedical literature, rather than the whole abstract, to automatically discover knowledge about combination drug therapies. The conclusion statement of a paper is the essential knowledge unit that synthesizes the knowledge content of an article and is validated by the experiment reported within the article.</p>
        </sec>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Using Conclusive Sentences in the Abstract of a Publication as Knowledge Claims</title>
        <p>There is a vast amount of published biomedical literature easily available in digital and printed format due to the rapid advance of information technology. For example, the cumulative citations of PubMed resources have exceeded 25 million, expanding with an annual growth of 0.9 million [<xref ref-type="bibr" rid="ref26">26</xref>]. The huge amount of literature encourages the emergence of automated knowledge discovery, which could help scientists keep up with the latest scientific developments and academic achievements.</p>
        <p>Scientific publications can be considered records of knowledge claims on a research question, supported by empirical evidence. These knowledge claims are often succinctly described in the abstract of a publication. The abstract is the most frequently accessed section of a publication and the only section used as source information in indexing databases such as PubMed. In this study, we parsed abstracts from PubMed for conclusive claims identified by the key words “conclusion*” and “conclude*” (<xref ref-type="table" rid="table1">Table 1</xref>) in order to discover knowledge about combination drug therapies.</p>
      </sec>
      <sec>
        <title>Semantic Predication Interpretation Using SemRep</title>
        <p>SemRep is a well-developed semantic knowledge interpreter that retrieves semantic predications (in terms of subject-predicate-object) to extract information from biomedical texts. For example, for the first claim in <xref ref-type="table" rid="table1">Table 1</xref>, SemRep would interpret the 7 semantic predications shown in <xref ref-type="table" rid="table2">Table 2</xref>, and the predications with “INFER” in the predicate was inferred based on two existing predications.</p>
        <p>As a natural language processing driven tool, SemRep takes full advantage of UMLS knowledge sources including the Metathesaurus and Semantic Network. Briefly, the subject and object of semantic predication returned by SemRep are the preferred names of biomedical concepts in the UMLS Metathesaurus, while the predicates were derived from semantic relationships in the UMLS Semantic Network. An evaluation based on sample data with semantic type “Chemicals and Drugs” has allowed SemRep to achieve a promising degree of precision (83%) [<xref ref-type="bibr" rid="ref20">20</xref>], which will contribute to the development of algorithms for automated knowledge discovery for combination drug therapy.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Examples of conclusive claims from PubMed abstracts.</p>
          </caption>
          <table border="1" rules="groups" cellpadding="5" frame="hsides" width="1000" cellspacing="0">
            <col width="200"/>
            <col width="800"/>
            <thead>
              <tr valign="bottom">
                <td>PMID_Ab<sup>a</sup></td>
                <td>Claim</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>19322566.ab.15</td>
                <td><italic>CONCLUSION</italic>: A combination of GTI-2040, capecitabine and oxaliplatin is feasible in patients with advanced solid tumors.</td>
              </tr>
              <tr valign="top">
                <td>28101592.ab.10</td>
                <td>In <italic>conclusion</italic>, FCM regimen allows excellent long-lasting response in previously untreated patients with FL.</td>
              </tr>
              <tr valign="top">
                <td>21198717.ab.10</td>
                <td>WHAT IS NEW AND <italic>CONCLUSION</italic>: The use of novel agents such as thalidomide, bortezomib and lenalidomide for RRMM is highly prevalent in France from the first relapse.</td>
              </tr>
              <tr valign="top">
                <td>23197589.ab.8</td>
                <td>We <italic>conclude</italic> that intraventricular rituximab in combination with MTX is feasible and highly active in the treatment of drug-resistant CNS NHL that is refractory or unresponsive to IV rituximab.</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>PMID_Ab: PubMed reference number, abstract, sentence in which the information appears.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Examples of SemRep semantic predications based on a biomedical claim.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="270"/>
            <col width="0"/>
            <col width="300"/>
            <col width="0"/>
            <col width="400"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Example claim</td>
                <td colspan="2">Predicate</td>
                <td>Object</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="6">
                  <bold>19322566.ab.15 CONCLUSION: A combination of <italic>GTI-2040</italic>, <italic>capecitabine</italic> and <italic>oxaliplatin</italic> is feasible in patients with <italic>advanced solid tumors</italic>.</bold>
                </td>
              </tr>
              <tr valign="top">
                <td rowspan="7">
                  <break/>
                </td>
                <td>Advanced Malignant Solid Neoplasm</td>
                <td colspan="2">PROCESS_OF</td>
                <td colspan="2">Patients</td>
              </tr>
              <tr valign="top">
                <td>GTI2040</td>
                <td colspan="2">TREATS</td>
                <td colspan="2">Patients</td>
              </tr>
              <tr valign="top">
                <td>
                  <italic>GTI2040</italic>
                </td>
                <td colspan="2">
                  <italic>TREATS(INFER)</italic>
                </td>
                <td colspan="2">
                  <italic>Advanced Malignant Solid Neoplasm</italic>
                </td>
              </tr>
              <tr valign="top">
                <td>capecitabine</td>
                <td colspan="2">TREATS</td>
                <td colspan="2">Patients</td>
              </tr>
              <tr valign="top">
                <td>
                  <italic>capecitabine</italic>
                </td>
                <td colspan="2">
                  <italic>TREATS(INFER)</italic>
                </td>
                <td colspan="2">
                  <italic>Advanced Malignant Solid Neoplasm</italic>
                </td>
              </tr>
              <tr valign="top">
                <td>oxaliplatin</td>
                <td colspan="2">TREATS</td>
                <td colspan="2">Patients</td>
              </tr>
              <tr valign="top">
                <td>
                  <italic>oxaliplatin</italic>
                </td>
                <td colspan="2">
                  <italic>TREATS(INFER)</italic>
                </td>
                <td colspan="2">
                  <italic>Advanced Malignant Solid Neoplasm</italic>
                </td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Development of an Algorithm for Discovering Knowledge About Combination Drug Therapy</title>
        <p>The UMLS-based SemRep underpins biomedical knowledge discovery applications with its broad coverage and high-quality extracted semantic predications. SemRep enables interpretation of 30 semantic predicates [<xref ref-type="bibr" rid="ref27">27</xref>], such as “PREVENTS,” “TREATS,” and “INHIBITS.”</p>
        <p>To develop our algorithm to automatically discover knowledge about combination drug therapies, we focused on 4 semantic predicates closely related to disease treatment: “TREATS,” “INHIBITS,” “PREVENTS,” and “DISRUPTS” (also inferences with “INFER” such as “TREATS(INFER)”). We also adopted the UMLS Semantic Types “Chemicals and Drugs,” “Disease or Syndrome,” and their child types to restrict the subject and object of SemRep output to drug and disease.</p>
        <p>Knowledge about combined drug therapy is detected under the hypothesis that (1) two or more semantic predications (S<sub>1</sub>-P-O and S<sub>i</sub>-P-O, i=2, 3...) are extracted from one conclusive claim in the abstract of a given biomedical publication, and (2) they have an identical object (eg, disease) and predicate (eg, treats) but different subjects (eg, drugs). Referring again to the example used in <xref ref-type="table" rid="table2">Table 2</xref>, the method provided straightforward discovery of the combined medication knowledge “GTI2040+capecitabine+oxaliplatin-TREATS-Advanced Malignant Solid Neoplasm.”</p>
        <p>Generally, the algorithm could be expressed by the following formula (<xref ref-type="boxed-text" rid="box1">Textbox 1</xref>):</p>
        <boxed-text id="box1" position="float">
          <title>Algorithm text.</title>
          <p><bold>Algorithm:</bold> Drug combination knowledge discovery</p>
          <p><bold>Input:</bold> Semantic predications S<sub>1</sub>-P-O and S<sub>i</sub>-P-O (i=2, 3...) from one conclusive claim in a biomedical abstract</p>
          <p><bold>Output:</bold> Combined drug therapy knowledge S<sub>1</sub>+S<sub>i</sub>-P-O, where all of the following conditions are satisfied:</p>
          <list list-type="order">
            <list-item>
              <p>P∈{TREATS”,“INHIBITS”,“PREVENTS”,“DISRUPTS”}</p>
            </list-item>
            <list-item>
              <p>S<sub>1</sub>∈Chemicals and Drugs</p>
            </list-item>
            <list-item>
              <p>S<sub>i</sub>∈Chemicals and Drugs, i≥2</p>
            </list-item>
            <list-item>
              <p>O∈Disease</p>
            </list-item>
          </list>
          <p/>
        </boxed-text>
      </sec>
      <sec>
        <title>Automated Filtering to Focus on Specific Drug and Disease Names</title>
        <p>Knowledge about combined drug therapies primarily pertains to specified drugs and diseases; thus, the generic names of these biomedical entities should be filtered out automatically.</p>
      </sec>
      <sec>
        <title>Filtering out Pharmacologic Actions</title>
        <p>In the biomedical domain, the phrase “pharmacologic actions” stands for a broad category of chemical actions and uses that result in the prevention, treatment, cure, or diagnosis of disease. Typical subclasses include “Antineoplastic Agents,” “Lipid Regulating Agents,” and “Anti-Inflammatory Agents”. In the UMLS Metathesaurus, these terms and phrases have been assigned the semantic type “Chemicals and Drugs” and several child types, which would not differ with the specific drug name for our study. To selectively filter out these pharmacologic actions, 497 headings from the MeSH thesaurus were systematically collected based on the tree structure shown in <xref rid="figure1" ref-type="fig">Figure 1</xref> (left).</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Automatic filtering of pharmacologic actions (left) and generic disease names (right).</p>
          </caption>
          <graphic xlink:href="medinform_v8i4e18323_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Filtering out the Generic Names of Diseases</title>
        <p>The top-level names of diseases were automatically filtered by disease (class C in the MeSH tree structure) and its direct hyponyms with tree number from C01 to C26, totaling 27 terms. This filtering was applied because the terms are better regarded as classes of disorders rather than specific diseases (<xref rid="figure1" ref-type="fig">Figure 1</xref> [right]).</p>
      </sec>
      <sec>
        <title>The Construction and Visualization of Knowledge Graph About Combined Drug Therapy</title>
        <p>The knowledge graph is an evolving technology widely used for massive knowledge organization and presentation in the era of big data and artificial intelligence due to its ability to mine machine-understandable knowledge and information. In terms of data structure and storage, knowledge graphs store knowledge in the form of subject-predicate-object (usually called a semantic triple). Traditionally, to visualize a domain knowledge graph, the subjects and objects of triples are intuitively displayed as nodes in a graph, with the predicates presented as various edges linked to subjects and objects accordingly.</p>
        <p>In this paper, to emphasize the combined drugs, knowledge about combined drug therapies (S<sub>1</sub>+S<sub>i</sub>)-P-O (i≥2) discovered by the proposed algorithm will be demonstrated such that the combined drugs will be first bound together and then directed to a specified disorder, while the supporting conclusive claims are shown on the right (<xref rid="figure2" ref-type="fig">Figure 2</xref>, left). Upon selecting the linked edge of interest, the specific claim regarding the combined medication will be amplified and highlighted (<xref rid="figure2" ref-type="fig">Figure 2</xref>, right). The JavaScript libraries Data-Driven Document (D<sup>3</sup>) [<xref ref-type="bibr" rid="ref28">28</xref>] was utilized to visualize the knowledge graph.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Customized knowledge graph visualization (left) and the conclusive claim being highlighted (right).</p>
          </caption>
          <graphic xlink:href="medinform_v8i4e18323_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p/>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Data Acquisition and Experimental Setup</title>
        <p>A summary of the steps taken to discover and identify combined drug therapies is shown in <xref rid="figure3" ref-type="fig">Figure 3</xref>. We retrieved 22,263 clinical trial reports and 31 clinical practice guidelines of PubMed abstracts for algorithm verification and validation, with the subject majored on “antineoplastic agents” for drug restriction (Jan 2009 to Oct 2019). The following PubMed queries were used to identify clinical articles:</p>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Study design.</p>
          </caption>
          <graphic xlink:href="medinform_v8i4e18323_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <list list-type="order">
          <list-item>
            <p>Clinical trial reports: ((“clinical trial” [Publication Type] OR “clinical trial, phase I” [Publication Type] OR “clinical trial, phase ii” [Publication Type] OR “clinical trial, phase iii” [Publication Type] OR “clinical trial, phase iv” [Publication Type]) OR “clinical study” [Publication Type]).</p>
          </list-item>
          <list-item>
            <p>Clinical practice guidelines: “guideline” [Publication Type]</p>
          </list-item>
        </list>
        <p>Using the keywords “conclusion*” and “conclude*”, 15,603 conclusive claims were locally segmented and preserved, then pushed into the batch mode of SemRep for semantic predication extraction. Initially, there were 21,234 semantic predications extracted from 9700 conclusive claims, while 8484 predications had semantic predicates focusing on disease treatment (“TREATS,” “INHIBITS,” “PREVENTS,” and “DISRUPTS”). We then employed the automated algorithm to discover knowledge about combined drug therapies while automatically filtering out pharmacologic actions and generic disease names. As a result, 325 candidate groups of semantic predications about combined drug therapies were discovered from 316 conclusive claims for further analysis and characterization.</p>
      </sec>
      <sec>
        <title>Evaluation</title>
        <p>Two biocurators annotated 325 candidate groups of semantic predications about combined medications, which were automatically discovered by the algorithm based on SemRep’s semantic predications from 316 conclusive claims. The primary criteria of the biocuration process were that (1) the discovered drugs were combined to treat the specific disease in a given claim, and a single therapy should be identified; (2) the efficacy of combined therapeutic must be promising and negation was disallowed; and (3) the drug name and disease name should be properly recognized by SemRep. Both biocurators independently evaluated all the candidates groups and identified 255 and 239 combined drug therapies (agreement rate 93.73%). Their disagreements mainly lay in the SemRep object “advanced cancer,” which came from more specific terminal malignancies studied in the conclusive claims (such as “advanced carcinomas of the head and neck” in PMID [PubMed ID] 21947123). After consulting a biomedical scientist with specific clinical knowledge, we accepted this kind of text mapping, acknowledging that advanced cancers usually spread from where they started to other parts of the body. Eventually, 255 of 325 (78.46%) groups of semantic predications were identified to be accurate drug combinations (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>), while 70 were determined to be inaccurate and further classified into 2 categories: limitations of SemRep and limitations of proposal.</p>
      </sec>
      <sec>
        <title>Knowledge Graph Construction Based on Identified Knowledge About Combined Medications</title>
        <p>Of the 255 identified combined drug therapies, 210 (82.35%) represented combinations of two drugs, 43 (16.86%) combined 3 agents, and 2 (0.78%) included 4 combined medications. These accurate drug combinations as well as their supporting claims were then used to build the knowledge graph based on customized data structure ((S<sub>1</sub>+S<sub>i</sub>)-P-O, i≥2). <xref rid="figure4" ref-type="fig">Figure 4</xref> shows a snapshot by searching for “Non-Small Cell Lung Carcinoma”.</p>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>Knowledge graph of combined drug therapies centered at “Non-Small Cell Lung Carcinoma”.</p>
          </caption>
          <graphic xlink:href="medinform_v8i4e18323_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Characteristics of Inaccurate Results</title>
        <p>There were 70 groups of semantic predications from the automated discovery which, upon manual inspection, were deemed inaccurate due to limitations of SemRep (25/70, 35.7%), or limitations of the proposed algorithm (45/70, 64.3%). These were further categorized to include Named Entity Recognition (NER; 8/70, 11.4%) and Semantic Predicate Extraction (SPR) error (17/70, 24.3%), as well as single therapy (40/70, 57.1%) or multiple combined therapies (5/70, 7.1%). <xref ref-type="table" rid="table3">Table 3</xref> summarizes the inaccurate results and their characteristics.</p>
      </sec>
      <sec>
        <title>Limitations of SemRep</title>
        <p>NER is one of the key tasks for knowledge discovery and information retrieval, usually implemented before SPR. In SemRep, NER will be executed by MetaMap, a highly configurable program mapping the biomedical entity to the UMLS Metathesaurus. However, due to the relatively limited coverage of the UMLS Metathesarus or the ambiguity of a given biomedical text, MetaMap may inadequately identify an entity, resulting in an improper semantic subject or object. For the first example in <xref ref-type="table" rid="table3">Table 3</xref>, “ED-SCLC” represents the abbreviation of “extensive-stage disease, small-cell lung cancer,” which is expected to map to “Small cell lung cancer extensive stage” (Concept Unique Identifier: C0278726), but not “Widespread Disease” (CUI: C0849867).</p>
        <p>SPR error is another example of SemRep imprecision. In particular, the keyword “failed” was sometimes ignored by SemRep when it appeared in a biomedical text (see the second example in <xref ref-type="table" rid="table3">Table 3</xref>), resulting in the semantic predicates “TREATS” instead of “NEG_TREATS.” To reduce frequency at which negative predications are extracted, we plan to preprocess conclusive claims to filter out negations before SemRep interpretation.</p>
      </sec>
      <sec>
        <title>Limitations of the Proposed Algorithm</title>
        <p>A majority (40/70, 57.1%) of inaccurate results from the automated algorithm were references to single therapies primarily in comparative clinical studies of two or more individual agents. SemRep’s predicate “COMPARED_WITH” may provide a means to filter out these predications. It is common for two or more combined drug therapies to be studied in one published clinical trial (the last claim in <xref ref-type="table" rid="table3">Table 3</xref>). Future work will focus on these issues to improve the performance of the proposed algorithm.</p>
        <p/>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Characteristics of inaccurate results from proposed automatic algorithm.</p>
          </caption>
          <table border="1" rules="groups" cellpadding="5" frame="hsides" width="1000" cellspacing="0">
            <col width="30"/>
            <col width="250"/>
            <col width="100"/>
            <col width="300"/>
            <col width="320"/>
            <thead>
              <tr valign="bottom">
                <td colspan="2">Explanation</td>
                <td>No.</td>
                <td>Example</td>
                <td>PMID_tx<sup>a</sup></td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="5">
                  <bold>Limitations of SemRep</bold>
                </td>
              </tr>
              <tr valign="top">
                <td rowspan="2"/>
                <td>NER error</td>
                <td>8</td>
                <td>bevacizumab-TREATS-<italic>Widespread Disease</italic><break/>Cisplatin-TREATS-<italic>Widespread Disease</italic><break/>Etoposide-TREATS-<italic>Widespread Disease</italic></td>
                <td>19826110.ab.12 CONCLUSION: The addition of bevacizumab to cisplatin and etoposide in patients with <italic>ED-SCLC</italic> results in …</td>
              </tr>
              <tr valign="top">
                <td>SPR error</td>
                <td>17</td>
                <td>ASA 404-<italic>TREATS</italic>-Non-Small Cell Lung Carcinoma<break/>Carboplatin-<italic>TREATS</italic>-Non-Small Cell Lung Carcinoma<break/>Paclitaxel-<italic>TREATS</italic>-Non-Small Cell Lung Carcinoma</td>
                <td>21709202.ab.11 CONCLUSION: The addition of ASA404 to carboplatin and paclitaxel, although generally well tolerated, <italic>failed</italic> to improve frontline efficacy in advanced NSCLC.</td>
              </tr>
              <tr valign="top">
                <td colspan="5">
                  <bold>Limitations of proposal</bold>
                </td>
              </tr>
              <tr valign="top">
                <td rowspan="2"/>
                <td>Single Therapy</td>
                <td>40</td>
                <td>pemetrexed-TREATS-Non-small cell lung cancer metastatic<break/>erlotinib-TREATS-Non-small cell lung cancer metastatic</td>
                <td>23661337.ab.9 CONCLUSION: Both pemetrexed and erlotinib had <italic>comparable</italic> efficacy in pre-treated patients with metastatic NSCLC.</td>
              </tr>
              <tr valign="top">
                <td>Multiple combined therapies</td>
                <td>5</td>
                <td>Custirsen-TREATS-Hormone refractory prostate cancer<break/>docetaxel-TREATS-Hormone refractory prostate cancer<break/>Mitoxantrone-TREATS-Hormone refractory prostate cancer</td>
                <td>21788353.ab.15 CONCLUSION: Custirsen plus <italic>either</italic> docetaxel <italic>or</italic> mitoxantrone was feasible in patients with progressive mCRPC following first-line docetaxel therapy.</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>PMID_tx: PubMed identifier, abstract, sentence number, and associated text</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Major Patterns of Combinations According to the Mechanisms of Drugs Being Combined</title>
        <p>Among 255 identified combined drug therapies, there were 142 specific drugs after duplicate removal. Classifying by mechanism, 125/142 (88.03%) are antineoplastic agents with 46/142 (32.39%) cytotoxic drugs, 59/142 (41.55%) targeted drugs, 11/142 (7.75%) immunotherapies, 3/142 (2.11%) hormonal drugs, and 6/142 (4.23%) other antineoplastic agents or adjuvant drugs.</p>
        <p>We investigated the patterns of identified knowledge based on the mechanism of antineoplastic agents and counted the number of drug combinations under each pattern (<xref ref-type="table" rid="table4">Table 4</xref>). Although there were fewer cytotoxic drugs than targeted agents, the most common pattern (68/255, 26.67%) were combinations of two cytotoxic drugs, which may provide statistical and practical insights to study new combination of antineoplastic agents for precision medicine. If an antineoplastic agent A produces the same cytotoxic effect as another drug B, and a combination of A and a third cytotoxic agent C has been approved to treat a specific malignancy, our findings suggest the feasibility of a novel combination of B and C (<xref ref-type="table" rid="table4">Table 4</xref>). Other possible combinations such as A+B and A+B+C may also be valuable to explore. Since various combinations can be followed to develop combined therapies, it is important to be aware of and remain current on all available clinical studies that may be relevant. Our knowledge graph will not only provide a visual representation of existing drug combinations, but also assist practitioners and experts to take full advantage of publicly disseminated clinical trials.</p>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>Major patterns of combined medication based on mechanisms of antineoplastic agents.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="500"/>
            <col width="500"/>
            <thead>
              <tr valign="top">
                <td>Combinations</td>
                <td>Number of Instances</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Cytotoxic + Cytotoxic</td>
                <td>68</td>
              </tr>
              <tr valign="top">
                <td>Targeted + Cytotoxic</td>
                <td>45</td>
              </tr>
              <tr valign="top">
                <td>Targeted + Targeted</td>
                <td>22</td>
              </tr>
              <tr valign="top">
                <td>Targeted + Cytotoxic + Cytotoxic</td>
                <td>17</td>
              </tr>
              <tr valign="top">
                <td>Cytotoxic + Other antineoplastic agent/adjuvant drugs</td>
                <td>15</td>
              </tr>
              <tr valign="top">
                <td>Immunotherapy + Targeted</td>
                <td>13</td>
              </tr>
              <tr valign="top">
                <td>Targeted + Other antineoplastic agent/adjuvant drugs</td>
                <td>11</td>
              </tr>
              <tr valign="top">
                <td>Immunotherapy + Cytotoxic</td>
                <td>10</td>
              </tr>
              <tr valign="top">
                <td>Cytotoxic + Cytotoxic + Cytotoxic</td>
                <td>6</td>
              </tr>
              <tr valign="top">
                <td>Others</td>
                <td>48</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Combined Drug Therapies Discovered in Published Clinical Trials and Clinical Practice Guidelines</title>
        <p>All of the combined drug therapies identified in this study were from published clinical trial reports, none of which has been included in clinical practice guidelines. We identified 28 of 31 (90.32%) abstracts in guidelines listed in PubMed by searching “antineoplastic agents” (Jan 2009 to Oct 2019). However, only 4/31 (12.90%) contained conclusive claims with the key words “conclusion*” and “conclude*”, with topics for single therapy (PMID: 20390116), intra-arterial chemotherapy (PMID: 23828325), curriculum in surgical oncology (PMID: 27145931), or drug management (PMID: 30381047). We then manually read the remaining guidelines and identified two combined drug therapies in one publication (PMID:21821491). We thus conclude that our method of parsing conclusive claims from PubMed abstracts may not be suitable for clinical practice guidelines, as a considerable number of these publications (87.10%) do not contain the necessary key words. Using structured abstracts after conversion or applying additional key words like “summar*” may improve the acquisition of conclusive claims. Although mentions of combined drug therapies are limited in clinical practice guidelines, our study focused on the discovery of combination therapies from published clinical trials, which inform the development of clinical practice guidelines.</p>
      </sec>
      <sec>
        <title>The Markers to Identify Potential Combined Drug Therapies</title>
        <p>The word “combin<bold>*</bold>” (namely “combine” or “combination”) is generally used to indicate the combined medication, an assumption affirmed by the data sampled here. Among 316 conclusive claims to automatically identified in this study (<xref ref-type="table" rid="table5">Table 5</xref>), 171 (54.11%) contain the marker “combin*” and 170 discuss drug combinations, while one described a combination of a drug and radiotherapy. We also noted “coadministration” (2 occurrences) and “co-administered” (1 occurrence) are markers similar to “combin*”, as is “regimen” (22 occurrence, 21 of which were for combined drug therapies) being an abbreviation of “antineoplastic combined chemotherapy regimens” [<xref ref-type="bibr" rid="ref29">29</xref>]. These markers will become key features in the development of our next deep learning–based knowledge discovery algorithm. After SemRep extraction of semantic relations from conclusive claims in the biomedical literature, we plan to add the Bidirectional Encoder Representations from Transformers [<xref ref-type="bibr" rid="ref30">30</xref>] model as a binary classifier using annotated data from two dimensions: the supporting conclusive claims and the factuality of semantic predications. The claims containing at least one of the identified markers will be used to classify the corresponding groups of semantic predications into positive knowledge about combined drug therapies.</p>
        <table-wrap position="float" id="table5">
          <label>Table 5</label>
          <caption>
            <p>Major makers to identify combined drug therapies.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="358"/>
            <col width="124"/>
            <col width="271"/>
            <col width="247"/>
            <thead>
              <tr valign="top">
                <td>Markers</td>
                <td>Occurrence</td>
                <td>Combined drug therapy</td>
                <td>Other therapy</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>combin*</td>
                <td>171</td>
                <td>170</td>
                <td>drug &#38; radiotherapy</td>
              </tr>
              <tr valign="top">
                <td>coadministration</td>
                <td>2</td>
                <td>2</td>
                <td>N/A<sup>a</sup></td>
              </tr>
              <tr valign="top">
                <td>co-administered</td>
                <td>1</td>
                <td>1</td>
                <td>N/A</td>
              </tr>
              <tr valign="top">
                <td>regimen (without markers above)</td>
                <td>22</td>
                <td>21</td>
                <td>Single therapy</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table5fn1">
              <p><sup>a</sup>N/A: not applicable.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>The Utility and Major Applications of the Knowledge Graph for Combined Drug Therapies</title>
        <p>The knowledge graph of combined drug therapies will be an appropriate supplement to most leading knowledge bases, similar to SemMedDB [<xref ref-type="bibr" rid="ref31">31</xref>], which is a widely used publicly available repository extracted from biomedical literature by SemRep. However, the lack of knowledge concerning combinatorial effects is an important limitation of SemMedDB. Our study seeks to fill this gap by providing the combined medications to enrich the coverage and information provided by SemMedDB and other biomedical knowledge systems.</p>
        <p>The proposed knowledge graph has two major applications. An information retrieval system can utilize the knowledge from our graph to integrate various external sources of knowledge and information. Since the subjects and objects of the presented combined medications were drawn from the UMLS Metathesaurus by SemRep, it should be straightforward to integrate our graph with UMLS’s source vocabularies for information retrieval, such as DrugBank, Disease Ontology, NCI thesaurus, SNOMEDCT, etc. Another major application is precision medicine and clinical decision-making support. Combined drug therapies provide an alternative to conventional single therapies especially for malignant disorders. In order to pursue clinical and therapeutic approaches to optimal disease management based on individual variations in a patient's genetic profile, it is useful for an expert working with the treatment of a specific cancer to know which other therapies could also fit in that clinical practice. Manually reading the tremendous literature to find available combinations is undoubtedly laborious and time-consuming. Our knowledge graph will help experts quickly and easily identify efficacious combined therapies that may not be immediately evident by a manual survey of published clinical studies.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>We have shown that semantic predications extracted from large-scale conclusive claims in biomedical research literature can be used to automatically discover and build a customized knowledge graph to represent existing knowledge about combination therapies. We found that additional filtering and evaluation steps were needed to accurately identify drug combinations from candidate results automatically discovered by the proposed algorithm. From 22,263 published clinical trials retrieved from PubMed, we automatically discovered 325 candidate groups of semantic predications, 255 of which (78.46%) were manually verified as accurate. Two major categories and four subcategories were identified to characterize 70 inaccurate results. To address this precision error, we conclude that additional filtering, context analysis, and feature extraction are required to eliminate single therapies and incorrect semantic predications of SemRep output through active learning [<xref ref-type="bibr" rid="ref32">32</xref>] or a factuality analyzer program [<xref ref-type="bibr" rid="ref33">33</xref>].</p>
        <p/>
        <p>The proposed algorithm can be generalized to automatically discover generic combined medications for all human disorders, not just malignant neoplasms. It is also likely that a larger number of combined drug therapies could be identified in other types of biomedical publications, such as meta-analysis and comparative studies, in which combined medications are frequently addressed.</p>
        <p>By characterizing the major patterns of combinations according to the individual drug mechanisms, we found that combinations of two cytotoxic drugs are the most common for cancer treatment. Moreover, four apparent markers (“combin*”, “coadministration”, “co-administered” and “regimen”) were extracted as key features to further develop the machine learning-based knowledge discovery algorithm.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Discovered combined drug therapies.</p>
        <media xlink:href="medinform_v8i4e18323_app1.txt" xlink:title="TXT File , 24 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">CUI</term>
          <def>
            <p>Concept Unique Identifier</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">MeSH</term>
          <def>
            <p>Medical Subject Headings</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">NER</term>
          <def>
            <p>Named Entity Recognition</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">PMID</term>
          <def>
            <p>PubMed ID/reference number</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">SemRep</term>
          <def>
            <p>Semantic Knowledge Representation</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">SPR</term>
          <def>
            <p>Semantic Predicate Extraction</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">UMLS</term>
          <def>
            <p>Unified Medical Language System</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This work was funded by the National Natural Science Foundation of China, grant number 71603280 and the Young Elite Scientists Sponsorship Program by China Association for Science and Technology, grant number 2017QNRC001.</p>
    </ack>
    <fn-group>
      <fn fn-type="con">
        <p>JD supervised the project and administered the work. XYL sampled data and implemented the experimental testing. XYL prepared the initial draft of the manuscript and JD revised it. Both authors provided contributions to the final version of the paper and approved it.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>OTA</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>AKATSUKA</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>NISHI</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>KATO</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>TAKEUCHI</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>TSUJI</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>FUKUUCHI</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Phase I Study of Combination Therapy With Weekly Nanoparticle Albumin-bound Paclitaxel and Cyclophosphamide in Metastatic Breast Cancer Patients</article-title>
          <source>Anticancer Res</source>
          <year>2019</year>
          <month>12</month>
          <day>06</day>
          <volume>39</volume>
          <issue>12</issue>
          <fpage>6903</fpage>
          <lpage>6907</lpage>
          <pub-id pub-id-type="doi">10.21873/anticanres.13910</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Morel</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Jeffery</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Aspeslagh</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Almouzni</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Postel-Vinay</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Combining epigenetic drugs with other therapies for solid tumours — past lessons and future promise</article-title>
          <source>Nat Rev Clin Oncol</source>
          <year>2019</year>
          <month>9</month>
          <day>30</day>
          <volume>17</volume>
          <issue>2</issue>
          <fpage>91</fpage>
          <lpage>107</lpage>
          <pub-id pub-id-type="doi">10.1038/s41571-019-0267-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Sanderson</surname>
              <given-names>PE</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Drug combination therapy increases successful drug repositioning</article-title>
          <source>Drug Discovery Today</source>
          <year>2016</year>
          <month>07</month>
          <volume>21</volume>
          <issue>7</issue>
          <fpage>1189</fpage>
          <lpage>1195</lpage>
          <pub-id pub-id-type="doi">10.1016/j.drudis.2016.05.015</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kumar</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Yadav</surname>
              <given-names>TT</given-names>
            </name>
            <name name-style="western">
              <surname>Khair</surname>
              <given-names>RR</given-names>
            </name>
            <name name-style="western">
              <surname>Peters</surname>
              <given-names>GJ</given-names>
            </name>
            <name name-style="western">
              <surname>Yergeri</surname>
              <given-names>MC</given-names>
            </name>
          </person-group>
          <article-title>Combination Therapies of Artemisinin and its Derivatives as a Viable Approach for Future Cancer Treatment</article-title>
          <source>CPD</source>
          <year>2019</year>
          <month>11</month>
          <day>14</day>
          <volume>25</volume>
          <issue>31</issue>
          <fpage>3323</fpage>
          <lpage>3338</lpage>
          <pub-id pub-id-type="doi">10.2174/1381612825666190902155957</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Printz</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Two‐drug combination benefits patients with chronic lymphocytic leukemia</article-title>
          <source>Cancer</source>
          <year>2019</year>
          <month>12</month>
          <day>11</day>
          <volume>126</volume>
          <issue>1</issue>
          <fpage>13</fpage>
          <lpage>13</lpage>
          <pub-id pub-id-type="doi">10.1002/cncr.32647</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nurdiati</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hoede</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>25 years development of knowledge graph theory: the results and the challenge</article-title>
          <source>Memorandum</source>
          <year>2008</year>
          <fpage>1876</fpage>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Salahuddin</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mushtaq</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Materson</surname>
              <given-names>BJ</given-names>
            </name>
          </person-group>
          <article-title>Combination therapy for hypertension 2013: An update</article-title>
          <source>Journal of the American Society of Hypertension</source>
          <year>2013</year>
          <month>9</month>
          <volume>7</volume>
          <issue>5</issue>
          <fpage>401</fpage>
          <lpage>407</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jash.2013.04.013</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shi</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Qi</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Pan</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Semantic Health Knowledge Graph: Semantic Integration of Heterogeneous Medical Knowledge and Services</article-title>
          <source>BioMed Research International</source>
          <year>2017</year>
          <volume>2017</volume>
          <fpage>1</fpage>
          <lpage>12</lpage>
          <pub-id pub-id-type="doi">10.1155/2017/2858423</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rotmensch</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Halpern</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Tlimat</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Horng</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sontag</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Learning a Health Knowledge Graph from Electronic Medical Records</article-title>
          <source>Sci Rep</source>
          <year>2017</year>
          <month>7</month>
          <day>20</day>
          <volume>7</volume>
          <issue>1</issue>
          <pub-id pub-id-type="doi">10.1038/s41598-017-05778-z</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lamurias</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ferreira</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Clarke</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Couto</surname>
              <given-names>FM</given-names>
            </name>
          </person-group>
          <article-title>Generating a Tolerogenic Cell Therapy Knowledge Graph from Literature</article-title>
          <source>Front. Immunol</source>
          <year>2017</year>
          <month>11</month>
          <day>29</day>
          <volume>8</volume>
          <pub-id pub-id-type="doi">10.3389/fimmu.2017.01656</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vlietstra</surname>
              <given-names>WJ</given-names>
            </name>
            <name name-style="western">
              <surname>Zielman</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>van Dongen</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Schultes</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Wiesman</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Vos</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>van Mulligen</surname>
              <given-names>EM</given-names>
            </name>
            <name name-style="western">
              <surname>Kors</surname>
              <given-names>JA</given-names>
            </name>
          </person-group>
          <article-title>Automated extraction of potential migraine biomarkers using a semantic graph</article-title>
          <source>Journal of Biomedical Informatics</source>
          <year>2017</year>
          <month>07</month>
          <volume>71</volume>
          <fpage>178</fpage>
          <lpage>189</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2017.05.018</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vlietstra</surname>
              <given-names>WJ</given-names>
            </name>
            <name name-style="western">
              <surname>Vos</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Sijbers</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>van Mulligen</surname>
              <given-names>EM</given-names>
            </name>
            <name name-style="western">
              <surname>Kors</surname>
              <given-names>JA</given-names>
            </name>
          </person-group>
          <article-title>Using predicate and provenance information from a knowledge graph for drug efficacy screening</article-title>
          <source>J Biomed Semant</source>
          <year>2018</year>
          <month>9</month>
          <day>6</day>
          <volume>9</volume>
          <issue>1</issue>
          <pub-id pub-id-type="doi">10.1186/s13326-018-0189-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>CH</given-names>
            </name>
            <name name-style="western">
              <surname>Khoo</surname>
              <given-names>CSG</given-names>
            </name>
            <name name-style="western">
              <surname>Na</surname>
              <given-names>JC</given-names>
            </name>
          </person-group>
          <article-title>Automatic identification of treatment relations for medical ontology learning: An exploratory study</article-title>
          <year>2004</year>
          <month>07</month>
          <day>13</day>
          <conf-name>In: Proceedings of the Eighth International ISKO Conference . Wurzburg, Germanyrgon Verlag. FREE Full text</conf-name>
          <conf-date>2004</conf-date>
          <conf-loc>London</conf-loc>
          <fpage>245</fpage>
          <lpage>250</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Q</given-names>
            </name>
          </person-group>
          <article-title>Large-scale extraction of accurate drug-disease treatment pairs from biomedical literature for drug repurposing</article-title>
          <source>BMC Bioinformatics</source>
          <year>2013</year>
          <month>6</month>
          <day>6</day>
          <volume>14</volume>
          <issue>1</issue>
          <fpage>181</fpage>
          <lpage>191</lpage>
          <pub-id pub-id-type="doi">10.1186/1471-2105-14-181</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>ES</given-names>
            </name>
            <name name-style="western">
              <surname>Hripcsak</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Markatou</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Friedman</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Automated Acquisition of Disease-Drug Knowledge from Biomedical and Clinical Documents: An Initial Study</article-title>
          <source>Journal of the American Medical Informatics Association</source>
          <year>2008</year>
          <month>01</month>
          <day>01</day>
          <volume>15</volume>
          <issue>1</issue>
          <fpage>87</fpage>
          <lpage>98</lpage>
          <pub-id pub-id-type="doi">10.1197/jamia.m2401</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>CC</given-names>
            </name>
          </person-group>
          <article-title>Drug Repositioning to Accelerate Drug Development Using Social Media Data: Computational Study on Parkinson Disease</article-title>
          <source>J Med Internet Res</source>
          <year>2018</year>
          <month>10</month>
          <day>11</day>
          <volume>20</volume>
          <issue>10</issue>
          <fpage>e271</fpage>
          <pub-id pub-id-type="doi">10.2196/jmir.9646</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bchir</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Karaa</surname>
              <given-names>WBA</given-names>
            </name>
          </person-group>
          <article-title>Extraction of drug-disease relations from MEDLINE abstracts</article-title>
          <year>2013</year>
          <month>06</month>
          <day>22</day>
          <conf-name>InWorld Congress on Computer and Information Technology (WCCIT). IEEE</conf-name>
          <conf-date>2013</conf-date>
          <conf-loc>Sousse, Tunisia</conf-loc>
          <fpage>1</fpage>
          <lpage>3</lpage>
          <pub-id pub-id-type="doi">10.1109/wccit.2013.6618759</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Predicting drug-disease interactions by semi-supervised graph cut algorithm and three-layer data integration</article-title>
          <source>BMC Med Genomics</source>
          <year>2017</year>
          <month>12</month>
          <day>28</day>
          <volume>10</volume>
          <issue>S5</issue>
          <pub-id pub-id-type="doi">10.1186/s12920-017-0311-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Lang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Ning</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Du</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Knowledge-guided convolutional networks for chemical-disease relation extraction</article-title>
          <source>BMC Bioinformatics</source>
          <year>2019</year>
          <month>5</month>
          <day>21</day>
          <volume>20</volume>
          <issue>1</issue>
          <pub-id pub-id-type="doi">10.1186/s12859-019-2873-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rindflesch</surname>
              <given-names>TC</given-names>
            </name>
            <name name-style="western">
              <surname>Fiszman</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>The interaction of domain knowledge and linguistic structure in natural language processing: interpreting hypernymic propositions in biomedical text</article-title>
          <source>Journal of Biomedical Informatics</source>
          <year>2003</year>
          <month>12</month>
          <volume>36</volume>
          <issue>6</issue>
          <fpage>462</fpage>
          <lpage>477</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2003.11.003</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cong</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Feng</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Rao</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Tao</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Constructing Biomedical Knowledge Graph Based on SemMedDB and Linked Open Data</article-title>
          <year>2018</year>
          <month>12</month>
          <day>3</day>
          <conf-name>InIEEE International Conference on Bioinformatics and Biomedicine (BIBM). IEEE</conf-name>
          <conf-date>2018</conf-date>
          <conf-loc>Madrid, Spain</conf-loc>
          <fpage>1628</fpage>
          <lpage>1631</lpage>
          <pub-id pub-id-type="doi">10.1109/bibm.2018.8621568</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rosemblat</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Fiszman</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Shin</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Kilicoglu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Towards a characterization of apparent contradictions in the biomedical literature using context analysis</article-title>
          <source>Journal of Biomedical Informatics</source>
          <year>2019</year>
          <month>10</month>
          <volume>98</volume>
          <fpage>103275</fpage>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2019.103275</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Bill</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Fiszman</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Rindflesch</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Pedersen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Melton</surname>
              <given-names>GB</given-names>
            </name>
            <name name-style="western">
              <surname>Pakhomov</surname>
              <given-names>SV</given-names>
            </name>
          </person-group>
          <article-title>Using SemRep to label semantic relations extracted from clinical text</article-title>
          <year>2012</year>
          <month>11</month>
          <day>03</day>
          <conf-name>In: AMIA annual symposium proceedings. American Medical Informatics Association, , . FREE Full text Medline</conf-name>
          <conf-date>2012</conf-date>
          <conf-loc>Chicago, Illinois</conf-loc>
          <fpage>A</fpage>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Cairelli</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Fiszman</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Rosemblat</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Kilicoglu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Rindflesch</surname>
              <given-names>TC</given-names>
            </name>
            <name name-style="western">
              <surname>Pakhomov</surname>
              <given-names>SV</given-names>
            </name>
            <name name-style="western">
              <surname>Melton</surname>
              <given-names>GB</given-names>
            </name>
          </person-group>
          <article-title>Using semantic predications to uncover drug–drug interactions in clinical data</article-title>
          <source>Journal of Biomedical Informatics</source>
          <year>2014</year>
          <month>06</month>
          <volume>49</volume>
          <fpage>134</fpage>
          <lpage>147</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2014.01.004</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fathiamini</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Zeng</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Araya</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Holla</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Bailey</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Litzenburger</surname>
              <given-names>BC</given-names>
            </name>
            <name name-style="western">
              <surname>Sanchez</surname>
              <given-names>NS</given-names>
            </name>
            <name name-style="western">
              <surname>Khotskaya</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Meric-Bernstam</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Bernstam</surname>
              <given-names>EV</given-names>
            </name>
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Automated identification of molecular effects of drugs (AIMED)</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2016</year>
          <month>04</month>
          <day>23</day>
          <volume>23</volume>
          <issue>4</issue>
          <fpage>758</fpage>
          <lpage>765</lpage>
          <pub-id pub-id-type="doi">10.1093/jamia/ocw030</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="web">
          <source>Accessed November 19</source>
          <year>2019</year>
          <month>11</month>
          <day>01</day>
          <access-date>2019-11-01</access-date>
          <comment>Medline pubmed production statistics<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.nlm.nih.gov/bsd/medline_pubmed_production_stats.html">https://www.nlm.nih.gov/bsd/medline_pubmed_production_stats.html</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kilicoglu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Rosemblat</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Fiszman</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Rindflesch</surname>
              <given-names>TC</given-names>
            </name>
          </person-group>
          <article-title>Constructing a semantic predication gold standard from the biomedical literature</article-title>
          <source>BMC Bioinformatics</source>
          <year>2011</year>
          <month>12</month>
          <day>20</day>
          <volume>12</volume>
          <issue>1</issue>
          <pub-id pub-id-type="doi">10.1186/1471-2105-12-486</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bostock</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ogievetsky</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Heer</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>D³ Data-Driven Documents</article-title>
          <source>IEEE Trans. Visual. Comput. Graphics</source>
          <year>2011</year>
          <month>12</month>
          <volume>17</volume>
          <issue>12</issue>
          <fpage>2301</fpage>
          <lpage>2309</lpage>
          <pub-id pub-id-type="doi">10.1109/tvcg.2011.185</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="web">
          <source>MeSH Thesaurus</source>
          <access-date>2020-04-22</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://meshb.nlm.nih.gov/record/ui?ui=D000971">https://meshb.nlm.nih.gov/record/ui?ui=D000971</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Devlin</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>MW</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Toutanova</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>BERT: Pre-training of Deep Bidirectional Transformers for Language Understanding</article-title>
          <source>Computation and Language, 1-16. FREE Full text</source>
          <year>2019</year>
          <month>05</month>
          <day>04</day>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kilicoglu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Shin</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Fiszman</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Rosemblat</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Rindflesch</surname>
              <given-names>TC</given-names>
            </name>
          </person-group>
          <article-title>SemMedDB: a PubMed-scale repository of biomedical semantic predications</article-title>
          <source>Bioinformatics</source>
          <year>2012</year>
          <month>10</month>
          <day>08</day>
          <volume>28</volume>
          <issue>23</issue>
          <fpage>3158</fpage>
          <lpage>3160</lpage>
          <pub-id pub-id-type="doi">10.1093/bioinformatics/bts591</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vasilakes</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Rizvi</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Melton</surname>
              <given-names>GB</given-names>
            </name>
          </person-group>
          <article-title>Evaluating active learning methods for annotating semantic predications</article-title>
          <source>JAMIA open, . FREE Full text  3074</source>
          <year>2018</year>
          <volume>1</volume>
          <issue>2</issue>
          <fpage>0594</fpage>
          <lpage>282</lpage>
          <pub-id pub-id-type="doi">10.1093/jamiaopen/ooy021</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kilicoglu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Rosemblat</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Rindflesch</surname>
              <given-names>TC</given-names>
            </name>
          </person-group>
          <article-title>Assigning factuality values to semantic relations extracted from biomedical research literature</article-title>
          <source>PLoS ONE</source>
          <year>2017</year>
          <month>7</month>
          <day>5</day>
          <volume>12</volume>
          <issue>7</issue>
          <fpage>e0179926</fpage>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0179926</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
