<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id>
      <journal-title>JMIR Medical Informatics</journal-title>
      <issn pub-type="epub">2291-9694</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v8i8e16948</article-id>
      <article-id pub-id-type="pmid">32759099</article-id>
      <article-id pub-id-type="doi">10.2196/16948</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Semantic Deep Learning: Prior Knowledge and a Type of Four-Term Embedding Analogy to Acquire Treatments for Well-Known Diseases</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Eysenbach</surname>
            <given-names>Gunther</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>He</surname>
            <given-names>Zhe</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Arguello Casteleiro</surname>
            <given-names>Mercedes</given-names>
          </name>
          <degrees>DPhil</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9469-2068</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Des Diz</surname>
            <given-names>Julio</given-names>
          </name>
          <degrees>DPhil, MD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7121-4450</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Maroto</surname>
            <given-names>Nava</given-names>
          </name>
          <degrees>DPhil</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0349-7716</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Fernandez Prieto</surname>
            <given-names>Maria Jesus</given-names>
          </name>
          <degrees>DPSI</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2312-1414</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Peters</surname>
            <given-names>Simon</given-names>
          </name>
          <degrees>DPhil</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-7317-9182</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Wroe</surname>
            <given-names>Chris</given-names>
          </name>
          <degrees>BChir, MD</degrees>
          <xref rid="aff6" ref-type="aff">6</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6538-8187</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Sevillano Torrado</surname>
            <given-names>Carlos</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8689-3580</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Maseda Fernandez</surname>
            <given-names>Diego</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff7" ref-type="aff">7</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-2678-3360</ext-link>
        </contrib>
        <contrib id="contrib9" contrib-type="author" corresp="yes" equal-contrib="yes">
          <name name-style="western">
            <surname>Stevens</surname>
            <given-names>Robert</given-names>
          </name>
          <degrees>DPhil</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Department of Computer Science</institution>
            <institution>University of Manchester</institution>
            <addr-line>Kilburn Building, Oxford Road, M13 9PL</addr-line>
            <addr-line>Manchester, </addr-line>
            <country>United Kingdom</country>
            <phone>44 161 275 6251</phone>
            <email>robert.stevens@manchester.ac.uk</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6038-9025</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Department of Computer Science</institution>
        <institution>University of Manchester</institution>
        <addr-line>Manchester</addr-line>
        <country>United Kingdom</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Hospital do Salnés</institution>
        <addr-line>Villagarcía de Arousa</addr-line>
        <country>Spain</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Departamento de Lingüística Aplicada a la Ciencia y a la Tecnología</institution>
        <institution>Universidad Politécnica de Madrid</institution>
        <addr-line>Madrid</addr-line>
        <country>Spain</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Salford Languages</institution>
        <institution>University of Salford</institution>
        <addr-line>Salford</addr-line>
        <country>United Kingdom</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>School of Social Sciences</institution>
        <institution>University of Manchester</institution>
        <addr-line>Manchester</addr-line>
        <country>United Kingdom</country>
      </aff>
      <aff id="aff6">
        <label>6</label>
        <institution>BMJ</institution>
        <addr-line>London</addr-line>
        <country>United Kingdom</country>
      </aff>
      <aff id="aff7">
        <label>7</label>
        <institution>Mid Cheshire Hospital Foundation Trust</institution>
        <institution>NHS England</institution>
        <addr-line>Crewe</addr-line>
        <country>United Kingdom</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Robert Stevens <email>robert.stevens@manchester.ac.uk</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>8</month>
        <year>2020</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>6</day>
        <month>8</month>
        <year>2020</year>
      </pub-date>
      <volume>8</volume>
      <issue>8</issue>
      <elocation-id>e16948</elocation-id>
      <history>
        <date date-type="received">
          <day>6</day>
          <month>11</month>
          <year>2019</year>
        </date>
        <date date-type="rev-request">
          <day>28</day>
          <month>11</month>
          <year>2019</year>
        </date>
        <date date-type="rev-recd">
          <day>27</day>
          <month>2</month>
          <year>2020</year>
        </date>
        <date date-type="accepted">
          <day>27</day>
          <month>2</month>
          <year>2020</year>
        </date>
      </history>
      <copyright-statement>©Mercedes Arguello Casteleiro, Julio Des Diz, Nava Maroto, Maria Jesus Fernandez Prieto, Simon Peters, Chris Wroe, Carlos Sevillano Torrado, Diego Maseda Fernandez, Robert Stevens. Originally published in JMIR Medical Informatics (http://medinform.jmir.org), 06.08.2020.</copyright-statement>
      <copyright-year>2020</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on http://medinform.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://medinform.jmir.org/2020/8/e16948" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>How to treat a disease remains to be the most common type of clinical question. Obtaining evidence-based answers from biomedical literature is difficult. Analogical reasoning with embeddings from deep learning (embedding analogies) may extract such biomedical facts, although the state-of-the-art focuses on pair-based proportional (pairwise) analogies such as man:woman::king:queen (“<italic>queen = −man +king +woman</italic>”).</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study aimed to systematically extract disease treatment statements with a Semantic Deep Learning (SemDeep) approach underpinned by prior knowledge and another type of 4-term analogy (other than pairwise).</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>As preliminaries, we investigated Continuous Bag-of-Words (CBOW) embedding analogies in a common-English corpus with five lines of text and observed a type of 4-term analogy (not pairwise) applying the 3CosAdd formula and relating the semantic fields <italic>person</italic> and <italic>death</italic>: “dagger = −Romeo +die +died” (search query: −<italic>Romeo +die +died</italic>). Our SemDeep approach worked with pre-existing items of knowledge (what is known) to make inferences sanctioned by a 4-term analogy (search query −<italic>x +z1 +z2</italic>) from CBOW and Skip-gram embeddings created with a PubMed systematic reviews subset (PMSB dataset). Stage1: Knowledge acquisition. Obtaining a set of terms, candidate y, from embeddings using vector arithmetic. Some n-gram pairs from the cosine and validated with evidence (prior knowledge) are the input for the 3cosAdd, seeking a type of 4-term analogy relating the semantic fields disease and treatment. Stage 2: Knowledge organization. Identification of candidates sanctioned by the analogy belonging to the semantic field treatment and mapping these candidates to unified medical language system Metathesaurus concepts with MetaMap. A concept pair is a brief disease treatment statement (biomedical fact). Stage 3: Knowledge validation. An evidence-based evaluation followed by human validation of biomedical facts potentially useful for clinicians.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>We obtained 5352 n-gram pairs from 446 search queries by applying the 3CosAdd. The microaveraging performance of MetaMap for candidate <italic>y</italic> belonging to the semantic field <italic>treatment</italic> was F-measure=80.00% (precision=77.00%, recall=83.25%). We developed an empirical heuristic with some predictive power for <italic>clinical winners</italic>, that is, search queries bringing candidate <italic>y</italic> with evidence of a therapeutic intent for target disease <italic>x</italic>. The search queries <italic>-asthma +inhaled_corticosteroids +inhaled_corticosteroid</italic> and <italic>-epilepsy +valproate +antiepileptic_drug</italic> were <italic>clinical winners</italic>, finding eight evidence-based beneficial treatments.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Extracting treatments with therapeutic intent by analogical reasoning from embeddings (423K n-grams from the PMSB dataset) is an ambitious goal. Our SemDeep approach is knowledge-based, underpinned by embedding analogies that exploit prior knowledge. Biomedical facts from embedding analogies (4-term type, not pairwise) are potentially useful for clinicians. The heuristic offers a practical way to discover beneficial treatments for well-known diseases. Learning from deep learning models does not require a massive amount of data. Embedding analogies are not limited to pairwise analogies; hence, analogical reasoning with embeddings is underexploited.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>evidence-based practice</kwd>
        <kwd>artificial intelligence</kwd>
        <kwd>deep learning</kwd>
        <kwd>semantic deep learning</kwd>
        <kwd>analogical reasoning</kwd>
        <kwd>embedding analogies</kwd>
        <kwd>PubMed</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>How to treat a disease or condition remains to be the most common type of clinical question [<xref ref-type="bibr" rid="ref1">1</xref>]. It is difficult for clinicians to obtain comprehensive information on the clinical (and economic) worth of alternative drug choices for a given condition [<xref ref-type="bibr" rid="ref2">2</xref>]. Evidence-based biomedical literature, although available in electronic form, primarily remains to be expert-to-expert communication—natural language statements intended for human consumption.</p>
      <p>Analogical reasoning is basic relational reasoning without explicit representations of relations [<xref ref-type="bibr" rid="ref3">3</xref>]. An acknowledged semantic property of embeddings (ie, vectors representing terms) from deep learning [<xref ref-type="bibr" rid="ref4">4</xref>] is “<italic>their ability to capture relational meanings</italic>” [<xref ref-type="bibr" rid="ref5">5</xref>], the so-called analogies [<xref ref-type="bibr" rid="ref6">6</xref>]. Current efforts in analogical reasoning with embeddings focus on pair-based proportional analogies [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref8">8</xref>]. This is a type of “<italic>the four-term analogy</italic>” [<xref ref-type="bibr" rid="ref6">6</xref>], also known as the cross-mapping analogy [<xref ref-type="bibr" rid="ref6">6</xref>]. An example is <italic>queen = −man +king +woman</italic> [<xref ref-type="bibr" rid="ref9">9</xref>], also represented as man:woman::king:queen [<xref ref-type="bibr" rid="ref10">10</xref>], and read as “<italic>man is to king as woman is to queen</italic>” [<xref ref-type="bibr" rid="ref11">11</xref>]. Examples for health care include the following:</p>
      <list list-type="bullet">
        <list-item>
          <p>“<italic>'acetaminophen' is as type of 'drug' as 'diabetes' is as type of ‘disease’</italic>” [<xref ref-type="bibr" rid="ref12">12</xref>].</p>
        </list-item>
        <list-item>
          <p>“<italic>(furosemide - kidney) + heart ~ fosinopril</italic>” [<xref ref-type="bibr" rid="ref13">13</xref>].</p>
        </list-item>
      </list>
      <p>This study aimed to investigate embedding analogies (analogical reasoning with embeddings) [<xref ref-type="bibr" rid="ref5">5</xref>] that are not pair-based proportional (pairwise for short) analogies. This study began by observing senior clinicians performing an analogical reasoning for sepsis (a major life-threatening condition) with embeddings and posing search queries such as <italic>−sepsis +serum_albumin +fluid_therapy</italic> to discover treatments with therapeutic intent. The clinical rationale behind this query is that “<italic>current evidence suggests that resuscitation using albumin-containing solutions is safe</italic>” [<xref ref-type="bibr" rid="ref14">14</xref>], where <italic>serum_albumin</italic> is a shortened form of “<italic>human serum albumin supplementation</italic>” (extensively debated for sepsis [<xref ref-type="bibr" rid="ref15">15</xref>]). We viewed this as another type of <italic>the four-term analogy,</italic> which is not pairwise.</p>
      <p>This paper presents a semiautomatic approach to extract meaning (semantics) from the unstructured free text of biomedical literature (ie, PubMed systematic reviews [<xref ref-type="bibr" rid="ref16">16</xref>]). The disease treatment statements systematically acquired from analogical reasoning are biomedical facts validated with evidence first and human audit afterward. The approach presented belongs to Semantic Deep Learning (SemDeep) [<xref ref-type="bibr" rid="ref17">17</xref>], as we used embedding analogies (other than pairwise) and semantic knowledge representation paradigms [<xref ref-type="bibr" rid="ref18">18</xref>] to provide meaning for the same.</p>
      <sec>
        <title>Analogical Reasoning</title>
        <p>Humans possess the ability to reason by analogy using abstract semantic relations such as synonyms or category membership [<xref ref-type="bibr" rid="ref3">3</xref>]. For example, <italic>common cold</italic> and <italic>influenza</italic> are both types of illnesses with some common symptoms such as runny nose, sore throat, cough, and headache. As they share some key characteristics, we can possibly say they are near-synonyms, although they cannot be used interchangeably (as synonyms would) because of key medical differences. Our SemDeep approach acquires terms about treatments for a well-known disease using analogical reasoning that is underpinned by Aristotle’s theory [<xref ref-type="bibr" rid="ref19">19</xref>]:</p>
        <list list-type="bullet">
          <list-item>
            <p>“<italic>The strength of an analogy depends upon the number of similarities</italic>” [<xref ref-type="bibr" rid="ref19">19</xref>]. For example, “intravenous antibiotics” and “intravenous fluid resuscitation” are basic therapies that improve outcomes in patients with sepsis [<xref ref-type="bibr" rid="ref14">14</xref>], that is, both are treatments with a therapeutic intent for sepsis. However, we cannot say that they are similar as “intravenous fluid resuscitation” is a procedure whereas an “intravenous antibiotic” is a substance, although both are “intravenous.”</p>
          </list-item>
          <list-item>
            <p>“<italic>Similarity reduces to identical properties and relations</italic>” [<xref ref-type="bibr" rid="ref19">19</xref>]. For example, “benzyl penicillin,” “cefotaxime,” or “amoxicillin/clavulanate” is similar as they belong to the same category, “antipseudomonal beta-lactam antibiotics” [<xref ref-type="bibr" rid="ref14">14</xref>].</p>
          </list-item>
          <list-item>
            <p>"<italic>Good analogies derive from underlying common causes or general laws</italic>” [<xref ref-type="bibr" rid="ref19">19</xref>]. This study investigated the systematic acquisition of treatments for a disease using the simple generic 3CosAdd formula [<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref21">21</xref>].</p>
          </list-item>
        </list>
      </sec>
      <sec>
        <title>The 3CosAdd Formula</title>
        <p>Our work relied on vector semantics [<xref ref-type="bibr" rid="ref5">5</xref>] and used the neural language models, Continuous Bag-of-Words (CBOW) and Skip-gram by Mikolov et al [<xref ref-type="bibr" rid="ref20">20</xref>], from deep learning to create embeddings. Embeddings with vector semantics such as cosine or 3CosAdd can acquire a list of strings of characters (eg, n-grams), although they lack explicit semantic meaning. Until now, the 3CosAdd formula 1 [<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref21">21</xref>] has been applied to analogies between 2 pairs of words a:a*::b:b* [<xref ref-type="bibr" rid="ref7">7</xref>], where b* is the unknown (hidden) word.</p>
        <graphic xlink:href="medinform_v8i8e16948_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        <p>We used the 3CosAdd formula as in Levy and Goldberg [<xref ref-type="bibr" rid="ref21">21</xref>] with the rewording “<italic>find the term y, which is similar to the term z1 and the term z2, while different from the term x</italic>”, where the target term <italic>x</italic> provides the semantic context and similar refers to the terms sharing “commonalities in structural features.” In this study, a semantic field is a set of terms that “<italic>belong together under the same conceptual heading</italic>” [<xref ref-type="bibr" rid="ref22">22</xref>] and is a form of knowledge representation that provides meaning to those terms. We rewrote the 3CosAdd formula as formula 2, with the search query <italic>-x +z1 +z2</italic>, and the type of 4-term analogy we sought had the following:</p>
        <list list-type="bullet">
          <list-item>
            <p>The target term <italic>x</italic> belonging to the semantic field <italic>disease</italic> and representing a medical diagnosis mappable to a “type of” of systematized nomenclature of medicine - clinical terms (SNOMED CT) [<xref ref-type="bibr" rid="ref23">23</xref>] concept called disorder.</p>
          </list-item>
          <list-item>
            <p>The 3 terms {<italic>z1; z2; y</italic>} belonging to the semantic field <italic>treatment</italic>(Tx for short), where Tx encompasses 3 textual definitions from Hart et al [<xref ref-type="bibr" rid="ref24">24</xref>]. The candidate term <italic>y</italic> is the unknown.</p>
          </list-item>
        </list>
        <graphic xlink:href="medinform_v8i8e16948_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </sec>
      <sec>
        <title>The Research Questions</title>
        <p>We adopted the view by Hill et al [<xref ref-type="bibr" rid="ref25">25</xref>] by considering “relatedness” as “association” and synonymy as the strongest similarity. In this study, the association relationship of interest is “correlation,” as defined in the semantic science integrated ontology (SIO) [<xref ref-type="bibr" rid="ref26">26</xref>].</p>
        <p>As preliminaries, we asked 2 research questions not specific to the health care domain:</p>
        <list list-type="bullet">
          <list-item>
            <p>Q1: Can “good” embeddings be created with a small corpus?</p>
          </list-item>
          <list-item>
            <p>Q2: If the simple generic 3CosAdd formula [<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref21">21</xref>] can capture a type of 4-term analogy as read in formula 2, can they be observed in embeddings created with a small corpus?</p>
          </list-item>
        </list>
        <p>Our third research question (Q3) asked whether the 4-term type of analogy discovered in a small common-English corpus can also be discovered in a larger-scale biomedical corpus. To provide proof of such a generalization, we performed a real-world test with embeddings created with free text from PubMed systematic reviews [<xref ref-type="bibr" rid="ref16">16</xref>]. We postulated that candidate inferences can be validated using evidence-based information resources. This study investigated the discovery of <italic>clinical winners</italic>, that is, search queries <italic>-x +z1 +z2</italic> bringing candidate treatments <italic>y</italic> with evidence of a therapeutic intent for target disease <italic>x</italic>; thus, enabling the most common type of clinical question, “how to treat a disease or condition” [<xref ref-type="bibr" rid="ref1">1</xref>], to be answered.</p>
        <p>Our final research question (Q4) asked for some predictive power over the <italic>clinical winners</italic> obtained (ie, an empirical heuristic) if our SemDeep approach worked, that is the type of analogy proposed finds disease treatment statements from PubMed systematic reviews (ie, a larger-scale biomedical corpus). This last question pursued a tacit preference and referred to the final characteristic of analogy: systematicity [<xref ref-type="bibr" rid="ref6">6</xref>]. However, challenges have been acknowledged “for any vector space model that aims to make predictions about relational similarity” [<xref ref-type="bibr" rid="ref27">27</xref>].</p>
        <p>Between the semantic field <italic>disease</italic> and the semantic field <italic>treatment</italic>, “<italic>few maximal structurally consistent interpretations (ie, mappings displaying one-to-one correspondences and parallel connectivity)</italic>” [<xref ref-type="bibr" rid="ref6">6</xref>] are to be expected. For example, aspirin treatment does not have a one-to-one correspondence with a disease as it can treat headache (common knowledge) and acute myocardial infarction [<xref ref-type="bibr" rid="ref1">1</xref>]. In this study, “spontaneous unplanned inferences” [<xref ref-type="bibr" rid="ref6">6</xref>] were also expected, and this propensity was captured with the notion of incremental mappings [<xref ref-type="bibr" rid="ref6">6</xref>].</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Overview</title>
        <p>Our SemDeep approach answered Q3 and comprised the 3 stages depicted in <xref rid="figure1" ref-type="fig">Figure 1</xref>. The software package word2vec [<xref ref-type="bibr" rid="ref28">28</xref>] implements the CBOW and Skip-gram algorithms along with the cosine and 3CosAdd formulas. The terms in this study are n-grams.</p>
        <p>Stage 1 used prior knowledge (open-access reusable datasets [<xref ref-type="bibr" rid="ref29">29</xref>]) consisting of n-gram pairs obtained by applying the cosine to embeddings, then mapped to the Unified Medical Language System (UMLS) Metathesaurus [<xref ref-type="bibr" rid="ref30">30</xref>] concept pairs, and finally validated with evidence from biomedical literature using the British Medical Journal (BMJ) Best Practice [<xref ref-type="bibr" rid="ref31">31</xref>] as the main information source.</p>
        <p>BMJ Best Practice is separate from PubMed/MEDLINE [<xref ref-type="bibr" rid="ref32">32</xref>] and is acknowledged for its editorial quality and evidence-based methodology [<xref ref-type="bibr" rid="ref33">33</xref>]. In the United Kingdom, BMJ Best Practice is provided (free access) to all National Health Service (NHS) health care professionals in England, Scotland, and Wales [<xref ref-type="bibr" rid="ref34">34</xref>]. BMJ Best Practice provides advice on symptom evaluation, tests to order, and treatment approach structured around the patient consultation.</p>
        <p>We started by investigating embedding analogies in a small common-English corpus to answer Q1 and Q2.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Overview of our SemDeep approach.</p>
          </caption>
          <graphic xlink:href="medinform_v8i8e16948_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Preliminaries: Analogies for Shakespeare’s Romeo in a Small Common-English Corpus</title>
        <p>Topic models are related to semantic fields [<xref ref-type="bibr" rid="ref5">5</xref>]. There are many small corpora and tutorials illustrating the inner workings of topic models, such as the spatially motivated Latent Semantic Analysis (LSA) method [<xref ref-type="bibr" rid="ref35">35</xref>] and the probabilistic method latent Dirichlet allocation (LDA) [<xref ref-type="bibr" rid="ref36">36</xref>]. We used a small common-English corpus appearing in an LSA tutorial [<xref ref-type="bibr" rid="ref37">37</xref>]. <xref ref-type="boxed-text" rid="box1">Textbox 1</xref> shows the corpus used to answer Q1 and Q2.</p>
        <boxed-text id="box1" position="float">
          <title>A small common-English corpus consisting of 5 lines of text.</title>
          <p>Romeo and Juliet</p>
          <p>Juliet: Oh happy dagger!</p>
          <p>Romeo died by dagger.</p>
          <p>“Live free or die”, that’s the New-Hampshire’s motto</p>
          <p>Did you know New-Hampshire is in New-England?</p>
        </boxed-text>
        <p>In common English, punctuation marks can change the meaning of a sentence. For example, “prevail, not perish” versus “prevail not, perish.” We did not transform routine letters into lowercase letters and did not remove punctuation marks, with the only exception of double quotations. <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> contains the input text and the hyperparameter configuration for the CBOW model with word2vec [<xref ref-type="bibr" rid="ref28">28</xref>].</p>
        <p>Below, we summarize the answers to Q1 and Q2 (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>):</p>
        <list list-type="bullet">
          <list-item>
            <p>Answer to Q1: A “good” vector semantic model should find a candidate <italic>y</italic> that is “semantically similar” to the target <italic>x = Romeo</italic>. The candidate <italic>y</italic> with the highest cosine for the CBOW model is <italic>you</italic>: The terms <italic>you</italic> and <italic>Romeo</italic> are near-synonyms, that is “interchangeable in some contexts” [<xref ref-type="bibr" rid="ref38">38</xref>]. Hence, the answer to Q1 is “yes.”</p>
          </list-item>
          <list-item>
            <p>Answer to Q2: We applied the 3CosAdd formula 2, where the target <italic>x = Romeo</italic> provides the semantic context. The terms <italic>die = z1</italic> and <italic>died = z2</italic> from the corpus are representative of inflectional morphology <italic>infinitive:past</italic>. The search query <italic>–x +z1 +z2</italic> is posed to the CBOW model, that is “find the term <italic>y</italic>, which is similar to <italic>die</italic> and <italic>died</italic>, while different from <italic>Romeo</italic>”. Candidate <italic>y</italic> with the highest 3CosAdd is “<italic>dagger</italic>.” The term <italic>dagger</italic> belongs to the semantic field <italic>death</italic> as “dagger is an instrument that causes death”; thus, the candidate inference is true. Hence, the answer to Q2 is also “yes.”</p>
          </list-item>
        </list>
        <sec>
          <title>Stage 1: Knowledge Acquisition (Acquisition of Domain-Specific Terms)</title>
          <p>The PubMed systematic reviews (in <xref rid="figure1" ref-type="fig">Figure 1</xref>) [<xref ref-type="bibr" rid="ref16">16</xref>] is an evidence-based searching filter “AND (systematic [sb])”, intended for retrieving “best evidence” information sources from PubMed/MEDLINE [<xref ref-type="bibr" rid="ref32">32</xref>] such as Cochrane systematic reviews [<xref ref-type="bibr" rid="ref39">39</xref>]. Health care–related institutions such as the World Health Organization promote PubMed searches with this filter (examples in Prevention and Control of Noncommunicable Diseases: Guidelines for Primary Health Care in Low Resource Settings [<xref ref-type="bibr" rid="ref40">40</xref>]).</p>
          <p>This study used a subset of PubMed systematic reviews [<xref ref-type="bibr" rid="ref16">16</xref>] of 301,201 PubMed/MEDLINE publications (titles and available abstracts), called the PubMed systematic reviews subset (PMSB dataset). The preprocessing of the input text for the PMSB dataset and the hyperparameter configuration for Skip-gram and CBOW are identical to those in our previous study [<xref ref-type="bibr" rid="ref41">41</xref>] and detailed in the study by Arguello Casteleiro et al [<xref ref-type="bibr" rid="ref42">42</xref>].</p>
          <p>From the PMSB dataset, a total of 423K n-grams with a frequency count &#62;5 have vector representations in both models, that is CBOW and Skip-gram. We considered “good” the Skip-gram and CBOW embeddings created in our previous study [<xref ref-type="bibr" rid="ref41">41</xref>] as they both perform well (using conventional evaluation measure precision [<xref ref-type="bibr" rid="ref43">43</xref>]) in semantic similarity and relatedness tasks with the cosine formula. The n-gram <italic>z</italic> reused in this study (ie, z1 and z2) is from our previous study [<xref ref-type="bibr" rid="ref41">41</xref>].</p>
        </sec>
      </sec>
      <sec>
        <title>Applying the 3CosAdd Formula to Acquire the Top 12 Ranked Term Pairs (x,y): A 4-Term Analogy</title>
        <p>To address Q3 and apply the 3CosAdd formula 2, 2 n-gram pairs (disease <italic>x</italic>,treatment <italic>z</italic>) from our previous study (prior knowledge) [<xref ref-type="bibr" rid="ref41">41</xref>] were needed. We kept only the 12 top-ranked candidate n-grams <italic>y</italic> for the 3CosAdd formula, that is, the 12-candidate <italic>y</italic> with CBOW and Skip-gram embeddings yielding the highest 3CosAdd values. We limited the list of candidates to 12, similar to Arguello Casteleiro et al [<xref ref-type="bibr" rid="ref42">42</xref>], and following cognitive theories like Novak JD and Cañas AJ [<xref ref-type="bibr" rid="ref44">44</xref>].</p>
        <sec>
          <title>Stage 2: Knowledge Organization (Explicit Conceptualization of the Meaning of Terms)</title>
          <p>This stage accomplishes a named entity recognition (NER) [<xref ref-type="bibr" rid="ref45">45</xref>] task involving 3 domain experts (2 biomedical terminologists and 1 medical consultant who performs clinical coding). Every UMLS Metathesaurus concept has a concept unique identifier (CUI) and at least one UMLS Semantic Type (broad category) [<xref ref-type="bibr" rid="ref30">30</xref>] assigned. The NER task consists of 3 sequential subtasks (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>):</p>
          <list list-type="bullet">
            <list-item>
              <p>First, disambiguation of n-grams <italic>y</italic> is difficult to interpret for being truncated strings of characters or containing short forms (eg, abbreviations or acronyms). String searches in the PMSB dataset and the web search the sense inventory, Allie [<xref ref-type="bibr" rid="ref46">46</xref>], enabling disambiguation.</p>
            </list-item>
            <list-item>
              <p>Second, the manual binary classification of candidate n-gram <italic>y</italic> as to whether it belongs to the semantic field Tx (ie, <italic>y<sub>Tx</sub></italic>). Following Artstein R and Poesio M [<xref ref-type="bibr" rid="ref47">47</xref>], we reported the interrater agreement with a Krippendorff alpha [<xref ref-type="bibr" rid="ref48">48</xref>].</p>
            </list-item>
            <list-item>
              <p>Third, entity normalization (grounding) [<xref ref-type="bibr" rid="ref49">49</xref>] with MetaMap [<xref ref-type="bibr" rid="ref50">50</xref>], where 3 domain experts apply the NER guidelines for MetaMap's output [<xref ref-type="bibr" rid="ref51">51</xref>] and together judge the automatic mapping of n-grams <italic>y<sub>Tx</sub></italic> to UMLS Metathesaurus concepts <italic>Y<sub>Tx</sub></italic>. MetaMap performance is calculated using precision, recall, and F-measure [<xref ref-type="bibr" rid="ref43">43</xref>,<xref ref-type="bibr" rid="ref52">52</xref>].</p>
            </list-item>
          </list>
          <p>We took n1 as the number of different UMLS Metathesaurus concepts (represented as Z1 and Z2) mapped as <italic>z1</italic> and <italic>z2</italic> in the search query. Once the NER task was completed, we obtained the <italic>NER winners</italic>. An <italic>NER winner</italic> was a search query <italic>-x +z1 +z2</italic> with the maximum observed number for n2 or n3:</p>
          <list list-type="bullet">
            <list-item>
              <p>n2 is the number of different 12 top-ranked candidate n-grams <italic>y</italic> belonging to Tx, that is, the number of <italic>y<sub>Tx</sub></italic>.</p>
            </list-item>
            <list-item>
              <p>n3 is the number of different UMLS Metathesaurus concepts <italic>Y<sub>Tx</sub></italic> excluding Z1 and Z2.</p>
            </list-item>
          </list>
        </sec>
        <sec>
          <title>Stage 3: Knowledge Validation (Validating Statements)</title>
          <p>We sought evidence for the Metathesaurus concept pairs (<italic>X,Y<sub>Tx</sub></italic>) acquired previously to determine the therapeutic intent of candidate <italic>Y<sub>Tx</sub></italic> for target disease <italic>X</italic>, where <italic>X</italic> was the UMLS Metathesaurus concept mapped to n-gram <italic>x</italic>.</p>
          <p>The same 3 domain experts from Stage 2 triaged the results of manual literature searches considering the following:</p>
          <list list-type="order">
            <list-item>
              <p>The type of evidence-based information sources, seeking the “best evidence.” Evidence-based medicine [<xref ref-type="bibr" rid="ref53">53</xref>] categorizes and ranks different types of clinical evidence [<xref ref-type="bibr" rid="ref1">1</xref>]. For example, the Cochrane systematic reviews are at the forefront of “best evidence” [<xref ref-type="bibr" rid="ref1">1</xref>], whereas studies of the physiological functions and clinicians’ observations are considered evidence of least value [<xref ref-type="bibr" rid="ref1">1</xref>].</p>
            </list-item>
            <list-item>
              <p>The publication date, seeking the “most recent papers published.”</p>
            </list-item>
          </list>
          <p>The 3 domain experts introduced 6 evidence-based categories to further refine the correlations between the semantic field <italic>disease</italic> and <italic>treatment</italic> (Tx). <xref ref-type="table" rid="table1">Table 1</xref> illustrates them with examples of evidence (quoted text) and references for the UMLS Metathesaurus concepts <italic>Y<sub>Tx</sub></italic> related to the target concept disease <italic>X</italic>=“C024302&#124;Sepsis” with CUI=C024302. The rationale for the 7 evidence-based categories introduced is as follows:</p>
          <list list-type="bullet">
            <list-item>
              <p>The name of 4 of the evidence-based categories (top rows in <xref ref-type="table" rid="table1">Table 1</xref>) resembles the categories “beneficial, likely beneficial, no known benefit, harmful” for health care interventions from the decommissioned BMJ Clinical Evidence (predecessor of BMJ Best Practice [<xref ref-type="bibr" rid="ref31">31</xref>]).</p>
            </list-item>
            <list-item>
              <p>The evidence-based category “Tx ingredient” acknowledges that a complex treatment may have parts, that is “partitive relationships” [<xref ref-type="bibr" rid="ref54">54</xref>].</p>
            </list-item>
            <list-item>
              <p>The evidence-based category “correlation” captures “spontaneous unplanned inferences” [<xref ref-type="bibr" rid="ref6">6</xref>].</p>
            </list-item>
            <list-item>
              <p>The evidence-based category “general medical term” includes broad concepts of little value for clinicians that do not need further evidence (quotes and references).</p>
            </list-item>
          </list>
          <p>This study distinguishes between <italic>NER winners</italic> (maximum observed number for n2 or n3 in Stage 2) and <italic>clinical winners</italic>. A <italic>clinical winner</italic> is a search query <italic>-x +z1 +z2</italic> (a type of 4-term analogy) for target disease <italic>x</italic> with a maximum observed value for n4, that is, the number of different concepts <italic>Y<sub>Tx</sub></italic> (excluding Z1 and Z2) assigned to the evidence-based category “Tx with therapeutic effect.”</p>
          <p>To audit the evidence-based categories assigned along with the evidence collected (quotes and references) for the concept pairs (<italic>X,Y<sub>Tx</sub></italic>), 2 more observers (O1 a medical consultant and O2 a BMJ health informatician who works with BMJ Best Practice content and has a junior doctor background) were asked to express agreement or disagreement with the evidence for the concept pairs (<italic>X,Y<sub>Tx</sub></italic>). <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> has the evaluation guidelines given to the observers. Cohen kappa [<xref ref-type="bibr" rid="ref55">55</xref>] was used to measure interobserver agreement.</p>
          <table-wrap position="float" id="table1">
            <label>Table 1</label>
            <caption>
              <p>Evidence from the literature searches, that is quoted text and reference, for unified medical language system Metathesaurus concept pairs (X, Y<sub>Tx</sub>) with X=C0243026&#124;Sepsis.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="280"/>
              <col width="230"/>
              <col width="490"/>
              <thead>
                <tr valign="top">
                  <td>Candidate concept <italic>Y</italic><sub><italic>Tx</italic></sub>; UMLS CUI&#124;Concept name<sup>a</sup></td>
                  <td>Evidence-based categories for concept <italic>Y</italic><sub><italic>Tx</italic></sub> correlated with concept <italic>X</italic></td>
                  <td>Evidence (quoted text) [evidence source] [citation]</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td>C0056562&#124;crystalloid solutions</td>
                  <td>Tx with therapeutic effect</td>
                  <td>“Step-by-step treatment approach: ... Administer 30 mL/kg crystalloid for hypotension or lactate ≥4 mmol/L (≥36 mg/dL)” [BMJ BP topic: 245] [<xref ref-type="bibr" rid="ref14">14</xref>]</td>
                </tr>
                <tr valign="top">
                  <td>C0001617&#124;Adrenal Cortex Hormones</td>
                  <td>Tx with uncertain therapeutic effect</td>
                  <td>“Step-by-step treatment approach: Adjunctive therapies ... evidence for giving corticosteroids to patients with sepsis or septic shock is mixed.” [BMJ BP topic: 245] [<xref ref-type="bibr" rid="ref14">14</xref>]</td>
                </tr>
                <tr valign="top">
                  <td>C0020352&#124;Hetastarch</td>
                  <td>Tx with unwanted or adverse effects (ie, nontherapeutic)</td>
                  <td>“Step-by-step treatment approach: Fluid resuscitation ... HES solutions for infusion have been significantly restricted across the European Union and are contraindicated in critically ill patients and those with sepsis or renal impairment.” [BMJ BP topic: 245] [<xref ref-type="bibr" rid="ref14">14</xref>]</td>
                </tr>
                <tr valign="top">
                  <td>C0677850&#124;Adjuvant therapy</td>
                  <td>Potential Tx (under research and development)</td>
                  <td>“Adjuvant immune therapy to manipulate the hyper-inflammatory and/or immune-suppressive phase of sepsis is an attractive therapeutic option, which may improve outcome and ease the burden of antimicrobial resistance. However, before this can become a clinical reality, we must recognise that sepsis is a clinical syndrome, where significant heterogeneity exists.” [PMID: 30515242] [<xref ref-type="bibr" rid="ref56">56</xref>]</td>
                </tr>
                <tr valign="top">
                  <td>C3273371&#124;CD4 Positive Memory T-Lymphocyte</td>
                  <td>Tx ingredient</td>
                  <td>“Administration of immune-modulatory therapy is a promising treatment approach for treating sepsis survivors. … these therapies can improve pathogen clearance, increase CD4 T cell responsiveness, and promote survival in sepsis.” [PMID: 24791959] [<xref ref-type="bibr" rid="ref57">57</xref>]</td>
                </tr>
                <tr valign="top">
                  <td>C0745442&#124;Intravenous Catheters</td>
                  <td>Tx ingredient</td>
                  <td>“Recommendations: Monitoring ... Central venous catheters will be required to ensure reliable delivery of vasoactive medication.” [BMJ BP topic: 245] [<xref ref-type="bibr" rid="ref14">14</xref>]</td>
                </tr>
                <tr valign="top">
                  <td>C0812144&#124;Medication administration: epidural</td>
                  <td>Correlation (epidural → potential sites of infection: epidural sites → sepsis: investigations)</td>
                  <td>“Investigations to identify causative organisms: ... If no localising signs are present, examination and culture of all potential sites of infection including wounds, catheters, prosthetic implants, epidural sites, and pleural or peritoneal fluid, as indicated by the clinical presentation and history, is required.” [BMJ BP topic: 245] [<xref ref-type="bibr" rid="ref14">14</xref>]</td>
                </tr>
                <tr valign="top">
                  <td>C0013227&#124;Pharmaceutical Preparations</td>
                  <td>General medical term</td>
                  <td>—<sup>b</sup></td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table1fn1">
                <p><sup>a</sup>The references shown are either the PubMed identifier (PMID) or the topic number in BMJ Best Practice (“BMJ BP topic” for short).</p>
              </fn>
              <fn id="table1fn2">
                <p><sup>b</sup>The evidence-based category “general medical term” has no evidence (quoted text).</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
        </sec>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <p>We obtained 5352 n-gram pairs from 446 search queries by applying the 3CosAdd formula and taking the top 12 values. These are presented in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref> (worksheet Stage 1). These n-gram pairs are enriched with domain knowledge meaning (Stage 2) and the biomedical evidence found from literature searches is ratified with an audit (Stage 3).</p>
      <sec>
        <title>Stage 1: Knowledge Acquisition (Acquisition of Domain-Specific Terms)</title>
        <p>To apply the 3CosAdd formula (and systematic creation of search queries), we reused 63 unique n-gram pairs (<italic>x,z</italic>) from our previous study [<xref ref-type="bibr" rid="ref41">41</xref>] (open-access [<xref ref-type="bibr" rid="ref29">29</xref>]). Every reused n-gram <italic>z</italic> was mapped to the UMLS concept <italic>Z</italic> with the UMLS Semantic Type “T061&#124;Therapeutic or Preventive Procedure” or “T121&#124;Pharmacologic Substance.” <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> has the UMLS CUI pairs (<italic>X,Z</italic>).</p>
        <sec>
          <title>Applying the 3CosAdd Formula to Acquire the Top 12 Ranked Term Pairs (x,y): A 4-Term Analogy</title>
          <p>With 63 n-gram pairs (<italic>x,z</italic>), we built 223 search queries <italic>-x +z1 +z2</italic> for the 3CosAdd formula. <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref> (worksheet Stage 1) contains the 223 search queries and the 5352 (<italic>x,y</italic>) n-gram pairs for 10 target diseases <italic>x</italic>, that is, the 12 top-ranked n-grams (highest 3CosAdd value) obtained per search query from the CBOW and Skip-gram embeddings. An n-gram pair with <italic>y</italic> as a non-ASCII character was discarded.</p>
        </sec>
      </sec>
      <sec>
        <title>Stage 2: Knowledge Organization (Explicit Conceptualization of the Meaning of Terms)</title>
        <p>Different search queries brought the same (target <italic>x</italic>,candidate <italic>y</italic>) n-gram pairs from applying the 3CosAdd formula. <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref> (worksheet Stage 2) has 1935 unique (<italic>x,y</italic>) n-gram pairs from the 5352 n-gram pairs. Among the 1935 unique (<italic>x,y</italic>) n-gram pairs, there were 954 n-gram pairs (<italic>x,y<sub>Tx</sub></italic>) with candidate <italic>y</italic> belonging to Tx. The Krippendorff alpha [<xref ref-type="bibr" rid="ref48">48</xref>] was 0.86 for the 3 domain experts for the binary classification (Tx or non-Tx). Considering all candidates <italic>y<sub>Tx</sub></italic> mapped to <italic>Y<sub>Tx</sub></italic> for the 10 diseases (microaveraging) [<xref ref-type="bibr" rid="ref43">43</xref>], MetaMap had an F-measure=80.00% with precision=77.00% and recall=83.25%. <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> has the detailed results for NER subtasks, including an investigation of the UMLS semantic types for <italic>Y<sub>Tx</sub></italic>.</p>
        <p><xref ref-type="table" rid="table2">Table 2</xref> contains the <italic>NER winners</italic>, that is, the search query <italic>-x +z1 +z2</italic> for the 3CosAdd formula per model and disease target <italic>x</italic> having the maximum observed values for n2 or n3.</p>
        <list list-type="bullet">
          <list-item>
            <p>The maximum observed value for n2 was the highest possible value, that is, n2=12, for both CBOW and Skip-gram.</p>
          </list-item>
          <list-item>
            <p>The maximum observed value for n3 was for the search query, <italic>−epilepsy +valproate +AED</italic>. However, the number of different <italic>Y<sub>Tx</sub></italic> (excluding Z1 and Z2) differed, that is, n3=11 for Skip-gram and n3=10 for CBOW.</p>
          </list-item>
        </list>
      </sec>
      <sec>
        <title>Stage 3: Knowledge Validation (Validating Statements)</title>
        <p><xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref> (worksheet Stage 3) has the 569 unique UMLS Metathesaurus concept pairs (<italic>X,Y<sub>Tx</sub></italic>) mapped to the unique 954 n-gram pairs (<italic>x,y<sub>Tx</sub></italic>). Although the UMLS related concepts table (file=MRREL) [<xref ref-type="bibr" rid="ref58">58</xref>] contains relationships asserted by source vocabularies between CUI pairs, only 68 of the 569 CUI pairs appeared within the MRREL table of 2019AA UMLS release.</p>
        <p>Manual searches in the literature proved to be time-consuming and labor-intensive; thus, not all the concept pairs for the target disease anemia and hypertension had evidence. Hence, we limited the study to 408 UMLS CUI pairs (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>), and only 59 of these were within the MRREL table (column J of <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref> worksheet Stage 3).</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>NER winners per target disease x (search query -x +z1 +z2) for the 3CosAdd formula, that is, the highest value for n2 or n3 per model and per disease target x.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="120"/>
            <col width="80"/>
            <col width="50"/>
            <col width="50"/>
            <col width="330"/>
            <col width="250"/>
            <col width="40"/>
            <col width="40"/>
            <col width="40"/>
            <thead>
              <tr valign="top">
                <td>Disease target <italic>x</italic></td>
                <td>Model</td>
                <td>NER max (n2)</td>
                <td>NER max (n3)</td>
                <td>Treatment <italic>z1</italic> search query</td>
                <td>Treatment <italic>z2</italic> search query</td>
                <td>n1</td>
                <td>n2</td>
                <td>n3</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>heart_failure</td>
                <td>CBOW<sup>a</sup></td>
                <td>Yes</td>
                <td>N/A<sup>b</sup></td>
                <td>angiotensin-converting_enzyme_(ACE)_inhibitors</td>
                <td>aldosterone_antagonists</td>
                <td>2</td>
                <td>12</td>
                <td>6</td>
              </tr>
              <tr valign="top">
                <td>heart_failure</td>
                <td>CBOW</td>
                <td>N/A</td>
                <td>Yes</td>
                <td>cardiac_resynchronization_therapy_(CRT)</td>
                <td>aldosterone_antagonists</td>
                <td>2</td>
                <td>10</td>
                <td>9</td>
              </tr>
              <tr valign="top">
                <td>heart_failure</td>
                <td>Skip-gram</td>
                <td>Yes</td>
                <td>Yes</td>
                <td>beta-blockers</td>
                <td>aldosterone_antagonists</td>
                <td>2</td>
                <td>12</td>
                <td>8</td>
              </tr>
              <tr valign="top">
                <td>glaucoma</td>
                <td>CBOW</td>
                <td>Yes</td>
                <td>Yes</td>
                <td>trabeculectomy</td>
                <td>cataract_surgery</td>
                <td>2</td>
                <td>5</td>
                <td>5</td>
              </tr>
              <tr valign="top">
                <td>glaucoma</td>
                <td>Skip-gram</td>
                <td>Yes</td>
                <td>Yes</td>
                <td>trabeculectomy</td>
                <td>cataract_surgery</td>
                <td>2</td>
                <td>10</td>
                <td>6</td>
              </tr>
              <tr valign="top">
                <td>CKD<sup>c</sup></td>
                <td>CBOW</td>
                <td>Yes</td>
                <td>Yes</td>
                <td>not_requiring_dialysis</td>
                <td>dialysis</td>
                <td>1</td>
                <td>9</td>
                <td>7</td>
              </tr>
              <tr valign="top">
                <td>CKD</td>
                <td>Skip-gram</td>
                <td>Yes</td>
                <td>Yes</td>
                <td>not_requiring_dialysis</td>
                <td>dialysis</td>
                <td>1</td>
                <td>8</td>
                <td>5</td>
              </tr>
              <tr valign="top">
                <td>diabetes</td>
                <td>CBOW</td>
                <td>Yes</td>
                <td>Yes</td>
                <td>glucose_variability</td>
                <td>glucagon-like_peptide-1_receptor_agonists</td>
                <td>2</td>
                <td>10</td>
                <td>6</td>
              </tr>
              <tr valign="top">
                <td>diabetes</td>
                <td>Skip-gram</td>
                <td>Yes</td>
                <td>Yes</td>
                <td>glucose_variability</td>
                <td>glucagon-like_peptide-1_receptor_agonists</td>
                <td>2</td>
                <td>10</td>
                <td>5</td>
              </tr>
              <tr valign="top">
                <td>asthma</td>
                <td>CBOW</td>
                <td>Yes</td>
                <td>N/A</td>
                <td>inhaled_corticosteroid</td>
                <td>LABAs<sup>d</sup></td>
                <td>2</td>
                <td>11</td>
                <td>6</td>
              </tr>
              <tr valign="top">
                <td>asthma</td>
                <td>CBOW</td>
                <td>N/A</td>
                <td>Yes</td>
                <td>inhaled_corticosteroids</td>
                <td>inhaled_corticosteroid</td>
                <td>1</td>
                <td>10</td>
                <td>8</td>
              </tr>
              <tr valign="top">
                <td>asthma</td>
                <td>Skip-gram</td>
                <td>Yes</td>
                <td>Yes</td>
                <td>anti-LTs</td>
                <td>LABAs</td>
                <td>2</td>
                <td>12</td>
                <td>8</td>
              </tr>
              <tr valign="top">
                <td>epilepsy</td>
                <td>CBOW</td>
                <td>Yes</td>
                <td>Yes</td>
                <td>valproate</td>
                <td>AED<sup>e</sup></td>
                <td>2</td>
                <td>12</td>
                <td>10</td>
              </tr>
              <tr valign="top">
                <td>epilepsy</td>
                <td>Skip-gram</td>
                <td>Yes</td>
                <td>Yes</td>
                <td>valproate</td>
                <td>AED</td>
                <td>2</td>
                <td>12</td>
                <td>11</td>
              </tr>
              <tr valign="top">
                <td>arthritis</td>
                <td>CBOW</td>
                <td>Yes</td>
                <td>Yes</td>
                <td>plus_methotrexate</td>
                <td>methotrexate</td>
                <td>1</td>
                <td>12</td>
                <td>9</td>
              </tr>
              <tr valign="top">
                <td>arthritis</td>
                <td>Skip-gram</td>
                <td>Yes</td>
                <td>Yes</td>
                <td>methotrexate</td>
                <td>DMARDs<sup>f</sup></td>
                <td>2</td>
                <td>11</td>
                <td>6</td>
              </tr>
              <tr valign="top">
                <td>osteoarthritis</td>
                <td>CBOW</td>
                <td>N/A</td>
                <td>Yes</td>
                <td>hyaluronic_acid</td>
                <td>glucosamine</td>
                <td>2</td>
                <td>8</td>
                <td>9</td>
              </tr>
              <tr valign="top">
                <td>osteoarthritis</td>
                <td>CBOW</td>
                <td>Yes</td>
                <td>N/A</td>
                <td>knee_arthroplasty</td>
                <td>hyaluronic_acid</td>
                <td>2</td>
                <td>9</td>
                <td>7</td>
              </tr>
              <tr valign="top">
                <td>osteoarthritis</td>
                <td>CBOW</td>
                <td>N/A</td>
                <td>Yes</td>
                <td>vs_acetaminophen</td>
                <td>glucosamine</td>
                <td>2</td>
                <td>8</td>
                <td>9</td>
              </tr>
              <tr valign="top">
                <td>osteoarthritis</td>
                <td>Skip-gram</td>
                <td>Yes</td>
                <td>Yes</td>
                <td>vs_acetaminophen</td>
                <td>hyaluronic_acid</td>
                <td>2</td>
                <td>11</td>
                <td>8</td>
              </tr>
              <tr valign="top">
                <td>anaemia</td>
                <td>CBOW</td>
                <td>Yes</td>
                <td>Yes</td>
                <td>iron</td>
                <td>erythropoiesis-stimulating_agents</td>
                <td>2</td>
                <td>11</td>
                <td>9</td>
              </tr>
              <tr valign="top">
                <td>anaemia</td>
                <td>Skip-gram</td>
                <td>Yes</td>
                <td>N/A</td>
                <td>blood_transfusions</td>
                <td>ESAs<sup>g</sup></td>
                <td>2</td>
                <td>12</td>
                <td>6</td>
              </tr>
              <tr valign="top">
                <td>anaemia</td>
                <td>Skip-gram</td>
                <td>N/A</td>
                <td>Yes</td>
                <td>recombinant_human_erythropoietin</td>
                <td>iron</td>
                <td>2</td>
                <td>11</td>
                <td>8</td>
              </tr>
              <tr valign="top">
                <td>hypertension</td>
                <td>CBOW</td>
                <td>Yes</td>
                <td>N/A</td>
                <td>antihypertensive_drugs</td>
                <td>angiotensin_receptor_blockers</td>
                <td>2</td>
                <td>12</td>
                <td>6</td>
              </tr>
              <tr valign="top">
                <td>hypertension</td>
                <td>CBOW</td>
                <td>N/A</td>
                <td>Yes</td>
                <td>antihypertensive_therapy</td>
                <td>antihypertensive</td>
                <td>2</td>
                <td>11</td>
                <td>8</td>
              </tr>
              <tr valign="top">
                <td>hypertension</td>
                <td>Skip-gram</td>
                <td>Yes</td>
                <td>Yes</td>
                <td>antihypertensive_drug_classes</td>
                <td>antihypertensive</td>
                <td>1</td>
                <td>12</td>
                <td>10</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>CBOW: Continuous Bag-of-Words.</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>N/A: not applicable.</p>
            </fn>
            <fn id="table2fn3">
              <p><sup>c</sup>CKD: chronic kidney disease.</p>
            </fn>
            <fn id="table2fn4">
              <p><sup>d</sup>LABA: long-acting beta2-agonist.</p>
            </fn>
            <fn id="table2fn5">
              <p><sup>e</sup>AED: antiepileptic drug.</p>
            </fn>
            <fn id="table2fn6">
              <p><sup>f</sup>DMARD: disease-modifying antirheumatic drug.</p>
            </fn>
            <fn id="table2fn7">
              <p><sup>g</sup>ESA: erythropoiesis-stimulating agent.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p><xref ref-type="table" rid="table3">Table 3</xref> shows the 7 evidence-based categories assigned to the 408 UMLS CUI pairs investigated thoroughly. There are 19 concept pairs (<italic>X,Y<sub>Tx</sub></italic>) with more than 1 evidence-based category, such as the concept pair (<italic>X</italic>=C0014544&#124;Epilepsy,<italic>Y<sub>Tx</sub></italic>=C0080356&#124;Valproate). The evidence-based category “Tx with therapeutic effect” has the highest number of CUI pairs, with 190 pairs (<italic>X,Y<sub>Tx</sub></italic>), where 117 pairs have evidence (quotes) taken from BMJ Best Practice. The evidence-based category “correlation” has the highest number of evidence-based information sources with 108 uniform resource identifiers of the total 238. <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> has further details.</p>
        <p>Table 4 shows the <italic>clinical winners</italic>, that is, search query -x +z1 +z2 (a type of 4-term analogy) with the maximum observed number for n4 per target disease x. <xref ref-type="table" rid="table4">Table 4</xref> reveals that an <italic>NER winner</italic> is not necessarily a <italic>clinical winner</italic>, that is, the maximum observed value for n4 does not always correspond to the maximum observed value for n3 or n2.</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>The 408 unified medical language system concept unique identifier pairs investigated thoroughly and their evidence-based information sources per evidence-based category.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="310"/>
            <col width="130"/>
            <col width="300"/>
            <col width="260"/>
            <thead>
              <tr valign="top">
                <td>Evidence-based categories for concept Y<sub>Tx</sub> correlated with concept X</td>
                <td>Number of CUI<sup>a</sup> pairs</td>
                <td>Number of evidence-based information sources (ie, URIs<sup>b</sup>) for CUI pairs</td>
                <td>Number of CUI pairs with BMJ Best Practice as evidence source</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Tx with therapeutic effect</td>
                <td>190</td>
                <td>73</td>
                <td>117</td>
              </tr>
              <tr valign="top">
                <td>Tx with uncertain therapeutic effect</td>
                <td>38</td>
                <td>22</td>
                <td>11</td>
              </tr>
              <tr valign="top">
                <td>Tx with unwanted or adverse effects (ie, nontherapeutic)</td>
                <td>52</td>
                <td>41</td>
                <td>17</td>
              </tr>
              <tr valign="top">
                <td>Potential Tx (under research and development)</td>
                <td>5</td>
                <td>5</td>
                <td>0</td>
              </tr>
              <tr valign="top">
                <td>Tx ingredient</td>
                <td>22</td>
                <td>21</td>
                <td>6</td>
              </tr>
              <tr valign="top">
                <td>General medical term</td>
                <td>26</td>
                <td>0</td>
                <td>0</td>
              </tr>
              <tr valign="top">
                <td>Correlation</td>
                <td>94</td>
                <td>108</td>
                <td>19</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>CUI: concept unique identifier.</p>
            </fn>
            <fn id="table3fn2">
              <p><sup>b</sup>URI: Universal Resource Identifier.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>In <xref ref-type="table" rid="table4">Table 4</xref>, there are two rows that are not <italic>clinical winners</italic> according to the observer O2. All rows except two are <italic>clinical winners</italic> according to the 3 domain experts and both observers.</p>
        <p>Considering the 408 concept pairs (<italic>X,Y<sub>Tx</sub></italic>) with evidence, observer O1 disagrees with 25 of them, and observer O2 disagrees with 26 of them. The Cohen kappa of −0.023 is paradoxical [<xref ref-type="bibr" rid="ref59">59</xref>-<xref ref-type="bibr" rid="ref61">61</xref>], resolved in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> following Cicchetti DV and Feinstein AR [<xref ref-type="bibr" rid="ref61">61</xref>].</p>
        <p><xref ref-type="table" rid="table5">Table 5</xref> shows how the evidence-based category “Tx with therapeutic effect” assigned by an observer (when in disagreement) affects the <italic>clinical winners</italic> from <xref ref-type="table" rid="table4">Table 4</xref>. For observer O1, the only change was a decrease of n4 from 5 (<xref ref-type="table" rid="table4">Table 4</xref>) to 4 (<xref ref-type="table" rid="table5">Table 5</xref>) in the search query, <italic>−anaemia +recombinant_human_erythropoietin +iron</italic>, for Skip-gram. The observer O2 provided additional therapeutic evidence from BMJ Best Practice when in disagreement, typically increasing n4 or making “new” <italic>clinical winner</italic>s (eg, search query, <italic>−epilepsy +valproate +levetiracetam</italic>).</p>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>Clinical winners (highest value of n4) per model and disease target x considering the 3 domain experts.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="120"/>
            <col width="70"/>
            <col width="60"/>
            <col width="50"/>
            <col width="340"/>
            <col width="200"/>
            <col width="40"/>
            <col width="40"/>
            <col width="40"/>
            <col width="40"/>
            <thead>
              <tr valign="top">
                <td>Disease target <italic>x</italic></td>
                <td>Model</td>
                <td>NER max (n2)</td>
                <td>NER max (n3)</td>
                <td>Treatment <italic>z1</italic> search query</td>
                <td>Treatment <italic>z2</italic> search query</td>
                <td>n1</td>
                <td>n2</td>
                <td>n3</td>
                <td>n4</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>heart_failure</td>
                <td>CBOW<sup>a</sup></td>
                <td>—</td>
                <td>Yes</td>
                <td>cardiac_resynchronization_therapy_(CRT)</td>
                <td>aldosterone_antagonists</td>
                <td>2</td>
                <td>10</td>
                <td>9</td>
                <td>6</td>
              </tr>
              <tr valign="top">
                <td>heart_failure</td>
                <td>Skip-gram</td>
                <td>Yes</td>
                <td>Yes</td>
                <td>beta-blockers</td>
                <td>aldosterone_antagonists</td>
                <td>2</td>
                <td>12</td>
                <td>8</td>
                <td>5</td>
              </tr>
              <tr valign="top">
                <td>glaucoma</td>
                <td>CBOW</td>
                <td>Yes</td>
                <td>Yes</td>
                <td>trabeculectomy</td>
                <td>cataract_surgery</td>
                <td>2</td>
                <td>5</td>
                <td>5</td>
                <td>3</td>
              </tr>
              <tr valign="top">
                <td>glaucoma</td>
                <td>Skip-gram</td>
                <td>Yes</td>
                <td>Yes</td>
                <td>trabeculectomy</td>
                <td>cataract_surgery</td>
                <td>2</td>
                <td>10</td>
                <td>6</td>
                <td>3</td>
              </tr>
              <tr valign="top">
                <td>CKD<sup>b</sup></td>
                <td>CBOW</td>
                <td>Yes</td>
                <td>Yes</td>
                <td>not_requiring_dialysis</td>
                <td>dialysis</td>
                <td>1</td>
                <td>9</td>
                <td>7</td>
                <td>5</td>
              </tr>
              <tr valign="top">
                <td>CKD</td>
                <td>Skip-gram</td>
                <td>Yes</td>
                <td>Yes</td>
                <td>not_requiring_dialysis</td>
                <td>dialysis</td>
                <td>1</td>
                <td>8</td>
                <td>5</td>
                <td>5</td>
              </tr>
              <tr valign="top">
                <td>diabetes</td>
                <td>CBOW</td>
                <td>Yes</td>
                <td>Yes</td>
                <td>glucose_variability</td>
                <td>glucagon-like_peptide-1_receptor_agonists</td>
                <td>2</td>
                <td>10</td>
                <td>6</td>
                <td>6</td>
              </tr>
              <tr valign="top">
                <td>diabetes</td>
                <td>Skip-gram</td>
                <td>Yes</td>
                <td>Yes</td>
                <td>glucose_variability</td>
                <td>glucagon-like_peptide-1_receptor_agonists</td>
                <td>2</td>
                <td>10</td>
                <td>5</td>
                <td>4</td>
              </tr>
              <tr valign="top">
                <td>asthma</td>
                <td>CBOW</td>
                <td>—</td>
                <td>Yes</td>
                <td>inhaled_corticosteroids</td>
                <td>inhaled_corticosteroid</td>
                <td>1</td>
                <td>10</td>
                <td>8</td>
                <td>8</td>
              </tr>
              <tr valign="top">
                <td>asthma</td>
                <td>Skip-gram</td>
                <td>—</td>
                <td>—</td>
                <td>inhaled_corticosteroids</td>
                <td>inhaled_corticosteroid</td>
                <td>1</td>
                <td>11</td>
                <td>8</td>
                <td>7</td>
              </tr>
              <tr valign="top">
                <td>epilepsy</td>
                <td>CBOW</td>
                <td>—</td>
                <td>—</td>
                <td>valproate</td>
                <td>antiepileptic_drug</td>
                <td>2</td>
                <td>11</td>
                <td>10</td>
                <td>8</td>
              </tr>
              <tr valign="top">
                <td>epilepsy</td>
                <td>CBOW</td>
                <td>—</td>
                <td>—</td>
                <td>valproate</td>
                <td>antiepileptic_drugs</td>
                <td>2</td>
                <td>11</td>
                <td>10</td>
                <td>8</td>
              </tr>
              <tr valign="top">
                <td>epilepsy<sup>c</sup></td>
                <td>Skip-gram</td>
                <td>Yes</td>
                <td>Yes</td>
                <td>valproate</td>
                <td>AED<sup>d</sup></td>
                <td>2</td>
                <td>12</td>
                <td>11</td>
                <td>7</td>
              </tr>
              <tr valign="top">
                <td>arthritis</td>
                <td>CBOW</td>
                <td>Yes</td>
                <td>Yes</td>
                <td>plus_methotrexate</td>
                <td>methotrexate</td>
                <td>1</td>
                <td>12</td>
                <td>9</td>
                <td>2</td>
              </tr>
              <tr valign="top">
                <td>arthritis<sup>c</sup></td>
                <td>Skip-gram</td>
                <td>—</td>
                <td>—</td>
                <td>plus_methotrexate</td>
                <td>methotrexate</td>
                <td>1</td>
                <td>7</td>
                <td>4</td>
                <td>2</td>
              </tr>
              <tr valign="top">
                <td>osteoarthritis</td>
                <td>CBOW</td>
                <td>Yes</td>
                <td>—</td>
                <td>knee_arthroplasty</td>
                <td>hyaluronic_acid</td>
                <td>2</td>
                <td>9</td>
                <td>7</td>
                <td>5</td>
              </tr>
              <tr valign="top">
                <td>osteoarthritis</td>
                <td>Skip-gram</td>
                <td>—</td>
                <td>—</td>
                <td>vs_acetaminophen</td>
                <td>viscosupplementation</td>
                <td>2</td>
                <td>7</td>
                <td>8</td>
                <td>7</td>
              </tr>
              <tr valign="top">
                <td>anaemia</td>
                <td>CBOW</td>
                <td>Yes</td>
                <td>Yes</td>
                <td>iron</td>
                <td>erythropoiesis-stimulating_agents</td>
                <td>2</td>
                <td>11</td>
                <td>9</td>
                <td>4</td>
              </tr>
              <tr valign="top">
                <td>anaemia</td>
                <td>Skip-gram</td>
                <td>—</td>
                <td>Yes</td>
                <td>recombinant_human_erythropoietin</td>
                <td>iron</td>
                <td>2</td>
                <td>11</td>
                <td>8</td>
                <td>5</td>
              </tr>
              <tr valign="top">
                <td>hypertension</td>
                <td>CBOW</td>
                <td>—</td>
                <td>Yes</td>
                <td>antihypertensive_therapy</td>
                <td>antihypertensive</td>
                <td>2</td>
                <td>11</td>
                <td>8</td>
                <td>6</td>
              </tr>
              <tr valign="top">
                <td>hypertension</td>
                <td>Skip-gram</td>
                <td>Yes</td>
                <td>Yes</td>
                <td>antihypertensive_drug_classes</td>
                <td>antihypertensive</td>
                <td>1</td>
                <td>12</td>
                <td>10</td>
                <td>8</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table4fn1">
              <p><sup>a</sup>CBOW: Continuous Bag-of-Words.</p>
            </fn>
            <fn id="table4fn2">
              <p><sup>b</sup>CKD: chronic kidney disease.</p>
            </fn>
            <fn id="table4fn3">
              <p><sup>c</sup>Not <italic>clinical winners</italic> according to O2.</p>
            </fn>
            <fn id="table4fn4">
              <p><sup>d</sup>AED: antiepileptic drug.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table5">
          <label>Table 5</label>
          <caption>
            <p>Changes in clinical winners (highest value of n4) per model and disease target x considering observer O1 and O2.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="100"/>
            <col width="90"/>
            <col width="240"/>
            <col width="250"/>
            <col width="150"/>
            <col width="40"/>
            <col width="40"/>
            <col width="40"/>
            <col width="50"/>
            <thead>
              <tr valign="top">
                <td>Disease target <italic>x</italic></td>
                <td>Model</td>
                <td>Differences in <italic>clinical winner</italic> max (n4) according to observers</td>
                <td>Treatment <italic>z1</italic> search query</td>
                <td>Treatment <italic>z2</italic> search query</td>
                <td>n1</td>
                <td>n2</td>
                <td>n3</td>
                <td>n4</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>epilepsy</td>
                <td>Skip-gram</td>
                <td>Observer O2<sup>a</sup>: New</td>
                <td>valproate</td>
                <td>levetiracetam</td>
                <td>2</td>
                <td>10</td>
                <td>9</td>
                <td>7</td>
              </tr>
              <tr valign="top">
                <td>arthritis</td>
                <td>CBOW<sup>b</sup></td>
                <td>Observer O2: n4 different</td>
                <td>plus_methotrexate</td>
                <td>methotrexate</td>
                <td>1</td>
                <td>12</td>
                <td>9</td>
                <td>6</td>
              </tr>
              <tr valign="top">
                <td>arthritis</td>
                <td>CBOW</td>
                <td>Observer O2: New</td>
                <td>methotrexate</td>
                <td>DMARDs<sup>c</sup></td>
                <td>2</td>
                <td>11</td>
                <td>9</td>
                <td>6</td>
              </tr>
              <tr valign="top">
                <td>arthritis</td>
                <td>Skip-gram</td>
                <td>Observer O2: New</td>
                <td>IACI<sup>d</sup></td>
                <td>DMARDs</td>
                <td>2</td>
                <td>9</td>
                <td>6</td>
                <td>5</td>
              </tr>
              <tr valign="top">
                <td>arthritis</td>
                <td>Skip-gram</td>
                <td>Observer O2: New</td>
                <td>plus_methotrexate</td>
                <td>DMARDs</td>
                <td>2</td>
                <td>10</td>
                <td>6</td>
                <td>5</td>
              </tr>
              <tr valign="top">
                <td>anaemia</td>
                <td>Skip-gram</td>
                <td>Observer O1<sup>e</sup>: n4 different</td>
                <td>recombinant_human_erythropoietin</td>
                <td>iron</td>
                <td>2</td>
                <td>11</td>
                <td>8</td>
                <td>4</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table5fn1">
              <p><sup>a</sup>O2: BMJ health informatician who works with BMJ Best Practice content and has a junior doctor background.</p>
            </fn>
            <fn id="table5fn2">
              <p><sup>b</sup>CBOW: Continuous Bag-of-Words.</p>
            </fn>
            <fn id="table5fn3">
              <p><sup>c</sup>DMARD: disease-modifying antirheumatic drug.</p>
            </fn>
            <fn id="table5fn4">
              <p><sup>d</sup>IACI: intra-articular corticosteroid injection.</p>
            </fn>
            <fn id="table5fn5">
              <p><sup>e</sup>O1: medical consultant.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p><xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> has the best <italic>clinical winner,</italic> which is an <italic>NER winner</italic>. <xref ref-type="table" rid="table6">Table 6</xref> shows the best <italic>clinical winner</italic> that is not an <italic>NER winner</italic>. <xref ref-type="table" rid="table6">Table 6</xref> illustrates the enrichment of the candidate n-grams <italic>y</italic> with domain knowledge meaning (Stage 2 normalizes n-grams with UMLS CUIs) and biomedical evidence ratified with an audit (Stage 3). The evidence provided for the evidence-based categories (quotes with references from the biomedical literature) is presented in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref> (worksheet Stage 3).</p>
        <p>In conclusion, considering the <italic>clinical winners</italic> found (<xref ref-type="table" rid="table4">Table 4</xref>), the answer to Q3 is “yes,” that is, the 4-term type of analogies discovered in a small common-English corpus can also be discovered in a large-scale biomedical corpus.</p>
        <table-wrap position="float" id="table6">
          <label>Table 6</label>
          <caption>
            <p>Illustration of a Best clinical winner with max (n4)=8 for CBOW and disease target x = epilepsy, which is not an NER winner.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="70"/>
            <col width="240"/>
            <col width="110"/>
            <col width="310"/>
            <col width="270"/>
            <thead>
              <tr valign="top">
                <td>Rank<sup>a</sup></td>
                <td>Candidate <italic>y</italic></td>
                <td>3CosAdd</td>
                <td>UMLS CUI for concept <italic>Y</italic><sub><italic>Tx</italic></sub> mapped to candidate <italic>y</italic><sub><italic>Tx</italic></sub></td>
                <td>Evidence-based categories for concept <italic>Y</italic><sub><italic>Tx</italic></sub> correlated with concept <italic>X</italic></td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>1</td>
                <td>lamotrigine</td>
                <td>0.385201</td>
                <td>C0064636</td>
                <td>Tx with therapeutic effect</td>
              </tr>
              <tr valign="top">
                <td>2</td>
                <td>carbamazepine</td>
                <td>0.345227</td>
                <td>C0006949</td>
                <td>Tx with unwanted or adverse effects (ie, nontherapeutic)</td>
              </tr>
              <tr valign="top">
                <td>3</td>
                <td>low_propensity</td>
                <td>0.324285</td>
                <td>—<sup>b</sup></td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td>4</td>
                <td>clonazepam</td>
                <td>0.310706</td>
                <td>C0009011</td>
                <td>Tx with uncertain therapeutic effect</td>
              </tr>
              <tr valign="top">
                <td>5</td>
                <td>topiramate</td>
                <td>0.308402</td>
                <td>C0076829</td>
                <td>Tx with therapeutic effect</td>
              </tr>
              <tr valign="top">
                <td>6</td>
                <td>lithium_valproate</td>
                <td>0.308223</td>
                <td>C0023870&#124;C0080356</td>
                <td>Tx with therapeutic effect&#124;Tx with unwanted or adverse effects (ie, nontherapeutic)</td>
              </tr>
              <tr valign="top">
                <td>7</td>
                <td>clobazam</td>
                <td>0.306901</td>
                <td>C0055891</td>
                <td>Tx with therapeutic effect</td>
              </tr>
              <tr valign="top">
                <td>8</td>
                <td>sodium_valproate</td>
                <td>0.300513</td>
                <td>C0037567</td>
                <td>Tx with therapeutic effect</td>
              </tr>
              <tr valign="top">
                <td>9</td>
                <td>lorazepam</td>
                <td>0.29562</td>
                <td>C0024002</td>
                <td>Tx with therapeutic effect</td>
              </tr>
              <tr valign="top">
                <td>10</td>
                <td>lithium</td>
                <td>0.294804</td>
                <td>C0023870</td>
                <td>Tx with therapeutic effect&#124;Tx with unwanted or adverse effects (ie nontherapeutic)</td>
              </tr>
              <tr valign="top">
                <td>11</td>
                <td>gabapentin_pregabalin_topiramate</td>
                <td>0.291698</td>
                <td>C0657912&#124;C0076829&#124;C0060926</td>
                <td>Tx with therapeutic effect</td>
              </tr>
              <tr valign="top">
                <td>12</td>
                <td>antiepileptic_drugs_other_than</td>
                <td>0.290046</td>
                <td>C0003299</td>
                <td>Tx with therapeutic effect</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table6fn1">
              <p><sup>a</sup>The search query −x +z1 +z2 is listed in <xref ref-type="table" rid="table4">Table 4</xref>, which is −epilepsy +valproate +antiepileptic_drug. The character “&#124;” appears when there is more than 1 CUI or evidence-based category.</p>
            </fn>
            <fn id="table6fn2">
              <p><sup>b</sup>The candidate y = “low_propensity” does not belong to the semantic field Tx, and so, it has no UMLS CUI assigned.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Answer Q4: An Empirical Heuristic with Some Predictive Power for Clinical Winners</title>
        <p><xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref> (worksheet Q4) has the 304 search queries of the total of 446 (223 for CBOW and 223 for Skip-gram) queries, where all the candidates <italic>y<sub>Tx</sub></italic> mapped to concepts <italic>Y<sub>Tx</sub></italic> have at least one evidence-based category assigned. <xref ref-type="boxed-text" rid="box2">Textbox 2</xref> summarizes the empirical heuristic developed by visual inspection, focusing on rows with the minimum (n4=0) and the maximum observed values of n4. The heuristic is programmatically implemented as a Boolean expression composed of 3 expressions with the Boolean AND.</p>
        <boxed-text id="box2" position="float">
          <title>An empirical heuristic developed by visual inspection with some predictive power for the clinical winners.</title>
          <list list-type="order">
            <list-item>
              <p>Avoid n-grams <italic>z1</italic> and <italic>z2</italic> having short forms</p>
            </list-item>
            <list-item>
              <p>Favor n-grams <italic>z1</italic> or <italic>z2</italic> (or both) not appearing among the 20 top-ranked candidates for target <italic>x</italic> with the highest value for cosine with Skip-gram embeddings</p>
            </list-item>
            <list-item>
              <p>Favor n-gram <italic>z2</italic> with frequency counts in the corpus &#62;100</p>
            </list-item>
          </list>
        </boxed-text>
        <p>The heuristic selects 93 of the 304 search queries, which brings 126 of the 190 UMLS Metathesaurus concepts <italic>Y<sub>Tx</sub></italic> with the evidence-based category “Tx with therapeutic effect,” that is, <italic>Y<sub>Tx</sub></italic> with therapeutic intent.</p>
        <p><xref ref-type="table" rid="table7">Table 7</xref> (source data in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>) shows the performance of the heuristic considering (1) the values of n4 (the last 3 yellow columns in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref> worksheet Q4), (2) the different thresholds for n4, and (3) precision and recall as metric.</p>
        <p>Considering the precision and recall values for the empirical heuristic (<xref ref-type="table" rid="table7">Table 7</xref>), the answer to Q4 is also “yes,” that is, some predictive power over the <italic>clinical winners</italic> obtained is possible.</p>
        <table-wrap position="float" id="table7">
          <label>Table 7</label>
          <caption>
            <p>Precision and recall for the empirical heuristic developed using <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref> (worksheet Q4).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="120"/>
            <col width="200"/>
            <col width="200"/>
            <col width="210"/>
            <col width="150"/>
            <col width="120"/>
            <thead>
              <tr valign="top">
                <td>Threshold</td>
                <td>True positive (TP)</td>
                <td>False positive (FP)</td>
                <td>False negative (FN)</td>
                <td>Precision<sup>a</sup> %</td>
                <td>Recall<sup>b</sup> %</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>n4&#62;0</td>
                <td>91</td>
                <td>2</td>
                <td>189</td>
                <td>97.85</td>
                <td>32.5</td>
              </tr>
              <tr valign="top">
                <td>n4&#62;1</td>
                <td>84</td>
                <td>9</td>
                <td>151</td>
                <td>90.32</td>
                <td>35.74</td>
              </tr>
              <tr valign="top">
                <td>n4&#62;2</td>
                <td>73</td>
                <td>20</td>
                <td>111</td>
                <td>78.49</td>
                <td>39.67</td>
              </tr>
              <tr valign="top">
                <td>n4&#62;3</td>
                <td>48</td>
                <td>45</td>
                <td>76</td>
                <td>51.61</td>
                <td>38.71</td>
              </tr>
              <tr valign="top">
                <td>n4&#62;4</td>
                <td>28</td>
                <td>65</td>
                <td>52</td>
                <td>30.11</td>
                <td>35</td>
              </tr>
              <tr valign="top">
                <td>n4&#62;5</td>
                <td>14</td>
                <td>79</td>
                <td>20</td>
                <td>15.05</td>
                <td>41.18</td>
              </tr>
              <tr valign="top">
                <td>n4&#62;6</td>
                <td>9</td>
                <td>84</td>
                <td>5</td>
                <td>9.68</td>
                <td>64.29</td>
              </tr>
              <tr valign="top">
                <td>n4&#62;7</td>
                <td>4</td>
                <td>89</td>
                <td>0</td>
                <td>4.3</td>
                <td>100</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table7fn1">
              <p><sup>a</sup>Precision: calculated as TP/(TP+FP).</p>
            </fn>
            <fn id="table7fn2">
              <p><sup>b</sup>Recall: calculated as TP/(TP+FN).</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>Humans can agree that the semantic field <italic>person</italic> {you; Romeo} is related to the semantic field <italic>death</italic> {die; died; dagger} in the context of Shakespeare’s Romeo. Hence, we answer Q1 and Q2 with a “yes”; therefore, analogical reasoning with CBOW embeddings seems feasible with a small common-English corpus. This challenges the current assumption that “learning in current deep learning models relies on massive data” [<xref ref-type="bibr" rid="ref3">3</xref>].</p>
        <p>We answered Q3 by demonstrating that there is proof of the generalization; thus, the 3CosAdd formula can discover another type of 4-term analogy that is not a pair-based proportional analogy. Furthermore, we have proven that the analogical inferences sanctioned by the 3CosAdd formula with embeddings could extract treatments with therapeutic intent from free text. Indeed, there were strong examples of analogical reasoning with abstract semantic relations between <italic>z1</italic> and <italic>z2</italic> among <italic>clinical winners</italic> (<xref ref-type="table" rid="table4">Table 4</xref>):</p>
        <list list-type="bullet">
          <list-item>
            <p><italic>Antonym.</italic> The search query, <italic>−CKD +not_requiring_dialysis +dialysis</italic>, with n4=5 for CBOW and Skip-gram.</p>
          </list-item>
          <list-item>
            <p><italic>Synonym.</italic> The search query, <italic>−asthma +inhaled_corticosteroids +inhaled_corticosteroid</italic>, with n4=8 for CBOW (the best <italic>clinical winner</italic>) and n4=7 for Skip-gram, where the relation between <italic>z2</italic> and <italic>z1</italic> was inflectional morphology <italic>singular:plural</italic>. This query resembled the search query, <italic>−Romeo +die +died</italic>.</p>
          </list-item>
          <list-item>
            <p><italic>Category membership</italic>. The search query, <italic>−epilepsy +valproate +antiepileptic_drug</italic>, with n4=8 for CBOW. The search query, <italic>−hypertension +antihypertensive_drug_classes +antihypertensive</italic>, with n4=8 for Skip-gram. Both search queries were the best <italic>clinical winners</italic> (maximum observed value for n4).</p>
          </list-item>
          <list-item>
            <p><italic>Commonalities in structural features</italic>. All search queries focused on the therapeutic intent of <italic>z1</italic> and <italic>z2</italic> for target disease <italic>x</italic>. However, some queries did not have the above abstract semantic relationships between <italic>z1</italic> and <italic>z2</italic>. For example, the search queries <italic>−osteoarthritis +knee_arthroplasty +hyaluronic_acid</italic> with n4=5 for CBOW and <italic>−heart_failure +beta-blockers +aldosterone_antagonists</italic> with n4=5 for Skip-gram.</p>
          </list-item>
        </list>
        <p>We answered Q4 by demonstrating that it is feasible to gain some predictive power for the <italic>clinical winners</italic>; therefore, a tactic preference was latent promising systematicity [<xref ref-type="bibr" rid="ref6">6</xref>]. <xref ref-type="boxed-text" rid="box3">Textbox 3</xref> highlights the precision and recall values for 3 n4 thresholds of the overall performance of the empirical heuristic developed by visual inspection.</p>
        <boxed-text id="box3" position="float">
          <title>Empirical heuristic performance for 304 search queries with all candidate concepts <italic>Y<sub>Tx</sub></italic> with evidence.</title>
          <list list-type="bullet">
            <list-item>
              <p>With a threshold n4 &#62;7, the recall is 100%. All search queries with n4 &#62;7 (the best <italic>clinical winners</italic>) are selected by the heuristic. The precision was 4.30% (the lowest value).</p>
            </list-item>
            <list-item>
              <p>With a threshold n4 &#62;0 (at least one <italic>Y<sub>Tx</sub></italic> with therapeutic intent), the precision was 97.85% (the highest value) and the recall was 32.50%.</p>
              <p/>
              <p/>
            </list-item>
            <list-item>
              <p>With a threshold n4 &#62;2, where 3 was the lowest value among the <italic>clinical winners</italic> (<xref ref-type="table" rid="table3">Tables 3</xref> and <xref ref-type="table" rid="table4">4</xref>), the precision was 78.49% and the recall was 39.67%.</p>
            </list-item>
          </list>
        </boxed-text>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>Our work relies on semantic fields and has 2 main limitations [<xref ref-type="bibr" rid="ref62">62</xref>]: (1) there are overlaps of meaning and (2) there are gaps in meaning. This has 2 clear implications for the lists of concepts <italic>Y<sub>Tx</sub></italic> per disease x:</p>
        <list list-type="bullet">
          <list-item>
            <p>The lists may not comprise mutually exclusive concepts in meaning. For example, “C0060657&#124;formoterol” and “C1276807&#124;Budesonide/formoterol” are both treatments with evidence of therapeutic intent for asthma [<xref ref-type="bibr" rid="ref63">63</xref>].</p>
          </list-item>
          <list-item>
            <p>The lists were incomplete. For example, “C0772501&#124;Levalbuterol” and “C0907850&#124;ciclesonide” are both treatments with evidence of therapeutic intent for asthma [<xref ref-type="bibr" rid="ref63">63</xref>] and not among the <italic>Y<sub>Tx</sub></italic> for asthma.</p>
          </list-item>
        </list>
        <p>We did not use Skip-gram with negative sampling (also known as SGNS); therefore, it can be argued that we did not use the best configuration of a word2vec model [<xref ref-type="bibr" rid="ref21">21</xref>]. The effect of hyperparameter configurations appeared in studies by Levy et al and Chiu et al [<xref ref-type="bibr" rid="ref64">64</xref>,<xref ref-type="bibr" rid="ref65">65</xref>], and Allen and Hospedales [<xref ref-type="bibr" rid="ref66">66</xref>] reviewed mathematical proofs and equations with an emphasis on SGNS for pair-based proportional analogies.</p>
        <p>For Stage 1, the 3CosAdd formula needed at least two n-gram pairs (disease <italic>x</italic>, treatment <italic>z</italic>) [<xref ref-type="bibr" rid="ref29">29</xref>]. Only one search query could be made for the target disease, chronic kidney disease and diabetes, and none for obesity. Other studies that replicated the application to the 3CosAdd formula for target disease <italic>x</italic> could suffer the same limitation. For example, in Appendix B in the study by Pakhomov et al [<xref ref-type="bibr" rid="ref67">67</xref>], among the 100 top-ranked candidate terms (highest cosine value) “semantically similar or related” to target disease “heart failure”, there were no treatments (ie, Tx encompassing 3 textual definitions from Hart et al [<xref ref-type="bibr" rid="ref24">24</xref>]).</p>
        <p>For Stage 2, the MetaMap version was 2016v2 (with a 2016 UMLS release), and few n-grams were considered as clear terminological gaps. The n-gram “anti-VEGF_agents” was manually mapped to CUI=C4727875, which exists in the 2019AA UMLS release. Five n-grams were mapped to very broad CUIs as they had the character “*” in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref> (worksheet Stage 3).</p>
        <p>The NER task (Stage 2) and the searchers in the literature seeking evidence for concept pairs (Stage 3) were time-consuming and required highly trained domain experts. The appraisal of the literature was not performed by a review team as proficient as the ones conducting Cochrane systematic reviews.</p>
        <p>The heuristic developed by visual inspection lacked finesse, and its improvement calls for further investigation.</p>
      </sec>
      <sec>
        <title>Comparison With Prior Work</title>
        <p>The UMLS CUIs were mapped to SNOMED CT identifiers [<xref ref-type="bibr" rid="ref30">30</xref>]. From a “digital health care” perspective [<xref ref-type="bibr" rid="ref68">68</xref>], the UK NHS is moving toward the adoption of SNOMED CT as the only terminology for all care settings [<xref ref-type="bibr" rid="ref69">69</xref>]. A subset of SNOMED CT concepts under worldwide adoption is the CORE Problem List Subset of SNOMED CT [<xref ref-type="bibr" rid="ref70">70</xref>], and the UK NHS has developed 2 human-readable SNOMED CT subsets [<xref ref-type="bibr" rid="ref71">71</xref>]: UK Clinical Extension and UK Drug Extension. However, SNOMED CT lacks statements representing the treatments that can be considered for a disease (eg, inhaled corticosteroid treats asthma) and, to the best of the authors’ knowledge, there are no SNOMED CT subsets for well-known diseases.</p>
        <p>There are reusable datasets for evaluating relatedness made of UMLS CUI pairs:</p>
        <list list-type="bullet">
          <list-item>
            <p>Medical coders set [<xref ref-type="bibr" rid="ref72">72</xref>]: 101 CUI pairs mapped to terms, typically multiple words. Only 29 pairs have a high interrater agreement.</p>
          </list-item>
          <list-item>
            <p>Medical Residents Relatedness Set [<xref ref-type="bibr" rid="ref73">73</xref>]: 588 CUI pairs mapped to terms, typically single words. Using single words is a severe limitation as “most medical terms consist of more than one word” [<xref ref-type="bibr" rid="ref67">67</xref>].</p>
          </list-item>
          <list-item>
            <p>UMLS MRREL table [<xref ref-type="bibr" rid="ref58">58</xref>]: It has relationships asserted by source vocabularies between CUI pairs. Among the relationship attributes appear the following: “may_prevent”, “may_treat”, and “has_contraindicated_drug”.</p>
          </list-item>
        </list>
        <p>All reusable datasets mentioned above lack evidence (quotes with references) from the biomedical literature. <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> cross-compares these reusable datasets and the 408 UMLS CUI pairs investigated thoroughly in this study.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>Extracting clinically useful information automatically from free text in PubMed/MEDLINE may require a natural language understanding of statements containing relevant relations for health care. Hence, extracting treatments with therapeutic intent by analogical reasoning from embeddings (423K n-grams from the PMSB dataset) is an ambitious goal. Our SemDeep approach is knowledge-based, underpinned by embedding analogies that exploit prior knowledge. Biomedical facts from embedding analogies (a 4-term type, not pairwise) are potentially useful for clinicians. The heuristic offers a practical way to discover beneficial treatments for well-known diseases.</p>
        <p>Learning from deep learning models does not require a massive amount of data. Embedding analogies are not limited to pairwise analogies; hence, analogical reasoning with embeddings is underexploited.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Additional material.</p>
        <media xlink:href="medinform_v8i8e16948_app1.pdf" xlink:title="PDF File  (Adobe PDF File), 378 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>Data to replicate the results reported.</p>
        <media xlink:href="medinform_v8i8e16948_app2.xls" xlink:title="XLS File  (Microsoft Excel File), 708 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">BMJ</term>
          <def>
            <p>British Medical Journal</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">CBOW</term>
          <def>
            <p>Continuous Bag-of-Words</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">CUI</term>
          <def>
            <p>concept unique identifier</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">MRREL</term>
          <def>
            <p>the UMLS related concepts table (file=MRREL)</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">NER</term>
          <def>
            <p>named entity recognition</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">NHS</term>
          <def>
            <p>National Health Service</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">PMSB</term>
          <def>
            <p>PubMed systematic reviews subset</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">SemDeep</term>
          <def>
            <p>Semantic Deep Learning</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">SGNS</term>
          <def>
            <p>skip-gram with negative sampling</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">SNOMED CT</term>
          <def>
            <p>systematized nomenclature of medicine - clinical terms</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">Tx</term>
          <def>
            <p>treatment</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb12">UMLS</term>
          <def>
            <p>unified medical language system</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb13">URIs</term>
          <def>
            <p>Universal Resource Identifiers</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>The authors thank Tim Furmston (IT Research, University of Manchester, United Kingdom) for help with the software and electronic infrastructure.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>CW works for BMJ which produces the clinical decision support tool BMJ Best Practice. All other authors have no conflict of interest to declare.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Masic</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Miokovic</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Muhamedagic</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Evidence based medicine - new approaches and challenges</article-title>
          <source>Acta Inform Med</source>
          <year>2008</year>
          <volume>16</volume>
          <issue>4</issue>
          <fpage>219</fpage>
          <lpage>25</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/24109156"/>
          </comment>
          <pub-id pub-id-type="doi">10.5455/aim.2008.16.219-225</pub-id>
          <pub-id pub-id-type="medline">24109156</pub-id>
          <pub-id pub-id-type="pmcid">PMC3789163</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Avorn</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>The psychology of clinical decision making - implications for medication use</article-title>
          <source>N Engl J Med</source>
          <year>2018</year>
          <month>03</month>
          <day>22</day>
          <volume>378</volume>
          <issue>8</issue>
          <fpage>689</fpage>
          <lpage>91</lpage>
          <pub-id pub-id-type="doi">10.1056/NEJMp1714987</pub-id>
          <pub-id pub-id-type="medline">29466158</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>YN</given-names>
            </name>
            <name name-style="western">
              <surname>Holyoak</surname>
              <given-names>KJ</given-names>
            </name>
          </person-group>
          <article-title>Emergence of analogy from relation learning</article-title>
          <source>Proc Natl Acad Sci U S A</source>
          <year>2019</year>
          <month>03</month>
          <day>5</day>
          <volume>116</volume>
          <issue>10</issue>
          <fpage>4176</fpage>
          <lpage>81</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.pnas.org/cgi/pmidlookup?view=long&#38;pmid=30770443"/>
          </comment>
          <pub-id pub-id-type="doi">10.1073/pnas.1814779116</pub-id>
          <pub-id pub-id-type="medline">30770443</pub-id>
          <pub-id pub-id-type="pii">1814779116</pub-id>
          <pub-id pub-id-type="pmcid">PMC6410800</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>LeCun</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Bengio</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Hinton</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Deep learning</article-title>
          <source>Nature</source>
          <year>2015</year>
          <month>05</month>
          <day>28</day>
          <volume>521</volume>
          <issue>7553</issue>
          <fpage>436</fpage>
          <lpage>44</lpage>
          <pub-id pub-id-type="doi">10.1038/nature14539</pub-id>
          <pub-id pub-id-type="medline">26017442</pub-id>
          <pub-id pub-id-type="pii">nature14539</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jurafsky</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Martin</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <source>Stanford University</source>
          <year>2019</year>
          <access-date>2020-06-01</access-date>
          <comment>Speech and Language Processing<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://web.stanford.edu/~jurafsky/slp3/">https://web.stanford.edu/~jurafsky/slp3/</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gentner</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Markman</surname>
              <given-names>AB</given-names>
            </name>
          </person-group>
          <article-title>Structure mapping in analogy and similarity</article-title>
          <source>Am Psychol</source>
          <year>1997</year>
          <volume>52</volume>
          <issue>1</issue>
          <fpage>45</fpage>
          <lpage>56</lpage>
          <pub-id pub-id-type="doi">10.1037//0003-066x.52.1.45</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="web">
          <source>ACL Anthology</source>
          <access-date>2020-06-01</access-date>
          <comment>Analogy (State of the Art)<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://aclweb.org/aclwiki/Analogy_(State_of_the_art)">https://aclweb.org/aclwiki/Analogy_(State_of_the_art)</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schnabel</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Labutov</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Mimno</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Joachims</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Evaluation Methods for Unsupervised Word Embeddings</article-title>
          <source>Proceedings of the 2015 Conference on Empirical Methods in Natural Language Processing</source>
          <year>2015</year>
          <conf-name>EMNLP'15</conf-name>
          <conf-date>September 17-21, 2015</conf-date>
          <conf-loc>Lisbon, Portugal</conf-loc>
          <fpage>298</fpage>
          <lpage>307</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/d15-1036</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mikolov</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Yih</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Zweig</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Linguistic Regularities in Continuous Space Word Representations</article-title>
          <source>Proceedings of the 2013 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies</source>
          <year>2013</year>
          <conf-name>NAACL'13</conf-name>
          <conf-date>June 9-14, 2013</conf-date>
          <conf-loc>Atlanta, Georgia, US</conf-loc>
          <fpage>746</fpage>
          <lpage>51</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.aclweb.org/anthology/N13-1090/"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Drozd</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gladkova</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Matsuoka</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Word Embeddings, Analogies, and Machine Learning: Beyond King - Man + Woman = Queen</article-title>
          <source>Proceedings of COLING 2016, the 26th International Conference on Computational Linguistics: Technical Papers</source>
          <year>2016</year>
          <conf-name>COLING'16</conf-name>
          <conf-date>December 11-16, 2016</conf-date>
          <conf-loc>Osaka, Japan</conf-loc>
          <fpage>3519</fpage>
          <lpage>30</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.aclweb.org/anthology/C16-1332/"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Analogical inference for multi-relational embeddings</article-title>
          <source>Arxiv</source>
          <year>2017</year>
          <fpage>-</fpage>
          <comment>epub ahead of print (1705.02426)<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1705.02426"/></comment>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rather</surname>
              <given-names>NN</given-names>
            </name>
            <name name-style="western">
              <surname>Patel</surname>
              <given-names>CO</given-names>
            </name>
            <name name-style="western">
              <surname>Khan</surname>
              <given-names>SA</given-names>
            </name>
          </person-group>
          <article-title>Using deep learning towards biomedical knowledge discovery</article-title>
          <source>Int J Math Sci Comput</source>
          <year>2017</year>
          <month>04</month>
          <day>8</day>
          <volume>3</volume>
          <issue>2</issue>
          <fpage>1</fpage>
          <lpage>10</lpage>
          <pub-id pub-id-type="doi">10.5815/ijmsc.2017.02.01</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dynomant</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Lelong</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Dahamna</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Massonnaud</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Kerdelhué</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Grosjean</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Canu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Darmoni</surname>
              <given-names>SJ</given-names>
            </name>
          </person-group>
          <article-title>Word embedding for the French natural language in health care: comparative study</article-title>
          <source>JMIR Med Inform</source>
          <year>2019</year>
          <month>07</month>
          <day>29</day>
          <volume>7</volume>
          <issue>3</issue>
          <fpage>e12310</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2019/3/e12310/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/12310</pub-id>
          <pub-id pub-id-type="medline">31359873</pub-id>
          <pub-id pub-id-type="pii">v7i3e12310</pub-id>
          <pub-id pub-id-type="pmcid">PMC6690161</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="web">
          <source>BMJ Best Practice</source>
          <year>2018</year>
          <access-date>2020-06-01</access-date>
          <comment>Sepsis in Adults<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://bestpractice.bmj.com/topics/en-gb/245">http://bestpractice.bmj.com/topics/en-gb/245</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gatta</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Verardo</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bolognesi</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Hypoalbuminemia</article-title>
          <source>Intern Emerg Med</source>
          <year>2012</year>
          <month>10</month>
          <volume>7</volume>
          <issue>Suppl 3</issue>
          <fpage>S193</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1007/s11739-012-0802-0</pub-id>
          <pub-id pub-id-type="medline">23073857</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="web">
          <source>National Library of Medicine - National Institutes of Health - NIH</source>
          <access-date>2020-06-01</access-date>
          <comment>Search Strategy Used to Create the PubMed Systematic Reviews Filter<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.nlm.nih.gov/bsd/pubmed_subsets/sysreviews_strategy.html">https://www.nlm.nih.gov/bsd/pubmed_subsets/sysreviews_strategy.html</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="web">
          <source>Special Issue on Semantic Deep Learning</source>
          <access-date>2020-06-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.semantic-web-journal.net/content/special-issue-semantic-deep-learning">http://www.semantic-web-journal.net/content/special-issue-semantic-deep-learning</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Stevens</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Goble</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Bechhofer</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Ontology-based knowledge representation for bioinformatics</article-title>
          <source>Brief Bioinform</source>
          <year>2000</year>
          <month>12</month>
          <volume>1</volume>
          <issue>4</issue>
          <fpage>398</fpage>
          <lpage>414</lpage>
          <pub-id pub-id-type="doi">10.1093/bib/1.4.398</pub-id>
          <pub-id pub-id-type="medline">11465057</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bartha</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <source>Stanford Encyclopedia of Philosophy</source>
          <year>2019</year>
          <access-date>2020-06-01</access-date>
          <comment>Analogy and Analogical Reasoning<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://plato.stanford.edu/archives/spr2019/entries/reasoning-analogy/">https://plato.stanford.edu/archives/spr2019/entries/reasoning-analogy/</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mikolov</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Corrado</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Dean</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Efficient Estimation of Word Representations in Vector Space</article-title>
          <source>Proceedings of 1st International Conference on Learning Representations</source>
          <year>2013</year>
          <conf-name>ICLR'13</conf-name>
          <conf-date>May 2-4, 2013</conf-date>
          <conf-loc>Scottsdale, Arizona, US</conf-loc>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1301.3781"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Levy</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Goldberg</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Linguistic Regularities in Sparse and Explicit Word Representations</article-title>
          <source>Proceedings of the Eighteenth Conference on Computational Natural Language Learning</source>
          <year>2014</year>
          <conf-name>ACL'14</conf-name>
          <conf-date>June 26-27, 2014</conf-date>
          <conf-loc>Baltimore, Maryland, USA</conf-loc>
          <fpage>171</fpage>
          <lpage>80</lpage>
          <pub-id pub-id-type="doi">10.3115/v1/w14-1618</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nerlich</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Clarke</surname>
              <given-names>DD</given-names>
            </name>
          </person-group>
          <article-title>Semantic fields and frames: historical explorations of the interface between language, action, and cognition</article-title>
          <source>J Pragmat</source>
          <year>2000</year>
          <month>01</month>
          <volume>32</volume>
          <issue>2</issue>
          <fpage>125</fpage>
          <lpage>50</lpage>
          <pub-id pub-id-type="doi">10.1016/s0378-2166(99)00042-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="web">
          <source>SNOMED Confluence</source>
          <access-date>2020-06-01</access-date>
          <comment>Technical Implementation Guide<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://snomed.org/tig">http://snomed.org/tig</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hart</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Tsaousides</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Zanca</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Whyte</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Packel</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ferraro</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Dijkers</surname>
              <given-names>MP</given-names>
            </name>
          </person-group>
          <article-title>Toward a theory-driven classification of rehabilitation treatments</article-title>
          <source>Arch Phys Med Rehabil</source>
          <year>2014</year>
          <month>01</month>
          <volume>95</volume>
          <issue>1 Suppl</issue>
          <fpage>S33</fpage>
          <lpage>44.e2</lpage>
          <pub-id pub-id-type="doi">10.1016/j.apmr.2013.05.032</pub-id>
          <pub-id pub-id-type="medline">24370323</pub-id>
          <pub-id pub-id-type="pii">S0003-9993(13)01045-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hill</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Reichart</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Korhonen</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>SimLex-999: evaluating semantic models with (genuine) similarity estimation</article-title>
          <source>Comput Linguist</source>
          <year>2015</year>
          <month>12</month>
          <volume>41</volume>
          <issue>4</issue>
          <fpage>665</fpage>
          <lpage>95</lpage>
          <pub-id pub-id-type="doi">10.1162/coli_a_00237</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="web">
          <source>NCBO BioPortal</source>
          <year>2020</year>
          <access-date>2020-06-01</access-date>
          <comment>Semanticscience Integrated Ontology<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bioportal.bioontology.org/ontologies/SIO">https://bioportal.bioontology.org/ontologies/SIO</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Peterson</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Griffiths</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Evaluating Vector-Space Models of Analogy</article-title>
          <source>Proceedings of the 39th Annual Meeting of the Cognitive Science Society</source>
          <year>2017</year>
          <conf-name>CogSci'17</conf-name>
          <conf-date>July 26-29, 2017</conf-date>
          <conf-loc>London, UK</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="web">
          <source>Google Code</source>
          <access-date>2020-06-01</access-date>
          <comment>Word2vec - Default<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://code.google.com/archive/p/word2vec/source/default/source">https://code.google.com/archive/p/word2vec/source/default/source</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Arguello-Casteleiro</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Stevens</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Des-Diz</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wroe</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Fernandez-Prieto</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Maroto</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Maseda-Fernandez</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Demetriou</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Peters</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Noble</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>PH</given-names>
            </name>
            <name name-style="western">
              <surname>Dukes-McEwan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Radford</surname>
              <given-names>AD</given-names>
            </name>
            <name name-style="western">
              <surname>Keane</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Nenadic</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Exploring semantic deep learning for building reliable and reusable one health knowledge from PubMed systematic reviews and veterinary clinical notes</article-title>
          <source>J Biomed Semantics</source>
          <year>2019</year>
          <month>11</month>
          <day>12</day>
          <volume>10</volume>
          <issue>Suppl 1</issue>
          <fpage>22</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://jbiomedsem.biomedcentral.com/articles/10.1186/s13326-019-0212-6"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s13326-019-0212-6</pub-id>
          <pub-id pub-id-type="medline">31711540</pub-id>
          <pub-id pub-id-type="pii">10.1186/s13326-019-0212-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC6849172</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bodenreider</surname>
              <given-names>O</given-names>
            </name>
          </person-group>
          <article-title>The unified medical language system (UMLS): integrating biomedical terminology</article-title>
          <source>Nucleic Acids Res</source>
          <year>2004</year>
          <month>01</month>
          <day>1</day>
          <volume>32</volume>
          <issue>Database issue</issue>
          <fpage>D267</fpage>
          <lpage>70</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/14681409"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/nar/gkh061</pub-id>
          <pub-id pub-id-type="medline">14681409</pub-id>
          <pub-id pub-id-type="pii">32/suppl_1/D267</pub-id>
          <pub-id pub-id-type="pmcid">PMC308795</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="web">
          <source>BMJ Best Practice</source>
          <access-date>2020-06-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bestpractice.bmj.com/">https://bestpractice.bmj.com/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="web">
          <source>PubMed/MEDLINE</source>
          <access-date>2020-06-10</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.ncbi.nlm.nih.gov/pubmed/">https://www.ncbi.nlm.nih.gov/pubmed/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kwag</surname>
              <given-names>KH</given-names>
            </name>
            <name name-style="western">
              <surname>González-Lorenzo</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Banzi</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Bonovas</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Moja</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Providing doctors with high-quality information: an updated evaluation of web-based point-of-care information summaries</article-title>
          <source>J Med Internet Res</source>
          <year>2016</year>
          <month>01</month>
          <day>19</day>
          <volume>18</volume>
          <issue>1</issue>
          <fpage>e15</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2016/1/e15/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.5234</pub-id>
          <pub-id pub-id-type="medline">26786976</pub-id>
          <pub-id pub-id-type="pii">v18i1e15</pub-id>
          <pub-id pub-id-type="pmcid">PMC4738183</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="web">
          <source>BMJ Best Practice</source>
          <access-date>2020-06-01</access-date>
          <comment>Do You Work for the NHS in England, Scotland or Wales?<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bestpractice.bmj.com/info/bmagp/">https://bestpractice.bmj.com/info/bmagp/</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Landauer</surname>
              <given-names>TK</given-names>
            </name>
            <name name-style="western">
              <surname>Dumais</surname>
              <given-names>ST</given-names>
            </name>
          </person-group>
          <article-title>A solution to Plato's problem: the latent semantic analysis theory of acquisition, induction, and representation of knowledge</article-title>
          <source>Psychol Rev</source>
          <year>1997</year>
          <volume>104</volume>
          <issue>2</issue>
          <fpage>211</fpage>
          <lpage>40</lpage>
          <pub-id pub-id-type="doi">10.1037/0033-295X.104.2.211</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Blei</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Ng</surname>
              <given-names>AY</given-names>
            </name>
            <name name-style="western">
              <surname>Jordan</surname>
              <given-names>MI</given-names>
            </name>
          </person-group>
          <article-title>Latent dirichlet allocation</article-title>
          <source>J Mach Learn Res</source>
          <year>2003</year>
          <volume>3</volume>
          <issue>4-5</issue>
          <fpage>993</fpage>
          <lpage>1002</lpage>
          <pub-id pub-id-type="doi">10.1162/jmlr.2003.3.4-5.993</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Thomo</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <source>Engineering and Computer Science - University of Victoria</source>
          <access-date>2020-06-01</access-date>
          <comment>Latent Semantic Analysis<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.engr.uvic.ca/~seng474/svd.pdf">https://www.engr.uvic.ca/~seng474/svd.pdf</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ardila</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Meaning in language. An introduction to semantics and pragmatics</article-title>
          <source>J Pragma</source>
          <year>2011</year>
          <month>08</month>
          <volume>43</volume>
          <issue>10</issue>
          <fpage>2670</fpage>
          <lpage>2</lpage>
          <pub-id pub-id-type="doi">10.1016/j.pragma.2011.03.014</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="web">
          <source>Cochrane Library: Cochrane Reviews</source>
          <access-date>2020-06-01</access-date>
          <comment>Cochrane Database of Systematic Reviews<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cochranelibrary.com/cdsr/about-cdsr">https://www.cochranelibrary.com/cdsr/about-cdsr</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <collab>World Health Organization</collab>
          </person-group>
          <source>Prevention and Control of Noncommunicable Diseases: Guidelines for Primary Health Care in Low Resource Settings</source>
          <year>2012</year>
          <publisher-loc>Geneva, Switzerland</publisher-loc>
          <publisher-name>World Health Organization</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Arguello-Casteleiro</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Stevens</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>des-Diz</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wroe</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Fernandez-Prieto</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Maroto</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Maseda-Fernandez</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Demetriou</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Peters</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Noble</surname>
              <given-names>PM</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>PH</given-names>
            </name>
            <name name-style="western">
              <surname>Dukes-McEwan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Radford</surname>
              <given-names>AD</given-names>
            </name>
            <name name-style="western">
              <surname>Keane</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Nenadic</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Exploring semantic deep learning for building reliable and reusable one health knowledge from PubMed systematic reviews and veterinary clinical notes</article-title>
          <source>J Biomed Semantics</source>
          <year>2019</year>
          <month>11</month>
          <day>12</day>
          <volume>10</volume>
          <issue>Suppl 1</issue>
          <fpage>22</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://jbiomedsem.biomedcentral.com/articles/10.1186/s13326-019-0212-6"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s13326-019-0212-6</pub-id>
          <pub-id pub-id-type="medline">31711540</pub-id>
          <pub-id pub-id-type="pii">10.1186/s13326-019-0212-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC6849172</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Casteleiro</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Demetriou</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Read</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Prieto</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Maroto</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Fernandez</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Nenadic</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Klein</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Keane</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Stevens</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Deep learning meets ontologies: experiments to anchor the cardiovascular disease ontology in the biomedical literature</article-title>
          <source>J Biomed Semantics</source>
          <year>2018</year>
          <month>04</month>
          <day>12</day>
          <volume>9</volume>
          <issue>1</issue>
          <fpage>13</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://jbiomedsem.biomedcentral.com/articles/10.1186/s13326-018-0181-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s13326-018-0181-1</pub-id>
          <pub-id pub-id-type="medline">29650041</pub-id>
          <pub-id pub-id-type="pii">10.1186/s13326-018-0181-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC5896136</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Manning</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Schütze</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <source>Foundations of Statistical Natural Language Processing</source>
          <year>1999</year>
          <publisher-loc>New York, USA</publisher-loc>
          <publisher-name>MIT Press</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Novak</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Cañas</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <source>CMap</source>
          <year>2008</year>
          <access-date>2020-06-01</access-date>
          <comment>The Theory Underlying Concept Maps and How to Construct and Use Them<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://cmap.ihmc.us/Publications/ResearchPapers/TheoryUnderlyingConceptMaps.pdf">http://cmap.ihmc.us/Publications/ResearchPapers/TheoryUnderlyingConceptMaps.pdf</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nadkarni</surname>
              <given-names>PM</given-names>
            </name>
            <name name-style="western">
              <surname>Ohno-Machado</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Chapman</surname>
              <given-names>WW</given-names>
            </name>
          </person-group>
          <article-title>Natural language processing: an introduction</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2011</year>
          <volume>18</volume>
          <issue>5</issue>
          <fpage>544</fpage>
          <lpage>51</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/21846786"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/amiajnl-2011-000464</pub-id>
          <pub-id pub-id-type="medline">21846786</pub-id>
          <pub-id pub-id-type="pii">amiajnl-2011-000464</pub-id>
          <pub-id pub-id-type="pmcid">PMC3168328</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yamamoto</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Yamaguchi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bono</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Takagi</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Allie: a database and a search service of abbreviations and long forms</article-title>
          <source>Database (Oxford)</source>
          <year>2011</year>
          <volume>2011</volume>
          <fpage>bar013</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://academic.oup.com/database/article-lookup/doi/10.1093/database/bar013"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/database/bar013</pub-id>
          <pub-id pub-id-type="medline">21498548</pub-id>
          <pub-id pub-id-type="pii">bar013</pub-id>
          <pub-id pub-id-type="pmcid">PMC3077826</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Artstein</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Poesio</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Inter-coder agreement for computational linguistics</article-title>
          <source>Comput Linguist</source>
          <year>2008</year>
          <month>12</month>
          <volume>34</volume>
          <issue>4</issue>
          <fpage>555</fpage>
          <lpage>96</lpage>
          <pub-id pub-id-type="doi">10.1162/coli.07-034-r2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shelley</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Krippendorff</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Content analysis: an introduction to its methodology</article-title>
          <source>J Am Stat Assoc</source>
          <year>1984</year>
          <month>03</month>
          <volume>79</volume>
          <issue>385</issue>
          <fpage>240</fpage>
          <pub-id pub-id-type="doi">10.2307/2288384</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rebholz-Schuhmann</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Oellrich</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hoehndorf</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Text-mining solutions for biomedical research: enabling integrative biology</article-title>
          <source>Nat Rev Genet</source>
          <year>2012</year>
          <month>12</month>
          <volume>13</volume>
          <issue>12</issue>
          <fpage>829</fpage>
          <lpage>39</lpage>
          <pub-id pub-id-type="doi">10.1038/nrg3337</pub-id>
          <pub-id pub-id-type="medline">23150036</pub-id>
          <pub-id pub-id-type="pii">nrg3337</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Aronson</surname>
              <given-names>AR</given-names>
            </name>
            <name name-style="western">
              <surname>Lang</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>An overview of MetaMap: historical perspective and recent advances</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2010</year>
          <volume>17</volume>
          <issue>3</issue>
          <fpage>229</fpage>
          <lpage>36</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/20442139"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/jamia.2009.002733</pub-id>
          <pub-id pub-id-type="medline">20442139</pub-id>
          <pub-id pub-id-type="pii">17/3/229</pub-id>
          <pub-id pub-id-type="pmcid">PMC2995713</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="web">
          <source>Guidelines Developed for Step 4: Named Entity Recognition Task</source>
          <access-date>2020-06-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://static-content.springer.com/esm/art%3A10.1186%2Fs13326-019-0212-6/MediaObjects/13326_2019_212_MOESM2_ESM.pdf">https://static-content.springer.com/esm/art%3A10.1186%2Fs13326-019-0212-6/MediaObjects/13326_2019_212_MOESM2_ESM.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pratt</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Yetisgen-Yildiz</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>A study of biomedical concept identification: MetaMap vs people</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2003</year>
          <fpage>529</fpage>
          <lpage>33</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/14728229"/>
          </comment>
          <pub-id pub-id-type="medline">14728229</pub-id>
          <pub-id pub-id-type="pii">D030003464</pub-id>
          <pub-id pub-id-type="pmcid">PMC1479976</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sackett</surname>
              <given-names>DL</given-names>
            </name>
            <name name-style="western">
              <surname>Rosenberg</surname>
              <given-names>WM</given-names>
            </name>
            <name name-style="western">
              <surname>Gray</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Haynes</surname>
              <given-names>RB</given-names>
            </name>
            <name name-style="western">
              <surname>Richardson</surname>
              <given-names>WS</given-names>
            </name>
          </person-group>
          <article-title>Evidence based medicine: what it is and what it isn't</article-title>
          <source>Br Med J</source>
          <year>1996</year>
          <month>01</month>
          <day>13</day>
          <volume>312</volume>
          <issue>7023</issue>
          <fpage>71</fpage>
          <lpage>2</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/8555924"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmj.312.7023.71</pub-id>
          <pub-id pub-id-type="medline">8555924</pub-id>
          <pub-id pub-id-type="pmcid">PMC2349778</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sager</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <source>A Practical Course in Terminology Processing</source>
          <year>1990</year>
          <publisher-loc>Amsterdam, The Netherlands</publisher-loc>
          <publisher-name>John Benjamins Publishing</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>A coefficient of agreement for nominal scales</article-title>
          <source>Educ Psychol Meas</source>
          <year>1960</year>
          <month>07</month>
          <day>2</day>
          <volume>20</volume>
          <issue>1</issue>
          <fpage>37</fpage>
          <lpage>46</lpage>
          <pub-id pub-id-type="doi">10.1177/001316446002000104</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Davies</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>O'Dea</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Gordon</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Immune therapy in sepsis: are we ready to try again?</article-title>
          <source>J Intensive Care Soc</source>
          <year>2018</year>
          <month>11</month>
          <volume>19</volume>
          <issue>4</issue>
          <fpage>326</fpage>
          <lpage>44</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30515242"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/1751143718765407</pub-id>
          <pub-id pub-id-type="medline">30515242</pub-id>
          <pub-id pub-id-type="pii">10.1177_1751143718765407</pub-id>
          <pub-id pub-id-type="pmcid">PMC6259080</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cabrera-Perez</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Condotta</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Badovinac</surname>
              <given-names>VP</given-names>
            </name>
            <name name-style="western">
              <surname>Griffith</surname>
              <given-names>TS</given-names>
            </name>
          </person-group>
          <article-title>Impact of sepsis on CD4 T cell immunity</article-title>
          <source>J Leukoc Biol</source>
          <year>2014</year>
          <month>11</month>
          <volume>96</volume>
          <issue>5</issue>
          <fpage>767</fpage>
          <lpage>77</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/24791959"/>
          </comment>
          <pub-id pub-id-type="doi">10.1189/jlb.5MR0114-067R</pub-id>
          <pub-id pub-id-type="medline">24791959</pub-id>
          <pub-id pub-id-type="pii">jlb.5MR0114-067R</pub-id>
          <pub-id pub-id-type="pmcid">PMC4197564</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <nlm-citation citation-type="web">
          <source>NCBI Bookshelf</source>
          <year>2019</year>
          <access-date>2020-06-10</access-date>
          <comment>UMLS Reference Manual<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.ncbi.nlm.nih.gov/books/NBK9685/table/ch03.T.related_concepts_file_mrrel_rrf/">https://www.ncbi.nlm.nih.gov/books/NBK9685/table/ch03.T.related_concepts_file_mrrel_rrf/</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref59">
        <label>59</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Viera</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Garrett</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>Understanding interobserver agreement: the kappa statistic</article-title>
          <source>Fam Med</source>
          <year>2005</year>
          <month>05</month>
          <volume>37</volume>
          <issue>5</issue>
          <fpage>360</fpage>
          <lpage>3</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.stfm.org/fmhub/fm2005/May/Anthony360.pdf"/>
          </comment>
          <pub-id pub-id-type="medline">15883903</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref60">
        <label>60</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Feinstein</surname>
              <given-names>AR</given-names>
            </name>
            <name name-style="western">
              <surname>Cicchetti</surname>
              <given-names>DV</given-names>
            </name>
          </person-group>
          <article-title>High agreement but low kappa: I. The problems of two paradoxes</article-title>
          <source>J Clin Epidemiol</source>
          <year>1990</year>
          <volume>43</volume>
          <issue>6</issue>
          <fpage>543</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1016/0895-4356(90)90158-l</pub-id>
          <pub-id pub-id-type="medline">2348207</pub-id>
          <pub-id pub-id-type="pii">0895-4356(90)90158-L</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref61">
        <label>61</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cicchetti</surname>
              <given-names>DV</given-names>
            </name>
            <name name-style="western">
              <surname>Feinstein</surname>
              <given-names>AR</given-names>
            </name>
          </person-group>
          <article-title>High agreement but low kappa: II. Resolving the paradoxes</article-title>
          <source>J Clin Epidemiol</source>
          <year>1990</year>
          <volume>43</volume>
          <issue>6</issue>
          <fpage>551</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.1016/0895-4356(90)90159-m</pub-id>
          <pub-id pub-id-type="medline">2189948</pub-id>
          <pub-id pub-id-type="pii">0895-4356(90)90159-M</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref62">
        <label>62</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lehrer</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <source>The Influence of Semantic Fields on Semantic Change</source>
          <year>1985</year>
          <publisher-loc>Berlin, Germany</publisher-loc>
          <publisher-name>De Gruyter Mouton</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref63">
        <label>63</label>
        <nlm-citation citation-type="web">
          <source>BMJ Best Practice</source>
          <access-date>2020-06-01</access-date>
          <comment>Asthma in Adults<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://bestpractice.bmj.com/topics/en-gb/44">http://bestpractice.bmj.com/topics/en-gb/44</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref64">
        <label>64</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Levy</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Goldberg</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Dagan</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Improving distributional similarity with lessons learned from word embeddings</article-title>
          <source>Trans Assoc Comput Linguist</source>
          <year>2015</year>
          <month>12</month>
          <volume>3</volume>
          <fpage>211</fpage>
          <lpage>25</lpage>
          <pub-id pub-id-type="doi">10.1162/tacl_a_00134</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref65">
        <label>65</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chiu</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Crichton</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Korhonen</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Pyysalo</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>How to Train good Word Embeddings for Biomedical NLP</article-title>
          <source>Proceedings of the 15th Workshop on Biomedical Natural Language Processing</source>
          <year>2016</year>
          <conf-name>ACL'16</conf-name>
          <conf-date>August 12, 2016</conf-date>
          <conf-loc>Berlin, Germany</conf-loc>
          <pub-id pub-id-type="doi">10.18653/v1/w16-2922</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref66">
        <label>66</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Allen</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Hospedales</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Analogies Explained: Towards Understanding Word Embeddings</article-title>
          <source>Proceedings of the 36th International Conference on Machine Learning</source>
          <year>2019</year>
          <conf-name>ICML'19</conf-name>
          <conf-date>June 9-15, 2019</conf-date>
          <conf-loc>Long Beach, California, USA</conf-loc>
          <fpage>223</fpage>
          <lpage>231</lpage>
          <pub-id pub-id-type="doi">10.1201/9780429469275-13</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref67">
        <label>67</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pakhomov</surname>
              <given-names>SV</given-names>
            </name>
            <name name-style="western">
              <surname>Finley</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>McEwan</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Melton</surname>
              <given-names>GB</given-names>
            </name>
          </person-group>
          <article-title>Corpus domain effects on distributional semantic modeling of medical terms</article-title>
          <source>Bioinformatics</source>
          <year>2016</year>
          <month>12</month>
          <day>1</day>
          <volume>32</volume>
          <issue>23</issue>
          <fpage>3635</fpage>
          <lpage>44</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/27531100"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/bioinformatics/btw529</pub-id>
          <pub-id pub-id-type="medline">27531100</pub-id>
          <pub-id pub-id-type="pii">btw529</pub-id>
          <pub-id pub-id-type="pmcid">PMC5181540</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref68">
        <label>68</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tresp</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Overhage</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Bundschus</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Rabizadeh</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Fasching</surname>
              <given-names>PA</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Going digital: a survey on digitalization and large-scale data analytics in healthcare</article-title>
          <source>Proc IEEE</source>
          <year>2016</year>
          <month>11</month>
          <volume>104</volume>
          <issue>11</issue>
          <fpage>2180</fpage>
          <lpage>206</lpage>
          <pub-id pub-id-type="doi">10.1109/JPROC.2016.2615052</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref69">
        <label>69</label>
        <nlm-citation citation-type="web">
          <source>Government of UK</source>
          <access-date>2020-06-01</access-date>
          <comment>Personalised Health and Care 2020<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.gov.uk/government/publications/personalised-health-and-care-2020">https://www.gov.uk/government/publications/personalised-health-and-care-2020</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref70">
        <label>70</label>
        <nlm-citation citation-type="web">
          <source>National Library of Medicine - National Institutes of Health - NIH</source>
          <access-date>2020-06-01</access-date>
          <comment>The CORE Problem List Subset of SNOMED CT<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.nlm.nih.gov/research/umls/Snomed/core_subset.html">https://www.nlm.nih.gov/research/umls/Snomed/core_subset.html</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref71">
        <label>71</label>
        <nlm-citation citation-type="web">
          <source>NHS Digital</source>
          <access-date>2020-06-01</access-date>
          <comment>SNOMED CT Subset Members in Spreadsheet View<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://isd.digital.nhs.uk/trud3/user/guest/group/0/pack/40">https://isd.digital.nhs.uk/trud3/user/guest/group/0/pack/40</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref72">
        <label>72</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pedersen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Pakhomov</surname>
              <given-names>SV</given-names>
            </name>
            <name name-style="western">
              <surname>Patwardhan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Chute</surname>
              <given-names>CG</given-names>
            </name>
          </person-group>
          <article-title>Measures of semantic similarity and relatedness in the biomedical domain</article-title>
          <source>J Biomed Inform</source>
          <year>2007</year>
          <month>07</month>
          <volume>40</volume>
          <issue>3</issue>
          <fpage>288</fpage>
          <lpage>99</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(06)00064-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2006.06.004</pub-id>
          <pub-id pub-id-type="medline">16875881</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(06)00064-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref73">
        <label>73</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pakhomov</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>McInnes</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Adam</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Pedersen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Melton</surname>
              <given-names>GB</given-names>
            </name>
          </person-group>
          <article-title>Semantic similarity and relatedness between clinical terms: an experimental study</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2010</year>
          <month>12</month>
          <day>13</day>
          <volume>2010</volume>
          <fpage>572</fpage>
          <lpage>6</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/21347043"/>
          </comment>
          <pub-id pub-id-type="medline">21347043</pub-id>
          <pub-id pub-id-type="pmcid">PMC3041430</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
