<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id>
      <journal-title>JMIR Medical Informatics</journal-title>
      <issn pub-type="epub">2291-9694</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v9i5e23586</article-id>
      <article-id pub-id-type="pmid">34032581</article-id>
      <article-id pub-id-type="doi">10.2196/23586</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Leveraging Genetic Reports and Electronic Health Records for the Prediction of Primary Cancers: Algorithm Development and Validation Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Eysenbach</surname>
            <given-names>Gunther</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Silva</surname>
            <given-names>João Figueira</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Zhou</surname>
            <given-names>Xiaobing</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author">
          <name name-style="western">
            <surname>Zong</surname>
            <given-names>Nansu</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0066-9524</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Ngo</surname>
            <given-names>Victoria</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9973-8379</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Stone</surname>
            <given-names>Daniel J</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-4506-0712</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Wen</surname>
            <given-names>Andrew</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9090-8028</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Zhao</surname>
            <given-names>Yiqing</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2874-8136</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Yu</surname>
            <given-names>Yue</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-3900-1217</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>Sijia</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9763-1164</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author">
          <name name-style="western">
            <surname>Huang</surname>
            <given-names>Ming</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7367-3626</ext-link>
        </contrib>
        <contrib id="contrib9" contrib-type="author">
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>Chen</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2638-3081</ext-link>
        </contrib>
        <contrib id="contrib10" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Jiang</surname>
            <given-names>Guoqian</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Department of Health Sciences Research</institution>
            <institution>Mayo Clinic</institution>
            <addr-line>200 First Street</addr-line>
            <addr-line>Rochester, MN</addr-line>
            <country>United States</country>
            <phone>1 480 301 8000</phone>
            <email>Jiang.Guoqian@mayo.edu</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2940-0019</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Department of Health Sciences Research</institution>
        <institution>Mayo Clinic</institution>
        <addr-line>Rochester, MN</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>University of California Davis Health</institution>
        <addr-line>Sacramento, CA</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Guoqian Jiang <email>Jiang.Guoqian@mayo.edu</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>5</month>
        <year>2021</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>25</day>
        <month>5</month>
        <year>2021</year>
      </pub-date>
      <volume>9</volume>
      <issue>5</issue>
      <elocation-id>e23586</elocation-id>
      <history>
        <date date-type="received">
          <day>17</day>
          <month>8</month>
          <year>2020</year>
        </date>
        <date date-type="rev-request">
          <day>13</day>
          <month>11</month>
          <year>2020</year>
        </date>
        <date date-type="rev-recd">
          <day>7</day>
          <month>1</month>
          <year>2021</year>
        </date>
        <date date-type="accepted">
          <day>27</day>
          <month>1</month>
          <year>2021</year>
        </date>
      </history>
      <copyright-statement>©Nansu Zong, Victoria Ngo, Daniel J Stone, Andrew Wen, Yiqing Zhao, Yue Yu, Sijia Liu, Ming Huang, Chen Wang, Guoqian Jiang. Originally published in JMIR Medical Informatics (https://medinform.jmir.org), 25.05.2021.</copyright-statement>
      <copyright-year>2021</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on https://medinform.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://medinform.jmir.org/2021/5/e23586" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Precision oncology has the potential to leverage clinical and genomic data in advancing disease prevention, diagnosis, and treatment. A key research area focuses on the early detection of primary cancers and potential prediction of cancers of unknown primary in order to facilitate optimal treatment decisions.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study presents a methodology to harmonize phenotypic and genetic data features to classify primary cancer types and predict cancers of unknown primaries.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We extracted genetic data elements from oncology genetic reports of 1011 patients with cancer and their corresponding phenotypic data from Mayo Clinic’s electronic health records. We modeled both genetic and electronic health record data with HL7 Fast Healthcare Interoperability Resources. The semantic web Resource Description Framework was employed to generate the network-based data representation (ie, patient-phenotypic-genetic network). Based on the Resource Description Framework data graph, the Node2vec graph-embedding algorithm was applied to generate features. Multiple machine learning and deep learning backbone models were compared for cancer prediction performance.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>With 6 machine learning tasks designed in the experiment, we demonstrated that the proposed method achieved favorable results in classifying primary cancer types (area under the receiver operating characteristic curve [AUROC] 96.56% for all 9 cancer predictions on average based on the cross-validation) and predicting unknown primaries (AUROC 80.77% for all 8 cancer predictions on average for real-patient validation). To demonstrate the interpretability, 17 phenotypic and genetic features that contributed the most to the prediction of each cancer were identified and validated based on a literature review.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Accurate prediction of cancer types can be achieved with existing electronic health record data with satisfactory precision. The integration of genetic reports improves prediction, illustrating the translational values of incorporating genetic tests early at the diagnosis stage for patients with cancer.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>genetic reports</kwd>
        <kwd>electronic health records</kwd>
        <kwd>predicting primary cancers</kwd>
        <kwd>Fast Healthcare Interoperability Resources</kwd>
        <kwd>FHIR</kwd>
        <kwd>Resource Description Framework</kwd>
        <kwd>RDF</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Cancer is the second leading cause of death worldwide [<xref ref-type="bibr" rid="ref1">1</xref>]. The health burden of cancer in the United States is substantial [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref3">3</xref>], with approximately 1.8 million new diagnoses and an estimated 600,000 deaths in 2020 alone [<xref ref-type="bibr" rid="ref4">4</xref>]. Despite the advances in characterizing oncogenic mutations in the past few decades, overcoming the consequences of cellular self-renewal and neoplastic transformation remains a challenge in cancer therapy research [<xref ref-type="bibr" rid="ref5">5</xref>]. Therefore, continued discoveries in causes, treatment, and management are needed to further the knowledge and understanding of this collection of related diseases [<xref ref-type="bibr" rid="ref6">6</xref>].</p>
      <p>Modern gene technology has provided an opportunity to identify certain gene mutations associated with increased cancer risk. Approximately 5% to 10% of all cancer diagnoses are linked to cancer predisposition syndromes [<xref ref-type="bibr" rid="ref7">7</xref>-<xref ref-type="bibr" rid="ref9">9</xref>]. Major syndromes of cancer predisposition affecting adults include breast, ovarian, prostate, gastric, and pancreatic cancer [<xref ref-type="bibr" rid="ref7">7</xref>]. Precision medicine initiatives call for the leveraging of clinical and genomic data to not only screen for cancers but also to help monitor cancer progression and guide therapy options [<xref ref-type="bibr" rid="ref10">10</xref>]. Clinicians can facilitate early screening critical for risk assessment and surveillance [<xref ref-type="bibr" rid="ref8">8</xref>]. If cancer is detected at an early stage, survival rates tend to be significantly higher than those for cancers diagnosed at an advanced stage [<xref ref-type="bibr" rid="ref11">11</xref>-<xref ref-type="bibr" rid="ref13">13</xref>]. Nash et al [<xref ref-type="bibr" rid="ref11">11</xref>] cite figures as drastic as 90% survival for early ovarian cancer detection compared to only 5% survival with advanced stage detection, as an example. The utilization of genetic tests in diagnosing primary cancer also becomes critical when the symptoms and the physical exams suggest unspecified cancer known as cancer of unknown primary [<xref ref-type="bibr" rid="ref14">14</xref>]. Cancer of unknown primary accounts for 3% to 5% of all tumors [<xref ref-type="bibr" rid="ref15">15</xref>]. Predicting the primary cancer for a cancer of unknown primary can significantly increase our current knowledge of metastasis and benefit the treatment of patients with cancer of unknown primary.</p>
      <p>The implementation and adoption of health information technology have given frontline clinicians access to a large repository of longitudinal clinical data collected during health care encounters [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref17">17</xref>]. Medical insight and clinical decision making rely heavily upon access to these data from electronic health records. Artificial intelligence techniques, such as machine learning methods, are promising for finding patterns and discovering associations in health care data to help predict diseases [<xref ref-type="bibr" rid="ref18">18</xref>]. Improved predictions can be made by integrating diverse types of digital data in patients’ charts, which include diagnosis codes, clinical notes, laboratory test results, and treatment data [<xref ref-type="bibr" rid="ref19">19</xref>].</p>
      <p>As demand grows for genetic testing from patients and as genomic data continue to be incorporated into electronic health records, there is a need to study how genetic reports, along with electronic health record data, can be leveraged to predict cancers. Conventional computational methods for predictive models are based on features extracted from diverse data sources, known as bag of features [<xref ref-type="bibr" rid="ref20">20</xref>]. The features in these models are treated independently, and the potential connections and patterns among the features cannot be fully explored to serve the prediction. A network-based data model can be used to represent the association between data models with edges, and the potential patterns are embedded in the topological structure of the network. Predictions from network-based data representations have achieved promising results in diverse biomedical areas, such as drug-target prediction [<xref ref-type="bibr" rid="ref21">21</xref>] and patient clustering [<xref ref-type="bibr" rid="ref22">22</xref>]. Representing correlations among phenotypic and genetic data elements through network-based data modeling shows great potential in cancer prediction.</p>
      <p>The objective of this study was to harmonize phenotypic and genetic features for accurate and explainable cancer prediction, specifically: (1) developing a network-based framework with standard health care data exchange frameworks, the HL7 Fast Healthcare Interoperability Resources (FHIR) [<xref ref-type="bibr" rid="ref23">23</xref>] and the Resource Description Framework (RDF) for graph-based data representations, (2) employing a state-of-the-art graph embedding algorithm, Node2vec [<xref ref-type="bibr" rid="ref24">24</xref>], to obtain features for machine learning and deep learning models, and (3) implementing the proposed method with a collection of genetic reports of patients with cancer and the corresponding phenotypic data from Mayo Clinic’s electronic health record systems and comprehensive experiments.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Preliminary</title>
        <p>FHIR is a standardized data framework designed for data exchange between different medical centers to enable information to be captured as it is generated, significantly simplifying population and real-time updates of predefined data models [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref25">25</xref>]. The FHIR specification defines a set of granular clinical concepts and resources to provide standard data infrastructure to support implementations [<xref ref-type="bibr" rid="ref23">23</xref>]. FHIR-based data models are built upon combinations of these resources and a set of attributes with value types. The common attributes (eg, <italic>identifier</italic>) and unique attributes (eg, <italic>bodySite</italic>) in a resource are used to facilitate data modeling. Common data types (eg, <italic>String</italic> and <italic>CodeableConcept</italic>) are used to constrain the attribute based on an adaptation of clinically related ontologies, such as SNOMED CT [<xref ref-type="bibr" rid="ref26">26</xref>], LOINC [<xref ref-type="bibr" rid="ref27">27</xref>], and the International Statistical Classification of Diseases, ninth (ICD-9) and tenth (ICD-10) revisions [<xref ref-type="bibr" rid="ref28">28</xref>].</p>
        <p>RDF is a general metadata or data model that defines concepts and web-resources based on a variety of syntax notations and data serialization formats [<xref ref-type="bibr" rid="ref29">29</xref>]. Inherited from the classical conceptual modeling approaches, RDF utilizes the expressions to form triples, subject-predicate-object, to model data elements (eg, web resources). Specifically, in this study, the subject denotes the clinical data elements (eg, patients), and the predicate denotes a relationship between 2 data elements.</p>
      </sec>
      <sec>
        <title>Framework</title>
        <p>We proposed a network-based framework (<xref rid="figure1" ref-type="fig">Figure 1</xref>) that represented cancer data using the FHIR standard and RDF to facilitate the cancer prediction process. Five types of data sources extracted from the electronic health record—genetic information, lab tests, diagnosis, medication, and family historical records—were represented with FHIR resources and converted to the RDF-based representation. A graph-embedding algorithm, Node2vec, was used to provide a vectorial representation of nodes in the resulting network along with bag of features to form the features for the classification models.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>A network-based framework for cancer prediction based on Fast Healthcare Interoperability Resources and Resource Description Framework.</p>
          </caption>
          <graphic xlink:href="medinform_v9i5e23586_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Data Preprocessing</title>
        <p>Genetic data were extracted from 1011 aggregated anonymized genetic test results (Foundation Medicine Inc), including microsatellite instability and tumor mutational burden. Medical record data elements related to laboratory results, diagnoses, medications, and family histories were extracted from approximately 515,000 billing encounters (666,000 electronic health record encounters) retrieved from a Mayo Clinic clinical data warehouse [<xref ref-type="bibr" rid="ref30">30</xref>]. We integrated genetic and electronic health record data by mapping patient information based on 3 data elements: patient clinic number, names (first and last name), and date of birth. Lab tests, diagnosis, medication, and family historical records were searched based on the mapped patients. We used natural language processing to normalize the names and values. For <italic>diagnosis</italic> and <italic>medication</italic>, all diseases and medications were represented with standardized names encoded by ICD-9 [<xref ref-type="bibr" rid="ref31">31</xref>] and RxNorm [<xref ref-type="bibr" rid="ref32">32</xref>] codes. For lab tests, we represented all the tests with standard names encoded by LOINC [<xref ref-type="bibr" rid="ref27">27</xref>]. For <italic>family historical records</italic>, each record was processed by a pipeline (NLP2FHIR [<xref ref-type="bibr" rid="ref33">33</xref>]), where the medical concepts were identified and normalized using cTAKES [<xref ref-type="bibr" rid="ref34">34</xref>], MedXN [<xref ref-type="bibr" rid="ref35">35</xref>], and MedTime [<xref ref-type="bibr" rid="ref36">36</xref>]. We encoded the diseases from family historical records using ICD-9 codes. To build the data set utilized for the cancer prediction, all the records within the billing cycle related to the target cancers were removed. The top 10 elements in each data source can be found in <xref ref-type="table" rid="table1">Table 1</xref>.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Distribution of the top 10 elements in each data source.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="120"/>
            <col width="600"/>
            <col width="0"/>
            <col width="250"/>
            <thead>
              <tr valign="top">
                <td colspan="4">Code and verbatim description</td>
                <td>Record, n (%)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="4">
                  <bold>Genes</bold>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <italic>TP53</italic>
                </td>
                <td>tumor protein p53</td>
                <td colspan="2">553 (54.70)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <italic>KRAS</italic>
                </td>
                <td>KRAS proto-oncogene, GTPase</td>
                <td colspan="2">292 (28.88)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <italic>MLL2</italic>
                </td>
                <td>lysine methyltransferase 2D<sup>a</sup></td>
                <td colspan="2">173 (17.11)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <italic>LRP1B</italic>
                </td>
                <td>LDL receptor related protein 1B</td>
                <td colspan="2">171 (16.91)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <italic>MLL3</italic>
                </td>
                <td>lysine methyltransferase 2C<sup>a</sup></td>
                <td colspan="2">150 (14.84)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <italic>APC</italic>
                </td>
                <td>APC regulator of WNT signaling pathway</td>
                <td colspan="2">141 (13.95)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <italic>ARID1B</italic>
                </td>
                <td>AT-rich interaction domain 1B</td>
                <td colspan="2">137 (13.55)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <italic>FAT1</italic>
                </td>
                <td>FAT atypical cadherin 1</td>
                <td colspan="2">134 (13.25)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <italic>PRKDC</italic>
                </td>
                <td>protein kinase, DNA-activated, catalytic subunit</td>
                <td colspan="2">128 (12.66)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <italic>ARID1A</italic>
                </td>
                <td>AT-rich interaction domain 1A</td>
                <td colspan="2">126 (12.46)</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>Diagnosis<sup>b</sup></bold>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Z02.9</td>
                <td>Work Status Exam (RTW)</td>
                <td colspan="2">204 (25.66)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>I10</td>
                <td>Hypertension (HTN) Chronic</td>
                <td colspan="2">142 (17.86)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>401.9</td>
                <td>HYPERTENSION NOS</td>
                <td colspan="2">138 (17.36)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>272.4</td>
                <td>HYPERLIPIDEMIA NEC/NOS</td>
                <td colspan="2">116 (14.59)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>R91.8</td>
                <td>Mass Lung</td>
                <td colspan="2">113 (14.21)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>V68.9</td>
                <td>ADMINISTRTVE ENCOUNT NOS</td>
                <td colspan="2">106 (13.33)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Z00.00</td>
                <td>Maintenance Health (HM)</td>
                <td colspan="2">101 (12.70)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>E78.5</td>
                <td>Dyslipidemia NOS</td>
                <td colspan="2">93 (11.70)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>V72.83</td>
                <td>PREOP EXAMINATION NEC</td>
                <td colspan="2">79 (9.94)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>V70.0</td>
                <td>ROUTINE MEDICAL EXAM</td>
                <td colspan="2">79 (9.94)</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>Lab tests<sup>c</sup></bold>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>777-3</td>
                <td>Platelets [#/volume] in Blood by Automated count</td>
                <td colspan="2">991 (99.40)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>2160-0</td>
                <td>Creatinine [Mass/volume] in Serum or Plasma</td>
                <td colspan="2">988 (99.10)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>4544-3</td>
                <td>Hematocrit [Volume Fraction] of Blood by Automated count</td>
                <td colspan="2">985 (98.80)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>718-7</td>
                <td>Hemoglobin [Mass/volume] in Blood</td>
                <td colspan="2">985 (98.80)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>788-0</td>
                <td>Erythrocyte distribution width [Ratio] by Automated count</td>
                <td colspan="2">985 (98.80)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>789-8</td>
                <td>Erythrocytes [#/volume] in Blood by Automated count</td>
                <td colspan="2">985 (98.80)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>6690-2</td>
                <td>Leukocytes [#/volume] in Blood by Automated count</td>
                <td colspan="2">985 (98.80)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>787-2</td>
                <td>MCV [Entitic volume] by Automated count</td>
                <td colspan="2">985 (98.80)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>2823-3</td>
                <td>Potassium [Moles/volume] in Serum or Plasma</td>
                <td colspan="2">975 (97.80)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>2951-2</td>
                <td>Sodium [Moles/volume] in Serum or Plasma</td>
                <td colspan="2">973 (97.60)</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>Family historical records<sup>b</sup></bold>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>V47.2</td>
                <td>Other cardiorespiratory problems</td>
                <td colspan="2">205 (29.54)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>429.9</td>
                <td>Heart disease, unspecified</td>
                <td colspan="2">205 (29.54)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>429.89</td>
                <td>Other ill-defined heart diseases</td>
                <td colspan="2">205 (29.54)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>162.9</td>
                <td>Malignant neoplasm of bronchus and lung, unspecified</td>
                <td colspan="2">133 (19.16)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>162.8</td>
                <td>Malignant neoplasm of other parts of bronchus or lung</td>
                <td colspan="2">130 (18.73)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>272.4</td>
                <td>Other and unspecified hyperlipidemia</td>
                <td colspan="2">124 (17.87)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>434.91</td>
                <td>Cerebral artery occlusion, unspecified with cerebral infarction</td>
                <td colspan="2">104 (14.99)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>799.9</td>
                <td>Other unknown and unspecified cause of morbidity and mortality</td>
                <td colspan="2">84 (12.10)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>311</td>
                <td>Depressive disorder, not elsewhere classified</td>
                <td colspan="2">72 (10.37)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>447.9</td>
                <td>Unspecified disorders of arteries and arterioles</td>
                <td colspan="2">63 (9.08)</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>Medication<sup>d</sup></bold>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>5956</td>
                <td>Iohexol</td>
                <td colspan="2">399 (72.41)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>1359867</td>
                <td>Sodium Chloride 9 MG/ML Prefilled Syringe</td>
                <td colspan="2">374 (67.88)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>1807638</td>
                <td>20 ML Sodium Chloride 9 MG/ML Injection</td>
                <td colspan="2">304 (55.17)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>1807639</td>
                <td>1000 ML Sodium Chloride 9 MG/ML Injection</td>
                <td colspan="2">298 (54.08)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>1740467</td>
                <td>2 ML Ondansetron 2 MG/ML Injection</td>
                <td colspan="2">251 (45.55)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>4337</td>
                <td>Fentanyl</td>
                <td colspan="2">224 (40.65)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>314659</td>
                <td>heparin sodium, porcine</td>
                <td colspan="2">207 (37.57)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>847630</td>
                <td>Calcium Chloride 0.0014 MEQ/ML / Potassium Chloride 0.004 MEQ/ML / Sodium Chloride 0.103 MEQ/ML / Sodium Lactate 0.028 MEQ/ML Injectable Solution</td>
                <td colspan="2">202 (36.66)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>198440</td>
                <td>Acetaminophen 500 MG Oral Tablet</td>
                <td colspan="2">188 (34.12)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>1808234</td>
                <td>10 ML Propofol 10 MG/ML Injection</td>
                <td colspan="2">163 (29.58)</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>Cancers<sup>b</sup></bold>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>162.9</td>
                <td>Malignant neoplasm of bronchus and lung, unspecified</td>
                <td colspan="2">231 (22.85)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>153.9</td>
                <td>Malignant neoplasm of colon, unspecified site</td>
                <td colspan="2">124 (12.27)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>155</td>
                <td>Malignant neoplasm of liver, primary</td>
                <td colspan="2">118 (11.67)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>157.9</td>
                <td>Malignant neoplasm of pancreas, part unspecified</td>
                <td colspan="2">116 (11.47)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>183</td>
                <td>Malignant neoplasm of ovary</td>
                <td colspan="2">85 (8.41)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>185</td>
                <td>Malignant neoplasm of prostate</td>
                <td colspan="2">80 (7.91)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>171.9</td>
                <td>Malignant neoplasm of connective and other soft tissue, site unspecified</td>
                <td colspan="2">68 (6.73)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>193</td>
                <td>Malignant neoplasm of thyroid gland</td>
                <td colspan="2">55 (5.44)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>174.9</td>
                <td>Malignant neoplasm of breast (female), unspecified</td>
                <td colspan="2">53 (5.24)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>—<sup>e</sup></td>
                <td>—</td>
                <td colspan="2">—</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>Current standard gene symbols: <italic>MLL2</italic> is now <italic>KMT2D</italic>; <italic>MLL3</italic> is now <italic>KMT2C.</italic></p>
            </fn>
            <fn id="table1fn2">
              <p><sup>b</sup>International Statistical Classification of Diseases (ninth revision) code and description.</p>
            </fn>
            <fn id="table1fn3">
              <p><sup>c</sup>LOINC code and description.</p>
            </fn>
            <fn id="table1fn4">
              <p><sup>d</sup>RxNorm code and description.</p>
            </fn>
            <fn id="table1fn5">
              <p><sup>e</sup>A tenth item is not included.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Data Preprocessing and Data Modeling Based on FHIR and RDF</title>
        <p>We adapted FHIR-based data models from our previous work [<xref ref-type="bibr" rid="ref37">37</xref>] employing FHIR resources to represent data elements of genetic reports and structured electronic health record data for phenome-wide association studies. Specifically, we represented <italic>genetic</italic> entries with the existing profile <italic>Observation-genetics</italic>, extended from the resource <italic>Observation</italic>. The <italic>lab test</italic>, <italic>diagnosis</italic>, and <italic>medication</italic> entries were represented with the resources <italic>Observation</italic>, <italic>Condition</italic>, and <italic>Medication</italic>, respectively, and were identified by encounters (eg, billing and electronic health record encounters) and service date. The <italic>family historical records</italic> entities were represented with the resource <italic>FamilyMemberHistory</italic> as diseases and were encoded with the attributed condition. All the resources were associated with the resource <italic>Patient</italic>. We further converted the JavaScript object notation–formatted FHIR data to RDF format based on the conversion rules, where (1) all the string-type values were considered as the entities in the RDF graph, and (2) all the values of the resources were considered as the object of the data-type property—named after the resource for the subject resource <italic>Patient</italic>. We illustrated an example of data representation based on FHIR and RDF in <xref rid="figure2" ref-type="fig">Figure 2</xref>.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>An example of data representation based on Fast Healthcare Interoperability Resources (FHIR) and Resource Description Framework (RDF): 2 JavaScript object notation–formatted FHIR representations for patients 1 and 2 are merged and converted into 1 RDF graph.</p>
          </caption>
          <graphic xlink:href="medinform_v9i5e23586_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Feature Generation and Cancer Prediction</title>
        <sec>
          <title>Bag of Features</title>
          <p>Bag of features is analogous to the bag-of-words representation and characterizes a sample with an orderless collection of features [<xref ref-type="bibr" rid="ref38">38</xref>]. In this study, we used bag of features based on the attribute values from the FHIR model. Specifically, categorical values of mutated genes, lab test results, disease diagnoses, medications for treatment, and historical family disease diagnoses were collected as the features from <italic>Observation-genetics</italic>, <italic>Observation</italic>, <italic>Condition</italic>, <italic>Medication</italic>, and <italic>FamilyMemberHistory</italic>, respectively. Additionally, patient demographic features, such as age and gender, were also used.</p>
        </sec>
        <sec>
          <title>Topological Features</title>
          <p>In order to train a model with the features generated from the input RDF data, we adapted a methodology [<xref ref-type="bibr" rid="ref21">21</xref>] that considered the RDF graph as a network, <italic>G</italic>(<italic>V</italic>,<italic>E</italic>) with a set of vertices <italic>V</italic> and a set of edges <italic>E</italic>, where <italic>V</italic> has 7 types of vertices (ie, genetics, lab tests, diagnosis, medication, family historical records, demographics, and patients) and <italic>E</italic> represents associations between the 6 types of vertices (ie, genetics, lab tests, diagnosis, medication, family historical records, and demographics) and patients. We used the graph embedding method to learn the features of the patients, where a patient could be represented by a vector embedded within the topological structure of the patient in the network <italic>G</italic>. Node2vec [<xref ref-type="bibr" rid="ref30">30</xref>] is a state-of-the-art graph embedding method that vectorizes the vertices of a network based on the topology of the network by maximizing the probability of observing the neighborhood <italic>N</italic>(<italic>u</italic>) of each node <italic>u</italic> in <italic>G</italic>:</p>
          <graphic xlink:href="medinform_v9i5e23586_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          <p>where</p>
          <graphic xlink:href="medinform_v9i5e23586_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          <p>and <italic>f</italic> (∙) was the feature representation of a node. In addition, we also generated a &#124;<italic>V</italic>&#124;×&#124;<italic>V</italic>&#124; adjacency matrix from <italic>G</italic>, where each cell of the matrix was set to 1 if there was a connection between nodes, otherwise the cell was set to 0.</p>
          <p>We modeled cancer prediction as a multiclass classification problem, where a given patient was represented with k-dimensional features, and a model categorized the patient into precisely 1 of 9 cancer types: colon cancer (ICD-9: 153.9), pancreas cancer (ICD-9: 157.9), ovary cancer (ICD-9: 183), prostate cancer (ICD-9: 185), connective and other soft tissue cancer (ICD-9: 171.9), thyroid gland cancer (ICD-9: 193), breast cancer (ICD-9: 174.9), liver cancer (ICD-9: 155), and bronchus and lung cancer (ICD-9: 162.9).</p>
        </sec>
      </sec>
      <sec>
        <title>Experiment Design</title>
        <sec>
          <title>Overview</title>
          <p>There were 2 main drivers of this study: (1) from a methodological perspective—how could generated features be coordinated with classification methods in a favorable manner to achieve satisfactory prediction?—and (2) from a data perspective—which data sources, especially genetic data, are preferable in prediction? Our experiment was thus conducted as a sequence of 6 distinct tasks.</p>
        </sec>
        <sec>
          <title>Task 1: Comparison of Combinations of Features and Popular Classification Methods</title>
          <p>A comparison of 3 feature generation methods—bag of features, Node2vec, and bag of features+Node2vec (ie, a linear combination of bag of features and Node2vec)—was conducted. Seven classification methods—random forest [<xref ref-type="bibr" rid="ref39">39</xref>], naive Bayes [<xref ref-type="bibr" rid="ref40">40</xref>], logistic regression [<xref ref-type="bibr" rid="ref41">41</xref>], support vector machine [<xref ref-type="bibr" rid="ref42">42</xref>], deep neural network [<xref ref-type="bibr" rid="ref43">43</xref>], convolutional neural network [<xref ref-type="bibr" rid="ref44">44</xref>], and graph convolutional networks [<xref ref-type="bibr" rid="ref45">45</xref>]—were used.</p>
        </sec>
        <sec>
          <title>Task 2: Comparison of Combinations of Data Sources</title>
          <p>There were 5 types of data sources used in this study. We took all possible combinations of the data sources into consideration and studied how the features generated from these sources affected the results.</p>
        </sec>
        <sec>
          <title>Task 3: Comparison of Predictions for Each Cancer</title>
          <p>To understand how prediction performance varied across cancer types, we conducted 9 prediction tasks, 1 for each cancer type.</p>
        </sec>
        <sec>
          <title>Task 4: Analysis of Feature Contribution for Each Cancer Prediction</title>
          <p>To interpret the model and understand which features were important to each cancer, we studied the features that contributed most to the prediction of cancer.</p>
        </sec>
        <sec>
          <title>Task 5: Time Effect of Cancer Prediction</title>
          <p>To understand how far in advance of the diagnosis an accurate prediction could be made, we studied predictions based on data collected at different lead times, ranging from 0 to 24 months before the diagnosis.</p>
        </sec>
        <sec>
          <title>Task 6: Prediction of Cancer of Unknown Primary Patients</title>
          <p>We identified the 43 primary cancers from 81 patients with cancer of unknown primary based on the diagnosis records to understand how the proposed method performed for real cancer predictions. Please note, no patients with pancreas cancer of unknown primary were identified, and therefore, pancreatic cancer was not considered in this task.</p>
        </sec>
      </sec>
      <sec>
        <title>Feature Selection and Classification</title>
        <p>Two methods were used to generate features: bag of features and Node2vec. For bag of features, all genes, diseases, drugs in genetics, diagnosis, medication, and family historical records were considered as features. For the lab tests<italic>,</italic> the values were converted into categorical values (Null, Normal, or Abnormal) based on the normal range defined in the unified data platform. To avoid overfitting, the features were reduced to <italic>d</italic>={10,20,30,40,50,60,70,80,90,100} based on information gain [<xref ref-type="bibr" rid="ref46">46</xref>]. For Node2vec, the parameter ranges for the grid search were specified as the number of walks γ={10,40}, return <italic>P</italic>={0.5,1.0,2.0}, in-out <italic>q</italic>={0.5,1.0,2.0}, dimension <italic>d</italic>={10,20,30,40,50,60,70,80,90,100}, window size <italic>w</italic>={5,10}, and walk length <italic>t</italic>={40,80}.</p>
        <p>Four popular machine learning models and 3 deep learning models were used for classification. For machine learning methods, the following settings were used: L2 regularization for logistic regression, type C-SVC and linear kernel for support vector machine, 500 trees for random forest, and default settings for naive Bayes. For deep learning methods, the following structures were used: 5 dense layers with dimensions {256, 256, 128, 64, 10} (4 rectified linear unit [ReLU] activation functions with 0.5 dropout rate and 1 softmax activation function) for deep neural network, 3 convolution layers with filters {256, 256, 256} (3 ReLU activation functions and maxpooling layers with 0.5 dropout rate) followed with 4 dense layers with dimensions {256, 128, 64, 10} (3 ReLU activation functions with 0.5 dropout rate and 1 softmax activation function) for convolutional neural network, and 2 graph convolutional layers with channels {64, 10} (1 ReLU activation function with 0.5 dropout rate and 1 softmax activation function) for graph convolutional networks.</p>
        <p>Node2vec was obtained from the Node2vec library [<xref ref-type="bibr" rid="ref47">47</xref>]. The logistic regression classifier was obtained from the LIBLINEAR library [<xref ref-type="bibr" rid="ref48">48</xref>]; naive Bayes, random forest, and information gain algorithms were obtained from the Weka library [<xref ref-type="bibr" rid="ref49">49</xref>]; and support vector machine was obtained from LIBSVM [<xref ref-type="bibr" rid="ref50">50</xref>]. Deep neural network and graph convolutional networks were constructed based on the Keras library [<xref ref-type="bibr" rid="ref51">51</xref>]. Graph convolutional networks algorithms were obtained from the Spektral library [<xref ref-type="bibr" rid="ref52">52</xref>].</p>
      </sec>
      <sec>
        <title>Validation and Evaluation Metrics</title>
        <p>We used conventional 10-fold cross-validation for the evaluation, where 10 independent iterations of training and testing were conducted, and a random partition of the original samples into 10 equal-size subsamples was performed. To assess the quality of classification, we used area under the receiver operating characteristic curve (AUROC) [<xref ref-type="bibr" rid="ref53">53</xref>]. In addition, the area under the precision-recall curve (AUPRC) [<xref ref-type="bibr" rid="ref53">53</xref>] was used as a supplementary metric characterizing the results for imbalanced classes [<xref ref-type="bibr" rid="ref54">54</xref>,<xref ref-type="bibr" rid="ref55">55</xref>]. AUROC and AUPRC scores were calculated using the Java Receiver Operating Characteristic library [<xref ref-type="bibr" rid="ref56">56</xref>] and Weka evaluation package [<xref ref-type="bibr" rid="ref57">57</xref>].</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Combinations of Features and Popular Classification Methods</title>
        <p><xref ref-type="table" rid="table2">Table 2</xref> shows the best performance result was achieved by using bag of features+Node2vec and random forest (AUROC 96.19%) (AUPRC: Table S1, <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Generally, using bag of features+Node2vec outperformed using bag of features (+1.27%) and Node2vec (+1.41%). Although we observed that machine learning–based methods generally outperformed deep learning–based methods, the best deep learning–based approach (AUROC 95.12%) was second to the best machine learning–based approach by only 1 percentage-point difference (outperforming the remaining machine learning–based approaches). As our implementation of deep learning models is based on simple architectures, the deep learning models with more complex architectures have the potential to facilitate feature generation and may directly contribute to improvements in cancer prediction.</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Prediction performance (area under the receiver operating characteristic curve) for combinations of features and classification methods.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="300"/>
            <col width="200"/>
            <col width="200"/>
            <col width="300"/>
            <thead>
              <tr valign="top">
                <td>Classifiers</td>
                <td colspan="3">Feature generation algorithm</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Bag of features</td>
                <td>Node2vec</td>
                <td>Bag of features+Node2vec</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>AUROC<sup>a</sup> (%)</td>
                <td>AUROC (%)</td>
                <td>AUROC (%)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Random forest</td>
                <td>94.82</td>
                <td>91.89</td>
                <td>96.19</td>
              </tr>
              <tr valign="top">
                <td>Naive Bayes</td>
                <td>92.30</td>
                <td>92.91</td>
                <td>94.76</td>
              </tr>
              <tr valign="top">
                <td>Logistic regression</td>
                <td>86.68</td>
                <td>85.25</td>
                <td>89.39</td>
              </tr>
              <tr valign="top">
                <td>Support vector machine</td>
                <td>84.62</td>
                <td>83.92</td>
                <td>86.72</td>
              </tr>
              <tr valign="top">
                <td>Convolutional neural network</td>
                <td>64.14</td>
                <td>63.36</td>
                <td>57.68</td>
              </tr>
              <tr valign="top">
                <td>Deep neural network</td>
                <td>92.56</td>
                <td>92.87</td>
                <td>95.12</td>
              </tr>
              <tr valign="top">
                <td>Graph convolutional networks</td>
                <td>79.67</td>
                <td>83.62</td>
                <td>83.83</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>AUROC: area under the receiver operating characteristic curve.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Combinations of Data Sources</title>
        <p><xref ref-type="table" rid="table3">Table 3</xref> shows better results were achieved by the model DML+G (diagnosis, medication, lab test, and genetic information; AUROC 96.56%). Steady improvement is obtained when more features are used (AUPRC: Table S2, <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). For example, increasing average AUROCs (75.49%, 82.65%, 87.98%, and 91.74%) are achieved by using 1, 2, 3, and 4 feature types, respectively, without using genetic information. <xref ref-type="table" rid="table3">Table 3</xref> also presents the importance of the features, where lab test is the most important feature (91.00%), followed by diagnosis (73.12%), medication (72.83%), and family historical records (65.01%). We also demonstrated the value of genetic information for cancer prediction—an average improvement of 10.52% was reached. Interestingly, such improvement is weakened when more feature types are used (+15.76% for using 1 feature type, +10.45% for 2 feature types, +6.92% for 3 feature types, and +4.45% for 4 feature types). <xref ref-type="table" rid="table3">Table 3</xref> also indicates the potential of using diverse types of features alternatively when genetic information is not available.</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Prediction performance for combinations of data sources with bag of features+Node2vec and random forest algorithms.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="470"/>
            <col width="0"/>
            <col width="250"/>
            <col width="0"/>
            <col width="250"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Feature types</td>
                <td colspan="4">AUROC<sup>a</sup> (%)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">Base feature set</td>
                <td>With genetic information</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="2">
                  <bold>1 feature type</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">G<sup>b</sup></td>
                <td colspan="2">73.12</td>
                <td>90.89</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">D<sup>c</sup></td>
                <td colspan="2">65.01</td>
                <td>88.37</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">H<sup>d</sup></td>
                <td colspan="2">91.00</td>
                <td>95.80</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">L<sup>e</sup></td>
                <td colspan="2">72.83</td>
                <td>89.94</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">M<sup>f</sup></td>
                <td colspan="2">73.21</td>
                <td>90.92</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>2 feature types</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">DH</td>
                <td colspan="2">91.55</td>
                <td>96.09</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">DL</td>
                <td colspan="2">77.09</td>
                <td>90.88</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">DM</td>
                <td colspan="2">91.30</td>
                <td>95.92</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">HL</td>
                <td colspan="2">71.53</td>
                <td>89.02</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">MH</td>
                <td colspan="2">91.22</td>
                <td>95.75</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">ML</td>
                <td colspan="2">91.98</td>
                <td>96.01</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>3 feature types</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">DHL</td>
                <td colspan="2">76.76</td>
                <td>91.28</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">DMH</td>
                <td colspan="2">91.76</td>
                <td>96.56</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">DML</td>
                <td colspan="2">91.43</td>
                <td>95.76</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">MHL</td>
                <td colspan="2">91.74</td>
                <td>96.19</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>4 feature types</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">DMHL</td>
                <td colspan="2">73.12</td>
                <td>90.89</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>AUROC: area under the receiver operating characteristic curve.</p>
            </fn>
            <fn id="table3fn2">
              <p><sup>b</sup>G: genetic information.</p>
            </fn>
            <fn id="table3fn3">
              <p><sup>c</sup>D: diagnosis.</p>
            </fn>
            <fn id="table3fn4">
              <p><sup>d</sup>H: family historical records.</p>
            </fn>
            <fn id="table3fn5">
              <p><sup>e</sup>L: lab test.</p>
            </fn>
            <fn id="table3fn6">
              <p><sup>f</sup>M: medication.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Predictions for Each Cancer</title>
        <p><xref ref-type="table" rid="table4">Table 4</xref> shows that the proposed method achieved high AUROC values across all 9 cancer types (AUPRC: Table S3, <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>), especially for thyroid gland (AUROC 99.80%), prostate (99.76%), breast (98.53%), ovary (98.29%), connective and other soft tissue (96.05%), and liver (95.41%). Genetic information improved the predictions in general (<italic>P</italic>&#60;.001) based on a Wilcoxon signed-rank test [<xref ref-type="bibr" rid="ref58">58</xref>], specifically for thyroid gland cancer (<italic>P</italic>=.03), ovary cancer (<italic>P</italic>=.03), connective and other soft tissue cancer (<italic>P</italic>=.03), liver cancer (<italic>P</italic>=.03), and colon cancer (<italic>P</italic>=.03).</p>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>Prediction performance for 9 cancer types.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="780"/>
            <col width="110"/>
            <col width="110"/>
            <thead>
              <tr valign="top">
                <td>Cancer (ICD-9<sup>a</sup> code)</td>
                <td colspan="2">AUROC<sup>b</sup> (%)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>DML<sup>c</sup></td>
                <td>DML+G<sup>d</sup></td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Malignant neoplasm of thyroid gland (193)</td>
                <td>99.55</td>
                <td>99.80</td>
              </tr>
              <tr valign="top">
                <td>Malignant neoplasm of prostate (185)</td>
                <td>98.43</td>
                <td>99.76</td>
              </tr>
              <tr valign="top">
                <td>Malignant neoplasm of breast (female), unspecified (174.9)</td>
                <td>96.80</td>
                <td>98.53</td>
              </tr>
              <tr valign="top">
                <td>Malignant neoplasm of ovary (183)</td>
                <td>95.73</td>
                <td>98.29</td>
              </tr>
              <tr valign="top">
                <td>Malignant neoplasm of connective and other soft tissue, site unspecified (171.9)</td>
                <td>82.39</td>
                <td>96.05</td>
              </tr>
              <tr valign="top">
                <td>Malignant neoplasm of liver, primary (155)</td>
                <td>91.39</td>
                <td>95.41</td>
              </tr>
              <tr valign="top">
                <td>Malignant neoplasm of pancreas, part unspecified (157.9)</td>
                <td>91.07</td>
                <td>95.41</td>
              </tr>
              <tr valign="top">
                <td>Malignant neoplasm of bronchus and lung, unspecified (162.9)</td>
                <td>90.61</td>
                <td>93.24</td>
              </tr>
              <tr valign="top">
                <td>Malignant neoplasm of colon, unspecified site (153.9)</td>
                <td>79.88</td>
                <td>92.56</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table4fn1">
              <p><sup>a</sup>ICD-9: International Statistical Classification of Diseases, ninth revision.</p>
            </fn>
            <fn id="table4fn2">
              <p><sup>b</sup>AUROC: area under the receiver operating characteristic curve.</p>
            </fn>
            <fn id="table4fn3">
              <p><sup>c</sup>DML: diagnosis, medication, and lab test.</p>
            </fn>
            <fn id="table4fn4">
              <p><sup>d</sup>DML+G: diagnosis, medication, lab test, and genetic information.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Feature Contributions for Each Cancer Prediction</title>
        <p>Our analysis examines the feature contribution based on SHAP values [<xref ref-type="bibr" rid="ref59">59</xref>] for the cancer prediction and selects the top 5 features interpretable for each cancer (<xref rid="figure3" ref-type="fig">Figure 3</xref>). Frequent common features are lab tests (11/17); cancer antigen 19-9 in serum or plasma (2.03%), carbohydrate antigen 19-9, S (1.76%), and cancer antigen 125 in serum or plasma by immunoassay (2.59%) are the most common features across all the cancer types. These lab tests are considered to be predictive biomarkers for prognosis and chemotherapeutic effect for carcinomas [<xref ref-type="bibr" rid="ref60">60</xref>-<xref ref-type="bibr" rid="ref63">63</xref>]. Two genes—KRAS proto-oncogene, GTPase homolog (<italic>KRAS</italic>) (1.46%) and adenoma polyposis coli regulator of WNT signaling pathway (<italic>APC</italic>) (1.60%)—contribute the most to cancer predictions. <italic>KRAS</italic> is the most commonly mutated oncogene in human cancers. The sustained expression and signaling of <italic>KRAS</italic> result in the progression of many cancers, thus making it a high-priority target in clinical therapeutic implications [<xref ref-type="bibr" rid="ref64">64</xref>]. <italic>APC</italic> participates in a cytoplasmic complex and its mutation triggers negatively regulating canonical WNT signaling. <italic>APC</italic> counteracts proliferation, facilitates apoptosis, and suppresses tumor progression, thus APC-deficient tumors drive colorectal and gastric cancers [<xref ref-type="bibr" rid="ref65">65</xref>,<xref ref-type="bibr" rid="ref66">66</xref>].</p>
        <p>Lab tests testosterone (2.49%) and prostate-specific antigen in serum or plasma (2.29%) were found to be the major contributors to prostate cancer prediction. Evidence supports the androgen hypothesis, where prostate cancer development and progression are related to androgens. These findings drive the studies to explore the correlation between testosterone and prostate cancer development and progression [<xref ref-type="bibr" rid="ref67">67</xref>,<xref ref-type="bibr" rid="ref68">68</xref>]. For thyroid gland cancer prediction, thyroglobulin antibody in serum or plasma by immunoassay (2.69%), thyroglobulin in serum or plasma (0.58%), T4 (thyroxine) (0.62%), and gene telomerase reverse transcriptase (<italic>TERT</italic>) (SHAP value 0.59%) were found to be the major contributors. Associations between autoimmune thyroiditis and thyroid cancer have been documented [<xref ref-type="bibr" rid="ref69">69</xref>] in studies where thyroid autoimmunity was assessed by measuring thyroglobulin antibody and thyroid peroxidase antibody [<xref ref-type="bibr" rid="ref70">70</xref>,<xref ref-type="bibr" rid="ref71">71</xref>]. Thyroglobulin in serum also plays a key role in the surveillance of patients with differentiated thyroid cancer [<xref ref-type="bibr" rid="ref72">72</xref>]. <italic>TERT</italic> promoter mutations have been found to be strongly associated with different pathological types of thyroid cancers and are considered biomarkers for the preoperative diagnosis and prognosis of thyroid cancers [<xref ref-type="bibr" rid="ref73">73</xref>]. Cancer antigen 15-3 in serum or plasma (1.57%) and cancer antigen 15-3 (CA 15-3) S (0.98%) lab tests are the major contributors to breast cancer prediction. Cancer antigen 15-3 is a protein made by a variety of cells, particularly breast cancer cells, and the cancer antigen 15-3 test is a biomarker test used to monitor breast cancer [<xref ref-type="bibr" rid="ref74">74</xref>]. In addition, the cancer markers alpha-fetoprotein, tumor marker, S (0.78%) and epidermal growth factor receptor (EGFR) (1.56%) were found to be the main contributors for the prediction of cancers of the liver [<xref ref-type="bibr" rid="ref75">75</xref>] and bronchus and lung [<xref ref-type="bibr" rid="ref76">76</xref>]. In our study, sex appears to be the major contributor to prediction of cancers of the breast (0.76%), prostate (0.92%), and ovary (1.16%).</p>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Top 5 features contributing to cancer prediction.</p>
          </caption>
          <graphic xlink:href="medinform_v9i5e23586_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Time Effect of Cancer Prediction</title>
        <p><xref ref-type="table" rid="table5">Table 5</xref> shows predictions based on different resources with different combinations of time-dependent (diagnosis, medication, and lab test) features (AUPRC: Table S4, <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Among the 7 models, the diagnosis and lab test model was the best (average AUROC 90.31%). In general, prediction performance decreases as the time prior to the formal diagnosis increases. For example, the average performance was reduced from 92.37% to 77.18% from 0 months to 24 months in advance, with an average decrease of 3.04%. <xref ref-type="table" rid="table5">Table 5</xref> also demonstrates the performance of the model (ie, diagnosis, medication, lab test, and genetic information) based on genetic information (AUROC 91.38% at 24 months in advance, an improvement of +11.38% over diagnosis, medication, and lab test). The difference between the two increases as time increases (eg, from 1.06% for 0 months to 11.38% for 24 months), which suggests the importance of genetic testing at early stages.</p>
        <table-wrap position="float" id="table5">
          <label>Table 5</label>
          <caption>
            <p>Prediction performance (AUROC) 0 months to 24 months in advance.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="120"/>
            <col width="110"/>
            <col width="110"/>
            <col width="110"/>
            <col width="110"/>
            <col width="110"/>
            <col width="110"/>
            <col width="110"/>
            <col width="110"/>
            <thead>
              <tr valign="top">
                <td>Months</td>
                <td colspan="8">Feature type</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>DML+G<sup>a</sup></td>
                <td>Diagnosis, medication, and lab test</td>
                <td>Diagnosis and lab test</td>
                <td>Diagnosis and medication</td>
                <td>Medication and lab test</td>
                <td>Diagnosis</td>
                <td>Medication</td>
                <td>Lab test</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>AUROC<sup>b</sup> (%)</td>
                <td>AUROC (%)</td>
                <td>AUROC (%)</td>
                <td>AUROC (%)</td>
                <td>AUROC (%)</td>
                <td>AUROC (%)</td>
                <td>AUROC (%)</td>
                <td>AUROC (%)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>0</td>
                <td>99.43</td>
                <td>98.36</td>
                <td>98.41</td>
                <td>97.89</td>
                <td>88.67</td>
                <td>97.90</td>
                <td>70.39</td>
                <td>87.93</td>
              </tr>
              <tr valign="top">
                <td>1</td>
                <td>98.08</td>
                <td>95.62</td>
                <td>95.51</td>
                <td>94.31</td>
                <td>86.83</td>
                <td>94.53</td>
                <td>71.01</td>
                <td>86.67</td>
              </tr>
              <tr valign="top">
                <td>3</td>
                <td>96.52</td>
                <td>93.16</td>
                <td>93.22</td>
                <td>90.74</td>
                <td>84.85</td>
                <td>91.20</td>
                <td>69.36</td>
                <td>84.18</td>
              </tr>
              <tr valign="top">
                <td>6</td>
                <td>95.21</td>
                <td>89.69</td>
                <td>89.91</td>
                <td>85.53</td>
                <td>83.09</td>
                <td>85.26</td>
                <td>68.12</td>
                <td>83.38</td>
              </tr>
              <tr valign="top">
                <td>12</td>
                <td>93.17</td>
                <td>84.39</td>
                <td>84.60</td>
                <td>78.20</td>
                <td>80.56</td>
                <td>78.21</td>
                <td>66.76</td>
                <td>79.99</td>
              </tr>
              <tr valign="top">
                <td>24</td>
                <td>91.38</td>
                <td>80.01</td>
                <td>80.20</td>
                <td>71.81</td>
                <td>77.73</td>
                <td>71.71</td>
                <td>66.22</td>
                <td>78.35</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table5fn1">
              <p><sup>a</sup>DML+G: diagnosis, medication, lab test, and genetic information.</p>
            </fn>
            <fn id="table5fn2">
              <p><sup>b</sup>AUROC: area under the receiver operating characteristic curve.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Prediction of Patients With Cancer of Unknown Primary</title>
        <p>In spite of the challenge in identifying patients with cancer of unknown primary in the clinical setting, hybrid features—the diagnosis, medication, lab test, and genetic information model—outperformed the diagnosis, medication, and lab test model (AUPRC: Table S5, <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>), and bag of features+Node2vec outperformed the bag of features and Node2vec in most cases. <xref ref-type="table" rid="table6">Table 6</xref> shows promising prediction results for 4 cancers, especially for breast (AUROC 92.31%) and connective and other soft tissue (AUROC 92.31%). Cancers of the liver and lung have the largest number of patients (24/43) and also achieved satisfactory predictions (AUROCs 88.21% and 85.51%). We also note that the proposed method performed suboptimally in predicting cancer of the colon (AUROC 52.56%). Prediction of the prostate, thyroid gland, and colon cancers had better results for the bag of features+Node2vec model with diagnosis, medication, and lab test features and for the bag of features or Node2vec model with diagnosis, medication, lab test, and genetic information features (Table S6, <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>), suggesting a more flexible strategy of model adaptation for the prediction of cancer of unknown primary in practice.</p>
        <table-wrap position="float" id="table6">
          <label>Table 6</label>
          <caption>
            <p>AUROC (%) of prediction for 9 cancer types.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="660"/>
            <col width="100"/>
            <col width="150"/>
            <col width="0"/>
            <col width="90"/>
            <thead>
              <tr valign="top">
                <td>Cancer (ICD-9<sup>a</sup> code)</td>
                <td colspan="3"> AUROC<sup>b</sup> (%)</td>
                <td>Patients, n</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>DML<sup>c</sup></td>
                <td>DML+G<sup>d</sup></td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Malignant neoplasm of breast (female), unspecified (174.9)</td>
                <td>83.97</td>
                <td>92.31</td>
                <td colspan="2">4</td>
              </tr>
              <tr valign="top">
                <td>Malignant neoplasm of connective and other soft tissue, site unspecified (171.9)</td>
                <td>53.21</td>
                <td>92.31</td>
                <td colspan="2">4</td>
              </tr>
              <tr valign="top">
                <td>Malignant neoplasm of liver, primary (155)</td>
                <td>84.10</td>
                <td>88.21</td>
                <td colspan="2">13</td>
              </tr>
              <tr valign="top">
                <td>Malignant neoplasm of bronchus and lung, unspecified (162.9)</td>
                <td>74.43</td>
                <td>85.51</td>
                <td colspan="2">11</td>
              </tr>
              <tr valign="top">
                <td>Malignant neoplasm of ovary (183)</td>
                <td>65.85</td>
                <td>80.49</td>
                <td colspan="2">2</td>
              </tr>
              <tr valign="top">
                <td>Malignant neoplasm of prostate (185)</td>
                <td>91.67</td>
                <td>79.17</td>
                <td colspan="2">3</td>
              </tr>
              <tr valign="top">
                <td>Malignant neoplasm of thyroid gland (193)</td>
                <td>90.24</td>
                <td>75.61</td>
                <td colspan="2">2</td>
              </tr>
              <tr valign="top">
                <td>Malignant neoplasm of colon, unspecified site (153.9)</td>
                <td>64.74</td>
                <td>52.56</td>
                <td colspan="2">4</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table6fn1">
              <p><sup>a</sup>ICD-9: International Statistical Classification of Diseases, ninth revision.</p>
            </fn>
            <fn id="table6fn2">
              <p><sup>b</sup>AUROC: area under the receiver operating characteristic curve.</p>
            </fn>
            <fn id="table6fn3">
              <p><sup>c</sup>DML: diagnosis, medication, and lab test.</p>
            </fn>
            <fn id="table6fn4">
              <p><sup>d</sup>DML+G: diagnosis, medication, lab test, and genetic information.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <p>It is recognized that both genetic and nongenetic factors may lead to the development of cancers, and they are, therefore, considered to be risk factors in the plethora of cancer prediction models based on statistical analysis; this leads to performance (eg, AUROC) ranging from 60% to 90% [<xref ref-type="bibr" rid="ref77">77</xref>]. For example, the variables of high DNA load of high-risk human papillomavirus, age, marital status, smoking status, and age at sexual debut are the critical factors for achieving an AUROC of 90% in the prediction of cervical intraepithelial neoplasia grade 2 or worse [<xref ref-type="bibr" rid="ref78">78</xref>]. A DNA methylation marker–based method achieved an AUROC of 93% in the detection of preinvasive neoplasia and cervical cancer [<xref ref-type="bibr" rid="ref79">79</xref>]. Computational methods (eg, machine learning and deep learning) have been adapted to provide solutions for cancer prediction challenges in a controlled environment (eg, UCI Machine Learning Repository [<xref ref-type="bibr" rid="ref80">80</xref>]). For example, linear support vector machines achieved an AUROC of 96.7% [<xref ref-type="bibr" rid="ref81">81</xref>] and a k-nearest neighbors classifier achieved an accuracy of 99.28% [<xref ref-type="bibr" rid="ref82">82</xref>] for breast cancer prediction.</p>
      <p>Public genetic expression databases (eg, The Cancer Genome Atlas) are frequently used to train diverse deep learning models. A convolutional neural network–based model achieved accuracies of 93.9% to 95.0% in the prediction of 34 cancer types [<xref ref-type="bibr" rid="ref83">83</xref>]. For lung, stomach, and breast cancer, AUROCs of 99.5%, 97.1%, and 95.0%, respectively, were achieved by a stacked sparse auto-encoder–based classification model [<xref ref-type="bibr" rid="ref84">84</xref>]. Prostate cancer prediction achieved an AUROC of 95.5% with a genetic algorithm–optimized artificial neural network [<xref ref-type="bibr" rid="ref85">85</xref>]. Accuracies of 95.3% for breast cancer, 57.9% for leukemia, and 84.9% for colon cancer were achieved by a sample expansion–based 1D convolutional neural network [<xref ref-type="bibr" rid="ref86">86</xref>].</p>
      <p>Electronic health records are utilized in cancer prediction. DeepPatient has proposed a novel unsupervised feature learning method based on autoencoders for disease prediction [<xref ref-type="bibr" rid="ref87">87</xref>]. The overall AUROC was 77.3%, where AUROCs of 88.7% for cancer of rectum and anus, 88.6% for cancer of the liver and intrahepatic bile duct, and 85.9% for cancer of the prostate were predicted with a time interval of 12 months. Multiple studies have utilized electronic health record data to predict specific cancers, where AUROCs of 88.1% for lung cancer [<xref ref-type="bibr" rid="ref88">88</xref>], 64.8% for breast cancer [<xref ref-type="bibr" rid="ref89">89</xref>], and 85% for pancreatic cancer [<xref ref-type="bibr" rid="ref90">90</xref>] were achieved, and 85.7% precision and 60.0% recall were achieved for colorectal cancer [<xref ref-type="bibr" rid="ref91">91</xref>]. Our method achieved AUROC 96.56% in general and outperformed the state-of-the-art methods for most cancer types. Specifically, prediction results for prostate cancer (AUROC 99.8%), breast cancer (98.5%), liver cancer (95.4%), and pancreas cancer (95.4%) were better for our method.</p>
      <p>In this study, we designed and developed a network-based framework leveraging the FHIR resources and RDF for cancer prediction. Our contributions can be summarized as exploration of utilizing FHIR and RDF technology to provide a network-based representation for the prediction of patient health status, demonstrating the value of integrating the phenotypic and genetic features data sources to improve the accuracy and interpretability in cancer prediction models. To enable the standard representation of data, a FHIR-based representation was used as the core to support the network population and feature generation. It is one of the most popular clinical data standards and is widely used among modern electronic health record vendors and data providers, enabling the plug and play functionality of the proposed method to be used across the different institutions, and it provides the specification and tools to seamlessly convert to RDF format and support the efficient data communication based on the popular data exchanging formats, such as XML or JavaScript object notation.</p>
      <p>This study demonstrated a solution for the prediction of unknown cancer in clinical practice. Despite the value of this work, there are several limitations that should be addressed.</p>
      <p>First, the genetic alterations in the genetic reports provided in Foundation Medicine are all somatic mutations in tumors and are collected from somatic tissues. Thus, we could not differentiate the germline and somatic mutations in our model. The bias introduced to the system caused by a failure in capturing this difference weakens the findings of our study.</p>
      <p>Second, as most genetic tests are based on specimens collected from the biopsy or surgery, the best-performing (diagnosis, medication, lab test, and genetic information) model introduced in Task 5 might not be adaptable as some medical organizations have limited access to genetic information available for study. We, therefore, consider that it is more practical to learn a large amount of phenotypical information for cancer prediction with the full utilization of existing genetic information. On the other hand, as the costs of genetic testing are reduced, we believe that the genetic information will be increasingly used in prediction models for different tasks, which makes the proposed method a good reference as a pilot study.</p>
      <p>Third, within 81 patients who have been documented as having cancer of unknown primary (from genetic reports), we could identify specific cancer types for 43 patients based on the review of patients' diagnostic report for task 6. We understand that the limited data set used might affect result analysis, which is a limitation of this experiment. We also noticed that the proposed method performs differently in task 6, especially with some notable failures. Such failures indicate the patterns of the value distribution for the features learned in the training data are not the same as the patterns in the cancer of unknown primary. The cancer of unknown primary source is not considered a single type of cancer and is known to spread at the early stage without causing phenotypical symptoms at the origin site [<xref ref-type="bibr" rid="ref92">92</xref>]. As such, the proposed model is affected in Task 5 accordingly.</p>
      <p>Fourth, our experiment demonstrates the performance of the proposed method based on data collected over a varying timeline. Data were used in isolation to train classification models, ignoring the continuous changing of the measurable values of phenotypes (eg, lab tests) during cancer progression. The introduction of deep learning models, such as recurrent neural networks [<xref ref-type="bibr" rid="ref93">93</xref>] and long short-term memory [<xref ref-type="bibr" rid="ref94">94</xref>], which are capable of processing time-series data, may potentially improve predictions.</p>
      <p>Fifth, cancers related to the same genetic alteration (eg, both colorectal and gastric cancers are related to the <italic>APC</italic> gene) inspire us to explore the potential of considering dependent phenotypes of the genetic alteration. With the utilization of phenotype and genotype dependence based on the ontology structure, a more sophisticated method can be designed to empower the prediction. In the future, we plan to reach out to other institutions to apply our method both with and without genetic information on diverse electronic health record systems. We consider it is necessary to adopt other medical data standards, such as Observational Health Data Sciences and Informatics Common Data Model [<xref ref-type="bibr" rid="ref95">95</xref>], to cover the diversity. We are aware that there are some challenging issues in genetic data modeling with relational databases, such as how to anonymize and aggregate genomic data. We believe that the research community will develop solutions for handling these challenging issues. We will incorporate such developments into our framework as part of future work to better support these requirements. The data process and cancer prediction tools of this study are publicly available [<xref ref-type="bibr" rid="ref96">96</xref>].</p>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Supplementary tables.</p>
        <media xlink:href="medinform_v9i5e23586_app1.xlsx" xlink:title="XLSX File  (Microsoft Excel File), 16 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AUPRC</term>
          <def>
            <p>area under the precision–recall curve</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">AUROC</term>
          <def>
            <p>area under the receiver operating characteristic curve</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">ICD</term>
          <def>
            <p>International Statistical Classification of Diseases</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">FHIR</term>
          <def>
            <p>Fast Healthcare Interoperability Resources</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">RDF</term>
          <def>
            <p>Resource Description Framework</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">ReLU</term>
          <def>
            <p>rectified linear unit</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This work was supported by funding from Genentech Research Fund in Individualized Medicine, National Institutes of Health, National Institute of General Medical Sciences (K99GM135488), Big Data to Knowledge (U01HG009450), and FHIRCat (R56EB028101).</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="web">
          <article-title>Cancer</article-title>
          <source>World Health Organization</source>
          <year>2018</year>
          <access-date>2021-05-11</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.who.int/news-room/fact-sheets/detail/cancer">https://www.who.int/news-room/fact-sheets/detail/cancer</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Islami</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>KD</given-names>
            </name>
            <name name-style="western">
              <surname>Jemal</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Cancer burden in the United States—a review</article-title>
          <source>Ann Cancer Epidemiol</source>
          <year>2018</year>
          <volume>1</volume>
          <fpage>1</fpage>
          <lpage>1</lpage>
          <pub-id pub-id-type="doi">10.21037/ace.2018.08.02</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="web">
          <article-title>Leading causes of death</article-title>
          <source>Centers for Disease Control and Prevention</source>
          <year>2017</year>
          <access-date>2021-05-11</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cdc.gov/nchs/fastats/leading-causes-of-death.htm">https://www.cdc.gov/nchs/fastats/leading-causes-of-death.htm</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="web">
          <article-title>Cancer statistics</article-title>
          <source>National Cancer Institute</source>
          <year>2020</year>
          <access-date>2021-05-11</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cancer.gov/about-cancer/understanding/statistics">https://www.cancer.gov/about-cancer/understanding/statistics</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Clarke</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hass</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Meyers</surname>
              <given-names>RA</given-names>
            </name>
          </person-group>
          <article-title>Cancer stem cells</article-title>
          <source>Reviews in Cell Biology and Molecular Medicine</source>
          <year>2004</year>
          <publisher-loc>Weinheim</publisher-loc>
          <publisher-name>Wiley‐VCH Verlag GmbH &#38; Co KGaA</publisher-name>
          <fpage>221</fpage>
          <lpage>241</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Blackadar</surname>
              <given-names>CB</given-names>
            </name>
          </person-group>
          <article-title>Historical review of the causes of cancer</article-title>
          <source>World J Clin Oncol</source>
          <year>2016</year>
          <month>02</month>
          <day>10</day>
          <volume>7</volume>
          <issue>1</issue>
          <fpage>54</fpage>
          <lpage>86</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.wjgnet.com/2218-4333/full/v7/i1/54.htm"/>
          </comment>
          <pub-id pub-id-type="doi">10.5306/wjco.v7.i1.54</pub-id>
          <pub-id pub-id-type="medline">26862491</pub-id>
          <pub-id pub-id-type="pmcid">PMC4734938</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Walsh</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Cadoo</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Salo-Mullen</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Dubard-Gault</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Stadler</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Offit</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Genetic factors: hereditary cancer predisposition syndromes</article-title>
          <source>Abeloff's Clinical Oncology</source>
          <year>2020</year>
          <publisher-loc>Amsterdam, Netherlands</publisher-loc>
          <publisher-name>Elsevier</publisher-name>
          <fpage>180</fpage>
          <lpage>208</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Garber</surname>
              <given-names>JE</given-names>
            </name>
            <name name-style="western">
              <surname>Offit</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Hereditary cancer predisposition syndromes</article-title>
          <source>J Clin Oncol</source>
          <year>2005</year>
          <month>01</month>
          <day>10</day>
          <volume>23</volume>
          <issue>2</issue>
          <fpage>276</fpage>
          <lpage>92</lpage>
          <pub-id pub-id-type="doi">10.1200/JCO.2005.10.042</pub-id>
          <pub-id pub-id-type="medline">15637391</pub-id>
          <pub-id pub-id-type="pii">23/2/276</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nagy</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Sweet</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Eng</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Highly penetrant hereditary cancer syndromes</article-title>
          <source>Oncogene</source>
          <year>2004</year>
          <month>08</month>
          <day>23</day>
          <volume>23</volume>
          <issue>38</issue>
          <fpage>6445</fpage>
          <lpage>70</lpage>
          <pub-id pub-id-type="doi">10.1038/sj.onc.1207714</pub-id>
          <pub-id pub-id-type="medline">15322516</pub-id>
          <pub-id pub-id-type="pii">1207714</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Friedman</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Letai</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Fisher</surname>
              <given-names>DE</given-names>
            </name>
            <name name-style="western">
              <surname>Flaherty</surname>
              <given-names>KT</given-names>
            </name>
          </person-group>
          <article-title>Precision medicine for cancer with next-generation functional diagnostics</article-title>
          <source>Nat Rev Cancer</source>
          <year>2015</year>
          <month>12</month>
          <volume>15</volume>
          <issue>12</issue>
          <fpage>747</fpage>
          <lpage>56</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/26536825"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/nrc4015</pub-id>
          <pub-id pub-id-type="medline">26536825</pub-id>
          <pub-id pub-id-type="pii">nrc4015</pub-id>
          <pub-id pub-id-type="pmcid">PMC4970460</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nath</surname>
              <given-names>AS</given-names>
            </name>
            <name name-style="western">
              <surname>Pal</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mukhopadhyay</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Mondal</surname>
              <given-names>KC</given-names>
            </name>
          </person-group>
          <article-title>A survey on cancer prediction and detection with data analysis</article-title>
          <source>Innovations Syst Softw Eng</source>
          <year>2019</year>
          <month>08</month>
          <day>22</day>
          <volume>16</volume>
          <issue>3-4</issue>
          <fpage>231</fpage>
          <lpage>243</lpage>
          <pub-id pub-id-type="doi">10.1007/s11334-019-00350-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="web">
          <article-title>Cancer survival in England: national estimates for patients followed up to 2017</article-title>
          <source>Office for National Statistics</source>
          <access-date>2021-05-11</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.ons.gov.uk/releases/cancersurvivalinenglandadultstageatdiagnosisandchildhoodpatientsfollowedupto2017">https://www.ons.gov.uk/releases/cancersurvivalinenglandadultstageatdiagnosisandchildhoodpatientsfollowedupto2017</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hawkes</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Cancer survival data emphasise importance of early diagnosis</article-title>
          <source>BMJ</source>
          <year>2019</year>
          <month>01</month>
          <day>25</day>
          <volume>364</volume>
          <fpage>l408</fpage>
          <pub-id pub-id-type="doi">10.1136/bmj.l408</pub-id>
          <pub-id pub-id-type="medline">30683652</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="web">
          <article-title>Tests for cancer of unknown primary</article-title>
          <source>American Cancer Society</source>
          <access-date>2021-05-11</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cancer.org/cancer/cancer-unknown-primary/detection-diagnosis-staging/how-diagnosed.html">https://www.cancer.org/cancer/cancer-unknown-primary/detection-diagnosis-staging/how-diagnosed.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Losa</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Soler</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Casado</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Estival</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Fernández</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Giménez</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Longo</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Pazo-Cid</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Salgado</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Seguí</surname>
              <given-names>MÁ</given-names>
            </name>
          </person-group>
          <article-title>SEOM clinical guideline on unknown primary cancer (2017)</article-title>
          <source>Clin Transl Oncol</source>
          <year>2018</year>
          <month>01</month>
          <volume>20</volume>
          <issue>1</issue>
          <fpage>89</fpage>
          <lpage>96</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29230692"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s12094-017-1807-y</pub-id>
          <pub-id pub-id-type="medline">29230692</pub-id>
          <pub-id pub-id-type="pii">10.1007/s12094-017-1807-y</pub-id>
          <pub-id pub-id-type="pmcid">PMC5785607</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cowie</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Blomster</surname>
              <given-names>JI</given-names>
            </name>
            <name name-style="western">
              <surname>Curtis</surname>
              <given-names>LH</given-names>
            </name>
            <name name-style="western">
              <surname>Duclaux</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ford</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Fritz</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Goldman</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Janmohamed</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kreuzer</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Leenay</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Michel</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ong</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Pell</surname>
              <given-names>JP</given-names>
            </name>
            <name name-style="western">
              <surname>Southworth</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Stough</surname>
              <given-names>WG</given-names>
            </name>
            <name name-style="western">
              <surname>Thoenes</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Zannad</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Zalewski</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Electronic health records to facilitate clinical research</article-title>
          <source>Clin Res Cardiol</source>
          <year>2017</year>
          <month>01</month>
          <volume>106</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/27557678"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s00392-016-1025-6</pub-id>
          <pub-id pub-id-type="medline">27557678</pub-id>
          <pub-id pub-id-type="pii">10.1007/s00392-016-1025-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC5226988</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Denaxas</surname>
              <given-names>SC</given-names>
            </name>
            <name name-style="western">
              <surname>Morley</surname>
              <given-names>KI</given-names>
            </name>
          </person-group>
          <article-title>Big biomedical data and cardiovascular disease research: opportunities and challenges</article-title>
          <source>Eur Heart J Qual Care Clin Outcomes</source>
          <year>2015</year>
          <month>07</month>
          <day>01</day>
          <volume>1</volume>
          <issue>1</issue>
          <fpage>9</fpage>
          <lpage>16</lpage>
          <pub-id pub-id-type="doi">10.1093/ehjqcco/qcv005</pub-id>
          <pub-id pub-id-type="medline">29474568</pub-id>
          <pub-id pub-id-type="pii">1860292</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhi</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Dong</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Dong</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Artificial intelligence in healthcare: past, present and future</article-title>
          <source>Stroke Vasc Neurol</source>
          <year>2017</year>
          <month>12</month>
          <volume>2</volume>
          <issue>4</issue>
          <fpage>230</fpage>
          <lpage>243</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29507784"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/svn-2017-000101</pub-id>
          <pub-id pub-id-type="medline">29507784</pub-id>
          <pub-id pub-id-type="pii">svn-2017-000101</pub-id>
          <pub-id pub-id-type="pmcid">PMC5829945</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rajkomar</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Oren</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Dai</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Hajaj</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Hardt</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Marcus</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Sundberg</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Yee</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Flores</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Duggan</surname>
              <given-names>GE</given-names>
            </name>
            <name name-style="western">
              <surname>Irvine</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Le</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Litsch</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Mossin</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Tansuwan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Wexler</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wilson</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ludwig</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Volchenboum</surname>
              <given-names>SL</given-names>
            </name>
            <name name-style="western">
              <surname>Chou</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Pearson</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Madabushi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>NH</given-names>
            </name>
            <name name-style="western">
              <surname>Butte</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Howell</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Cui</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Corrado</surname>
              <given-names>GS</given-names>
            </name>
            <name name-style="western">
              <surname>Dean</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Scalable and accurate deep learning with electronic health records</article-title>
          <source>NPJ Digit Med</source>
          <year>2018</year>
          <volume>1</volume>
          <fpage>18</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41746-018-0029-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41746-018-0029-1</pub-id>
          <pub-id pub-id-type="medline">31304302</pub-id>
          <pub-id pub-id-type="pii">29</pub-id>
          <pub-id pub-id-type="pmcid">PMC6550175</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Prince</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <source>Computer Vision: Models, Learning, and Inference</source>
          <year>2012</year>
          <publisher-loc>Cambridge, UK</publisher-loc>
          <publisher-name>Cambridge University Press</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zong</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>RSN</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wen</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Drug-target prediction utilizing heterogeneous bio-linked network embeddings</article-title>
          <source>Brief Bioinform</source>
          <year>2021</year>
          <month>01</month>
          <day>18</day>
          <volume>22</volume>
          <issue>1</issue>
          <fpage>568</fpage>
          <lpage>580</lpage>
          <pub-id pub-id-type="doi">10.1093/bib/bbz147</pub-id>
          <pub-id pub-id-type="medline">31885036</pub-id>
          <pub-id pub-id-type="pii">5681788</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pai</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bader</surname>
              <given-names>GD</given-names>
            </name>
          </person-group>
          <article-title>Patient similarity networks for precision medicine</article-title>
          <source>J Mol Biol</source>
          <year>2018</year>
          <month>09</month>
          <day>14</day>
          <volume>430</volume>
          <issue>18 Pt A</issue>
          <fpage>2924</fpage>
          <lpage>2938</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0022-2836(18)30532-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jmb.2018.05.037</pub-id>
          <pub-id pub-id-type="medline">29860027</pub-id>
          <pub-id pub-id-type="pii">S0022-2836(18)30532-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC6097926</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bender</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Sartipi</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>HL7 FHIR: an Agile and RESTful approach to healthcare information exchange</article-title>
          <source>Proceedings of the 26th IEEE international symposium on computer-based medical systems</source>
          <year>2013</year>
          <conf-name>IEEE international symposium on computer-based medical systems</conf-name>
          <conf-date>June 20-22</conf-date>
          <conf-loc>Porto, Portugal</conf-loc>
          <pub-id pub-id-type="doi">10.1109/cbms.2013.6627810</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Grover</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Leskovec</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>node2vec: scalable feature learning for networks</article-title>
          <source>KDD</source>
          <year>2016</year>
          <month>08</month>
          <volume>2016</volume>
          <fpage>855</fpage>
          <lpage>864</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/27853626"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/2939672.2939754</pub-id>
          <pub-id pub-id-type="medline">27853626</pub-id>
          <pub-id pub-id-type="pmcid">PMC5108654</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mandel</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Kreda</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Mandl</surname>
              <given-names>KD</given-names>
            </name>
            <name name-style="western">
              <surname>Kohane</surname>
              <given-names>IS</given-names>
            </name>
            <name name-style="western">
              <surname>Ramoni</surname>
              <given-names>RB</given-names>
            </name>
          </person-group>
          <article-title>SMART on FHIR: a standards-based, interoperable apps platform for electronic health records</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2016</year>
          <month>02</month>
          <day>17</day>
          <volume>23</volume>
          <issue>5</issue>
          <fpage>899</fpage>
          <lpage>908</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://jamia.oxfordjournals.org/cgi/pmidlookup?view=long&#38;pmid=26911829"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocv189</pub-id>
          <pub-id pub-id-type="medline">26911829</pub-id>
          <pub-id pub-id-type="pii">ocv189</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Donnelly</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>SNOMED-CT: The advanced terminology and coding system for eHealth</article-title>
          <source>Stud Health Technol Inform</source>
          <year>2006</year>
          <volume>121</volume>
          <fpage>279</fpage>
          <lpage>90</lpage>
          <pub-id pub-id-type="medline">17095826</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>McDonald</surname>
              <given-names>CJ</given-names>
            </name>
            <name name-style="western">
              <surname>Huff</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Suico</surname>
              <given-names>JG</given-names>
            </name>
            <name name-style="western">
              <surname>Hill</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Leavelle</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Aller</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Forrey</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mercer</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>DeMoor</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Hook</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Case</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Maloney</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>LOINC, a universal standard for identifying laboratory observations: a 5-year update</article-title>
          <source>Clin Chem</source>
          <year>2003</year>
          <month>04</month>
          <volume>49</volume>
          <issue>4</issue>
          <fpage>624</fpage>
          <lpage>33</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.clinchem.org/cgi/pmidlookup?view=long&#38;pmid=12651816"/>
          </comment>
          <pub-id pub-id-type="medline">12651816</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="web">
          <article-title>International Statistical Classification of Diseases and Related Health Problems (ICD)</article-title>
          <source>World Health Organization</source>
          <access-date>2021-05-11</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.who.int/classifications/icd/en/">http://www.who.int/classifications/icd/en/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Decker</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Melnik</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>van Harmelen</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Fensel</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Klein</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Broekstra</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Erdmann</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Horrocks</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>The Semantic Web: the roles of XML and RDF</article-title>
          <source>IEEE Internet Comput</source>
          <year>2000</year>
          <volume>4</volume>
          <issue>5</issue>
          <fpage>63</fpage>
          <lpage>73</lpage>
          <pub-id pub-id-type="doi">10.1109/4236.877487</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kaggal</surname>
              <given-names>VC</given-names>
            </name>
            <name name-style="western">
              <surname>Elayavilli</surname>
              <given-names>RK</given-names>
            </name>
            <name name-style="western">
              <surname>Mehrabi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Pankratz</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Sohn</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Rastegar</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Murphy</surname>
              <given-names>SP</given-names>
            </name>
            <name name-style="western">
              <surname>Ross</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Chaudhry</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Buntrock</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Toward a learning health-care system - knowledge delivery at the point of care empowered by big data and NLP</article-title>
          <source>Biomed Inform Insights</source>
          <year>2016</year>
          <volume>8</volume>
          <issue>Suppl 1</issue>
          <fpage>13</fpage>
          <lpage>22</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/27385912"/>
          </comment>
          <pub-id pub-id-type="doi">10.4137/BII.S37977</pub-id>
          <pub-id pub-id-type="medline">27385912</pub-id>
          <pub-id pub-id-type="pii">bii-suppl.1-2016-013</pub-id>
          <pub-id pub-id-type="pmcid">PMC4920204</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Slee</surname>
              <given-names>VN</given-names>
            </name>
          </person-group>
          <article-title>The international classification of diseases: ninth revision (ICD-9)</article-title>
          <source>Ann Intern Med</source>
          <year>1978</year>
          <month>03</month>
          <day>01</day>
          <volume>88</volume>
          <issue>3</issue>
          <fpage>424</fpage>
          <pub-id pub-id-type="doi">10.7326/0003-4819-88-3-424</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Moore</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Ganesan</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Nelson</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>RxNorm: prescription for electronic drug information exchange</article-title>
          <source>IT Prof</source>
          <year>2005</year>
          <month>09</month>
          <volume>7</volume>
          <issue>5</issue>
          <fpage>17</fpage>
          <lpage>23</lpage>
          <pub-id pub-id-type="doi">10.1109/mitp.2005.122</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hong</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Wen</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Sohn</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Developing a scalable FHIR-based clinical data normalization pipeline for standardizing and integrating unstructured and structured electronic health record data</article-title>
          <source>JAMIA Open</source>
          <year>2019</year>
          <month>12</month>
          <volume>2</volume>
          <issue>4</issue>
          <fpage>570</fpage>
          <lpage>579</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32025655"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamiaopen/ooz056</pub-id>
          <pub-id pub-id-type="medline">32025655</pub-id>
          <pub-id pub-id-type="pii">ooz056</pub-id>
          <pub-id pub-id-type="pmcid">PMC6993992</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Savova</surname>
              <given-names>GK</given-names>
            </name>
            <name name-style="western">
              <surname>Masanz</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Ogren</surname>
              <given-names>PV</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Sohn</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kipper-Schuler</surname>
              <given-names>KC</given-names>
            </name>
            <name name-style="western">
              <surname>Chute</surname>
              <given-names>CG</given-names>
            </name>
          </person-group>
          <article-title>Mayo clinical Text Analysis and Knowledge Extraction System (cTAKES): architecture, component evaluation and applications</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2010</year>
          <volume>17</volume>
          <issue>5</issue>
          <fpage>507</fpage>
          <lpage>13</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://jamia.oxfordjournals.org/lookup/pmidlookup?view=long&#38;pmid=20819853"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/jamia.2009.001560</pub-id>
          <pub-id pub-id-type="medline">20819853</pub-id>
          <pub-id pub-id-type="pii">17/5/507</pub-id>
          <pub-id pub-id-type="pmcid">PMC2995668</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sohn</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Clark</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Halgrim</surname>
              <given-names>SR</given-names>
            </name>
            <name name-style="western">
              <surname>Murphy</surname>
              <given-names>SP</given-names>
            </name>
            <name name-style="western">
              <surname>Chute</surname>
              <given-names>CG</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>MedXN: an open source medication extraction and normalization tool for clinical text</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2014</year>
          <volume>21</volume>
          <issue>5</issue>
          <fpage>858</fpage>
          <lpage>65</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/24637954"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/amiajnl-2013-002190</pub-id>
          <pub-id pub-id-type="medline">24637954</pub-id>
          <pub-id pub-id-type="pii">amiajnl-2013-002190</pub-id>
          <pub-id pub-id-type="pmcid">PMC4147619</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Brown</surname>
              <given-names>RA</given-names>
            </name>
          </person-group>
          <article-title>MedTime: a temporal information extraction system for clinical narratives</article-title>
          <source>J Biomed Inform</source>
          <year>2013</year>
          <month>12</month>
          <volume>46 Suppl</volume>
          <fpage>S20</fpage>
          <lpage>S28</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(13)00113-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2013.07.012</pub-id>
          <pub-id pub-id-type="medline">23911344</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(13)00113-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zong</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Sharma</surname>
              <given-names>DK</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Egan</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Davila</surname>
              <given-names>JI</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Developing a FHIR-based framework for phenome wide association studies: a case study with a pan-cancer cohort</article-title>
          <source>AMIA Jt Summits Transl Sci Proc</source>
          <year>2020</year>
          <volume>2020</volume>
          <fpage>750</fpage>
          <lpage>759</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32477698"/>
          </comment>
          <pub-id pub-id-type="medline">32477698</pub-id>
          <pub-id pub-id-type="pmcid">PMC7233075</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>O'Hara</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Draper</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Introduction to the bag of features paradigm for image classification and retrieval</article-title>
          <source>arXiv. Preprint posted online on January 17,</source>
          <year>2011</year>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liaw</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Wiener</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Classification and regression by randomForest</article-title>
          <source>R news</source>
          <year>2002</year>
          <volume>2</volume>
          <issue>3</issue>
          <fpage>18</fpage>
          <lpage>22</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.r-project.org/doc/Rnews/Rnews_2002-3.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Naive Bayes classification algorithm based on small sample set</article-title>
          <year>2011</year>
          <conf-name>IEEE International Conference on Cloud Computing and Intelligence Systems</conf-name>
          <conf-date>September 15-17</conf-date>
          <conf-loc>Beijing, China</conf-loc>
          <pub-id pub-id-type="doi">10.1109/ccis.2011.6045027</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>STC</given-names>
            </name>
          </person-group>
          <article-title>Cancer classification and prediction using logistic regression with Bayesian gene selection</article-title>
          <source>J Biomed Inform</source>
          <year>2004</year>
          <month>08</month>
          <volume>37</volume>
          <issue>4</issue>
          <fpage>249</fpage>
          <lpage>59</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(04)00077-2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2004.07.009</pub-id>
          <pub-id pub-id-type="medline">15465478</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(04)00077-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Noble</surname>
              <given-names>WS</given-names>
            </name>
          </person-group>
          <article-title>What is a support vector machine?</article-title>
          <source>Nat Biotechnol</source>
          <year>2006</year>
          <month>12</month>
          <volume>24</volume>
          <issue>12</issue>
          <fpage>1565</fpage>
          <lpage>7</lpage>
          <pub-id pub-id-type="doi">10.1038/nbt1206-1565</pub-id>
          <pub-id pub-id-type="medline">17160063</pub-id>
          <pub-id pub-id-type="pii">nbt1206-1565</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zeng</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Alsaadi</surname>
              <given-names>FE</given-names>
            </name>
          </person-group>
          <article-title>A survey of deep neural network architectures and their applications</article-title>
          <source>Neurocomputing</source>
          <year>2017</year>
          <month>04</month>
          <volume>234</volume>
          <fpage>11</fpage>
          <lpage>26</lpage>
          <pub-id pub-id-type="doi">10.1016/j.neucom.2016.12.038</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lawrence</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Giles</surname>
              <given-names>CL</given-names>
            </name>
            <name name-style="western">
              <surname>Tsoi</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>Back</surname>
              <given-names>AD</given-names>
            </name>
          </person-group>
          <article-title>Face recognition: a convolutional neural-network approach</article-title>
          <source>IEEE Trans Neural Netw</source>
          <year>1997</year>
          <volume>8</volume>
          <issue>1</issue>
          <fpage>98</fpage>
          <lpage>113</lpage>
          <pub-id pub-id-type="doi">10.1109/72.554195</pub-id>
          <pub-id pub-id-type="medline">18255614</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kipf</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Welling</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Semi-supervised classification with graph convolutional networks</article-title>
          <source>arXiv. Preprint posted online on February 22,</source>
          <year>2017</year>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/pdf/1609.02907.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Azhagusundari</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Thanamani</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Feature selection based on information gain</article-title>
          <source>Int J Innov Technol Explor Eng</source>
          <year>2013</year>
          <volume>2</volume>
          <issue>2</issue>
          <fpage>18</fpage>
          <lpage>21</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.ijitee.org/wp-content/uploads/papers/v2i2/B0352012213.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="web">
          <article-title>node2vec</article-title>
          <source>GitHub</source>
          <access-date>2021-05-11</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/aditya-grover/node2vec">https://github.com/aditya-grover/node2vec</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <collab>Machine Learning Group</collab>
          </person-group>
          <article-title>LIBLINEAR -- a library for large linear classification</article-title>
          <source>National Taiwan University</source>
          <access-date>2021-05-11</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.csie.ntu.edu.tw/~cjlin/liblinear/">https://www.csie.ntu.edu.tw/~cjlin/liblinear/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="web">
          <article-title>Weka</article-title>
          <source>The University of Waikato</source>
          <access-date>2021-05-10</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cs.waikato.ac.nz/ml/weka/">https://www.cs.waikato.ac.nz/ml/weka/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>C-C</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>C-J</given-names>
            </name>
          </person-group>
          <article-title>LIBSVM -- a library for support vector machines</article-title>
          <source>National Taiwan University</source>
          <access-date>2021-05-10</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.csie.ntu.edu.tw/~cjlin/libsvm/">https://www.csie.ntu.edu.tw/~cjlin/libsvm/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="web">
          <article-title>Keras API reference</article-title>
          <source>Keras</source>
          <access-date>2021-05-10</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://keras.io/api/">https://keras.io/api/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="web">
          <article-title>spektral</article-title>
          <source>GitHub</source>
          <access-date>2021-05-10</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/danielegrattarola/spektral">https://github.com/danielegrattarola/spektral</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Davis</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Goadrich</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>The relationship between precision-recall and ROC curves</article-title>
          <source>Proceedings of the 23rd International Conference on Machine Learning</source>
          <year>2006</year>
          <conf-name>23rd International Conference on Machine Learning</conf-name>
          <conf-date>June 25-29</conf-date>
          <conf-loc>Pittsburgh, Pennsylvania</conf-loc>
          <fpage>233</fpage>
          <lpage>240</lpage>
          <pub-id pub-id-type="doi">10.1145/1143844.1143874</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nguyen</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Bouzerdoum</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Phung</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Yin</surname>
              <given-names>P-Y</given-names>
            </name>
          </person-group>
          <article-title>Learning pattern classification tasks with imbalanced data sets</article-title>
          <source>Pattern Recognition</source>
          <year>2009</year>
          <publisher-loc>London, United Kingdom</publisher-loc>
          <publisher-name>InTech Open</publisher-name>
          <fpage>193</fpage>
          <lpage>208</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jeni</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Cohn</surname>
              <given-names>JF</given-names>
            </name>
            <name name-style="western">
              <surname>De La Torre</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Facing imbalanced data recommendations for the use of performance metrics</article-title>
          <source>Int Conf Affect Comput Intell Interact Workshops</source>
          <year>2013</year>
          <volume>2013</volume>
          <fpage>245</fpage>
          <lpage>251</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/25574450"/>
          </comment>
          <pub-id pub-id-type="doi">10.1109/ACII.2013.47</pub-id>
          <pub-id pub-id-type="medline">25574450</pub-id>
          <pub-id pub-id-type="pmcid">PMC4285355</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="web">
          <article-title>Roc</article-title>
          <source>GitHub</source>
          <access-date>2021-05-10</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/kboyd/Roc">https://github.com/kboyd/Roc</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Holmes</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Donkin</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Witten</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>WEKA: a machine learning workbench</article-title>
          <year>1994</year>
          <conf-name>Second Australian and New Zealand Conference on Intelligent Information Systems</conf-name>
          <conf-date>November 29-December 2</conf-date>
          <conf-loc>Brisbane</conf-loc>
          <pub-id pub-id-type="doi">10.1109/anziis.1994.396988</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Woolson</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>D'Agostino</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Massaro</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Sullivan</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Wilcoxon signed-rank test</article-title>
          <source>Wiley Encyclopedia of Clinical Trials</source>
          <year>2007</year>
          <publisher-loc>Hoboken, New Jersey</publisher-loc>
          <publisher-name>John Wiley &#38; Sons, Inc</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref59">
        <label>59</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lundberg</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>S-I</given-names>
            </name>
          </person-group>
          <article-title>A unified approach to interpreting model predictions</article-title>
          <year>2017</year>
          <conf-name>Advances in Neural Information Processing Systems 30</conf-name>
          <conf-date>December 4-9</conf-date>
          <conf-loc>Long Beach, California</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref60">
        <label>60</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Deng</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ning</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Bai</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Ba</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Clinical use of tumor biomarkers in prediction for prognosis and chemotherapeutic effect in esophageal squamous cell carcinoma</article-title>
          <source>BMC Cancer</source>
          <year>2019</year>
          <month>05</month>
          <day>31</day>
          <volume>19</volume>
          <issue>1</issue>
          <fpage>526</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmccancer.biomedcentral.com/articles/10.1186/s12885-019-5755-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12885-019-5755-5</pub-id>
          <pub-id pub-id-type="medline">31151431</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12885-019-5755-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC6544972</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref61">
        <label>61</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Scarà</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bottoni</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Scatena</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>CA 19-9: biochemical and clinical aspects</article-title>
          <source>Adv Exp Med Biol</source>
          <year>2015</year>
          <volume>867</volume>
          <fpage>247</fpage>
          <lpage>60</lpage>
          <pub-id pub-id-type="doi">10.1007/978-94-017-7215-0_15</pub-id>
          <pub-id pub-id-type="medline">26530370</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref62">
        <label>62</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Høgdall</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Cancer antigen 125 and prognosis</article-title>
          <source>Curr Opin Obstet Gynecol</source>
          <year>2008</year>
          <month>02</month>
          <volume>20</volume>
          <issue>1</issue>
          <fpage>4</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.1097/GCO.0b013e3282f2b124</pub-id>
          <pub-id pub-id-type="medline">18196998</pub-id>
          <pub-id pub-id-type="pii">00001703-200802000-00003</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref63">
        <label>63</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Prognostic role of serum carbohydrate antigen 19-9 levels in patients with resectable hepatocellular carcinoma</article-title>
          <source>Tumour Biol</source>
          <year>2015</year>
          <month>04</month>
          <volume>36</volume>
          <issue>4</issue>
          <fpage>2257</fpage>
          <lpage>61</lpage>
          <pub-id pub-id-type="doi">10.1007/s13277-014-2435-6</pub-id>
          <pub-id pub-id-type="medline">25787748</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref64">
        <label>64</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Xiao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Xiao</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Cheng</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>KRAS: a promising therapeutic target for cancer treatment</article-title>
          <source>Curr Top Med Chem</source>
          <year>2019</year>
          <volume>19</volume>
          <issue>23</issue>
          <fpage>2081</fpage>
          <lpage>2097</lpage>
          <pub-id pub-id-type="doi">10.2174/1568026619666190905164144</pub-id>
          <pub-id pub-id-type="medline">31486755</pub-id>
          <pub-id pub-id-type="pii">CTMC-EPUB-100667</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref65">
        <label>65</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hankey</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Frankel</surname>
              <given-names>WL</given-names>
            </name>
            <name name-style="western">
              <surname>Groden</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Functions of the APC tumor suppressor protein dependent and independent of canonical WNT signaling: implications for therapeutic targeting</article-title>
          <source>Cancer Metastasis Rev</source>
          <year>2018</year>
          <month>03</month>
          <volume>37</volume>
          <issue>1</issue>
          <fpage>159</fpage>
          <lpage>172</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29318445"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s10555-017-9725-6</pub-id>
          <pub-id pub-id-type="medline">29318445</pub-id>
          <pub-id pub-id-type="pii">10.1007/s10555-017-9725-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC5803335</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref66">
        <label>66</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Du</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>High expression of APC is an unfavorable prognostic biomarker in T4 gastric cancer patients</article-title>
          <source>World J Gastroenterol</source>
          <year>2019</year>
          <month>08</month>
          <day>21</day>
          <volume>25</volume>
          <issue>31</issue>
          <fpage>4452</fpage>
          <lpage>4467</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.wjgnet.com/1007-9327/full/v25/i31/4452.htm"/>
          </comment>
          <pub-id pub-id-type="doi">10.3748/wjg.v25.i31.4452</pub-id>
          <pub-id pub-id-type="medline">31496624</pub-id>
          <pub-id pub-id-type="pmcid">PMC6710185</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref67">
        <label>67</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yassin</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>AlRumaihi</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Alzubaidi</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Alkadhi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Al Ansari</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Testosterone, testosterone therapy and prostate cancer</article-title>
          <source>Aging Male</source>
          <year>2019</year>
          <month>12</month>
          <volume>22</volume>
          <issue>4</issue>
          <fpage>219</fpage>
          <lpage>227</lpage>
          <pub-id pub-id-type="doi">10.1080/13685538.2018.1524456</pub-id>
          <pub-id pub-id-type="medline">30614347</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref68">
        <label>68</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Michaud</surname>
              <given-names>JE</given-names>
            </name>
            <name name-style="western">
              <surname>Billups</surname>
              <given-names>KL</given-names>
            </name>
            <name name-style="western">
              <surname>Partin</surname>
              <given-names>AW</given-names>
            </name>
          </person-group>
          <article-title>Testosterone and prostate cancer: an evidence-based review of pathogenesis and oncologic risk</article-title>
          <source>Ther Adv Urol</source>
          <year>2015</year>
          <month>12</month>
          <volume>7</volume>
          <issue>6</issue>
          <fpage>378</fpage>
          <lpage>87</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://journals.sagepub.com/doi/10.1177/1756287215597633?url_ver=Z39.88-2003&#38;rfr_id=ori:rid:crossref.org&#38;rfr_dat=cr_pub%3dpubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/1756287215597633</pub-id>
          <pub-id pub-id-type="medline">26622322</pub-id>
          <pub-id pub-id-type="pii">10.1177_1756287215597633</pub-id>
          <pub-id pub-id-type="pmcid">PMC4647137</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref69">
        <label>69</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hershman</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>Falling levels of thyroglobulin antibody after treatment for DTC predict no structural recurrence</article-title>
          <source>Clin Thyroidol</source>
          <year>2016</year>
          <month>03</month>
          <volume>28</volume>
          <issue>3</issue>
          <fpage>79</fpage>
          <lpage>81</lpage>
          <pub-id pub-id-type="doi">10.1089/ct.2016;28.79-81</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref70">
        <label>70</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Peiris</surname>
              <given-names>AN</given-names>
            </name>
            <name name-style="western">
              <surname>Medlock</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Gavin</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Thyroglobulin for monitoring for thyroid cancer recurrence</article-title>
          <source>JAMA</source>
          <year>2019</year>
          <month>03</month>
          <day>26</day>
          <volume>321</volume>
          <issue>12</issue>
          <fpage>1228</fpage>
          <pub-id pub-id-type="doi">10.1001/jama.2019.0803</pub-id>
          <pub-id pub-id-type="medline">30912839</pub-id>
          <pub-id pub-id-type="pii">2728926</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref71">
        <label>71</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>ES</given-names>
            </name>
            <name name-style="western">
              <surname>Lim</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Baek</surname>
              <given-names>KH</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>MK</given-names>
            </name>
            <name name-style="western">
              <surname>Kwon</surname>
              <given-names>HS</given-names>
            </name>
            <name name-style="western">
              <surname>Song</surname>
              <given-names>KH</given-names>
            </name>
            <name name-style="western">
              <surname>Kang</surname>
              <given-names>MI</given-names>
            </name>
            <name name-style="western">
              <surname>Cha</surname>
              <given-names>BY</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>KW</given-names>
            </name>
            <name name-style="western">
              <surname>Son</surname>
              <given-names>HY</given-names>
            </name>
          </person-group>
          <article-title>Thyroglobulin antibody is associated with increased cancer risk in thyroid nodules</article-title>
          <source>Thyroid</source>
          <year>2010</year>
          <month>08</month>
          <volume>20</volume>
          <issue>8</issue>
          <fpage>885</fpage>
          <lpage>91</lpage>
          <pub-id pub-id-type="doi">10.1089/thy.2009.0384</pub-id>
          <pub-id pub-id-type="medline">20465529</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref72">
        <label>72</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Santhanam</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Ladenson</surname>
              <given-names>PW</given-names>
            </name>
          </person-group>
          <article-title>Surveillance for differentiated thyroid cancer recurrence</article-title>
          <source>Endocrinol Metab Clin North Am</source>
          <year>2019</year>
          <month>03</month>
          <volume>48</volume>
          <issue>1</issue>
          <fpage>239</fpage>
          <lpage>252</lpage>
          <pub-id pub-id-type="doi">10.1016/j.ecl.2018.11.008</pub-id>
          <pub-id pub-id-type="medline">30717906</pub-id>
          <pub-id pub-id-type="pii">S0889-8529(18)30595-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref73">
        <label>73</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jin</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>The role of TERT promoter mutations in postoperative and preoperative diagnosis and prognosis in thyroid cancer</article-title>
          <source>Medicine (Baltimore)</source>
          <year>2018</year>
          <month>07</month>
          <volume>97</volume>
          <issue>29</issue>
          <fpage>e11548</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1097/MD.0000000000011548"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/MD.0000000000011548</pub-id>
          <pub-id pub-id-type="medline">30024548</pub-id>
          <pub-id pub-id-type="pii">00005792-201807200-00055</pub-id>
          <pub-id pub-id-type="pmcid">PMC6086515</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref74">
        <label>74</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Dai</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Clinicopathological and prognostic significance of cancer antigen 15-3 and carcinoembryonic antigen in breast cancer: a meta-analysis including 12,993 patients</article-title>
          <source>Dis Markers</source>
          <year>2018</year>
          <volume>2018</volume>
          <fpage>9863092</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1155/2018/9863092"/>
          </comment>
          <pub-id pub-id-type="doi">10.1155/2018/9863092</pub-id>
          <pub-id pub-id-type="medline">29854028</pub-id>
          <pub-id pub-id-type="pmcid">PMC5954898</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref75">
        <label>75</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Xiang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Long</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Green</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Zimdahl</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Cheng</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Horan</surname>
              <given-names>LH</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Yan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Diaz</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Jin</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Nakano</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Morales</surname>
              <given-names>JF</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Staley</surname>
              <given-names>BK</given-names>
            </name>
            <name name-style="western">
              <surname>Priceman</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Brown</surname>
              <given-names>CE</given-names>
            </name>
            <name name-style="western">
              <surname>Forman</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Chan</surname>
              <given-names>VW</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Targeting alpha-fetoprotein (AFP)-MHC complex with CAR T-cell therapy for liver cancer</article-title>
          <source>Clin Cancer Res</source>
          <year>2017</year>
          <month>01</month>
          <day>15</day>
          <volume>23</volume>
          <issue>2</issue>
          <fpage>478</fpage>
          <lpage>488</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://clincancerres.aacrjournals.org/cgi/pmidlookup?view=long&#38;pmid=27535982"/>
          </comment>
          <pub-id pub-id-type="doi">10.1158/1078-0432.CCR-16-1203</pub-id>
          <pub-id pub-id-type="medline">27535982</pub-id>
          <pub-id pub-id-type="pii">1078-0432.CCR-16-1203</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref76">
        <label>76</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bethune</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Bethune</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Ridgway</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Epidermal growth factor receptor (EGFR) in lung cancer: an overview and update</article-title>
          <source>J Thorac Dis</source>
          <year>2010</year>
          <month>03</month>
          <volume>2</volume>
          <issue>1</issue>
          <fpage>48</fpage>
          <lpage>51</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/22263017"/>
          </comment>
          <pub-id pub-id-type="medline">22263017</pub-id>
          <pub-id pub-id-type="pmcid">PMC3256436</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref77">
        <label>77</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Widschwendter</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Evans</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Reisel</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Dillner</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Sundström</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Steyerberg</surname>
              <given-names>EW</given-names>
            </name>
            <name name-style="western">
              <surname>Vergouwe</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wegwarth</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Rebitschek</surname>
              <given-names>FG</given-names>
            </name>
            <name name-style="western">
              <surname>Siebert</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Sroczynski</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>de Beaufort</surname>
              <given-names>ID</given-names>
            </name>
            <name name-style="western">
              <surname>Bolt</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Cibula</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Zikan</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bjørge</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Colombo</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Harbeck</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Dudbridge</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Tasse</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Knoppers</surname>
              <given-names>BM</given-names>
            </name>
            <name name-style="western">
              <surname>Joly</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Teschendorff</surname>
              <given-names>AE</given-names>
            </name>
            <name name-style="western">
              <surname>Pashayan</surname>
              <given-names>N</given-names>
            </name>
            <collab>FORECEE (4C) Consortium</collab>
          </person-group>
          <article-title>Epigenome-based cancer risk prediction: rationale, opportunities and challenges</article-title>
          <source>Nat Rev Clin Oncol</source>
          <year>2018</year>
          <month>05</month>
          <volume>15</volume>
          <issue>5</issue>
          <fpage>292</fpage>
          <lpage>309</lpage>
          <pub-id pub-id-type="doi">10.1038/nrclinonc.2018.30</pub-id>
          <pub-id pub-id-type="medline">29485132</pub-id>
          <pub-id pub-id-type="pii">nrclinonc.2018.30</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref78">
        <label>78</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Tsai</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Hung</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Chan</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Lai</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Risk evaluation for the development of cervical intraepithelial neoplasia: development and validation of risk-scoring schemes</article-title>
          <source>Int J Cancer</source>
          <year>2015</year>
          <month>01</month>
          <day>15</day>
          <volume>136</volume>
          <issue>2</issue>
          <fpage>340</fpage>
          <lpage>349</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1002/ijc.28982"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/ijc.28982</pub-id>
          <pub-id pub-id-type="medline">24841989</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref79">
        <label>79</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Teschendorff</surname>
              <given-names>AE</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Fiegl</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Sargent</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Zhuang</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Kitchener</surname>
              <given-names>HC</given-names>
            </name>
            <name name-style="western">
              <surname>Widschwendter</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Epigenetic variability in cells of normal cytology is associated with the risk of future morphological transformation</article-title>
          <source>Genome Med</source>
          <year>2012</year>
          <month>03</month>
          <day>27</day>
          <volume>4</volume>
          <issue>3</issue>
          <fpage>24</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://genomemedicine.biomedcentral.com/articles/10.1186/gm323"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/gm323</pub-id>
          <pub-id pub-id-type="medline">22453031</pub-id>
          <pub-id pub-id-type="pii">gm323</pub-id>
          <pub-id pub-id-type="pmcid">PMC3446274</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref80">
        <label>80</label>
        <nlm-citation citation-type="web">
          <article-title>Machine learning repository</article-title>
          <source>UCI</source>
          <access-date>2021-05-14</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://archive.ics.uci.edu/ml/index.php">https://archive.ics.uci.edu/ml/index.php</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref81">
        <label>81</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Ke</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tsai</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>SVM and SVM ensembles in breast cancer prediction</article-title>
          <source>PLoS One</source>
          <year>2017</year>
          <volume>12</volume>
          <issue>1</issue>
          <fpage>e0161501</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0161501"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0161501</pub-id>
          <pub-id pub-id-type="medline">28060807</pub-id>
          <pub-id pub-id-type="pii">PONE-D-16-10440</pub-id>
          <pub-id pub-id-type="pmcid">PMC5217832</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref82">
        <label>82</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kumari</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Singh</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Breast cancer prediction system</article-title>
          <source>Procedia Computer Science</source>
          <year>2018</year>
          <volume>132</volume>
          <fpage>371</fpage>
          <lpage>376</lpage>
          <pub-id pub-id-type="doi">10.1016/j.procs.2018.05.197</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref83">
        <label>83</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mostavi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Chiu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Convolutional neural network models for cancer type prediction based on gene expression</article-title>
          <source>BMC Med Genomics</source>
          <year>2020</year>
          <month>04</month>
          <day>03</day>
          <volume>13</volume>
          <issue>Suppl 5</issue>
          <fpage>44</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedgenomics.biomedcentral.com/articles/10.1186/s12920-020-0677-2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12920-020-0677-2</pub-id>
          <pub-id pub-id-type="medline">32241303</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12920-020-0677-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC7119277</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref84">
        <label>84</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xiao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>A semi-supervised deep learning method based on stacked sparse auto-encoder for cancer prediction using RNA-seq data</article-title>
          <source>Comput Methods Programs Biomed</source>
          <year>2018</year>
          <month>11</month>
          <volume>166</volume>
          <fpage>99</fpage>
          <lpage>105</lpage>
          <pub-id pub-id-type="doi">10.1016/j.cmpb.2018.10.004</pub-id>
          <pub-id pub-id-type="medline">30415723</pub-id>
          <pub-id pub-id-type="pii">S0169-2607(18)30455-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref85">
        <label>85</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hou</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Bing</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Mo</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Liao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Horie</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lou</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>RankProd combined with genetic algorithm optimized artificial neural network establishes a diagnostic and prognostic prediction model that revealed C1QTNF3 as a biomarker for prostate cancer</article-title>
          <source>EBioMedicine</source>
          <year>2018</year>
          <month>06</month>
          <volume>32</volume>
          <fpage>234</fpage>
          <lpage>244</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2352-3964(18)30165-8"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ebiom.2018.05.010</pub-id>
          <pub-id pub-id-type="medline">29861410</pub-id>
          <pub-id pub-id-type="pii">S2352-3964(18)30165-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC6021271</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref86">
        <label>86</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Cheng</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Tumor gene expression data classification via sample expansion-based deep learning</article-title>
          <source>Oncotarget</source>
          <year>2017</year>
          <month>12</month>
          <day>12</day>
          <volume>8</volume>
          <issue>65</issue>
          <fpage>109646</fpage>
          <lpage>109660</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.oncotarget.com/lookup/doi/10.18632/oncotarget.22762"/>
          </comment>
          <pub-id pub-id-type="doi">10.18632/oncotarget.22762</pub-id>
          <pub-id pub-id-type="medline">29312636</pub-id>
          <pub-id pub-id-type="pii">22762</pub-id>
          <pub-id pub-id-type="pmcid">PMC5752549</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref87">
        <label>87</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Miotto</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Kidd</surname>
              <given-names>BA</given-names>
            </name>
            <name name-style="western">
              <surname>Dudley</surname>
              <given-names>JT</given-names>
            </name>
          </person-group>
          <article-title>Deep Patient: an unsupervised representation to predict the future of patients from the electronic health records</article-title>
          <source>Sci Rep</source>
          <year>2016</year>
          <month>05</month>
          <day>17</day>
          <volume>6</volume>
          <fpage>26094</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://paperpile.com/b/UsJJXQ/OwN0t"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/srep26094</pub-id>
          <pub-id pub-id-type="medline">27185194</pub-id>
          <pub-id pub-id-type="pii">srep26094</pub-id>
          <pub-id pub-id-type="pmcid">PMC4869115</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref88">
        <label>88</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Hao</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Liao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ye</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Xia</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>CH</given-names>
            </name>
            <name name-style="western">
              <surname>Duong</surname>
              <given-names>SQ</given-names>
            </name>
            <name name-style="western">
              <surname>Jin</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Alfreds</surname>
              <given-names>ST</given-names>
            </name>
            <name name-style="western">
              <surname>Stearns</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Kanov</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Sylvester</surname>
              <given-names>KG</given-names>
            </name>
            <name name-style="western">
              <surname>Widen</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>McElhinney</surname>
              <given-names>DB</given-names>
            </name>
            <name name-style="western">
              <surname>Ling</surname>
              <given-names>XB</given-names>
            </name>
          </person-group>
          <article-title>Prediction of the 1-year risk of incident lung cancer: prospective study using electronic health records from the State of Maine</article-title>
          <source>J Med Internet Res</source>
          <year>2019</year>
          <month>05</month>
          <day>16</day>
          <volume>21</volume>
          <issue>5</issue>
          <fpage>e13260</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2019/5/e13260/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/13260</pub-id>
          <pub-id pub-id-type="medline">31099339</pub-id>
          <pub-id pub-id-type="pii">v21i5e13260</pub-id>
          <pub-id pub-id-type="pmcid">PMC6542253</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref89">
        <label>89</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Burnside</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Cox</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Fan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Yuan</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Yin</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Breast cancer risk prediction using electronic health records</article-title>
          <year>2017</year>
          <conf-name>IEEE International Conference on Healthcare Informatics</conf-name>
          <conf-date>August 23-26</conf-date>
          <conf-loc>Park City, Utah</conf-loc>
          <pub-id pub-id-type="doi">10.1109/ichi.2017.62</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref90">
        <label>90</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Muhammad</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Hart</surname>
              <given-names>GR</given-names>
            </name>
            <name name-style="western">
              <surname>Nartowt</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Farrell</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Johung</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Liang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Deng</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Pancreatic cancer prediction through an artificial neural network</article-title>
          <source>Front Artif Intell</source>
          <year>2019</year>
          <month>5</month>
          <day>3</day>
          <volume>2</volume>
          <issue>2</issue>
          <fpage>1</fpage>
          <pub-id pub-id-type="doi">10.3389/frai.2019.00002</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref91">
        <label>91</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Kong</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>An early intestinal cancer prediction algorithm based on deep belief network</article-title>
          <source>Sci Rep</source>
          <year>2019</year>
          <month>11</month>
          <day>22</day>
          <volume>9</volume>
          <issue>1</issue>
          <fpage>17418</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41598-019-54031-2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-019-54031-2</pub-id>
          <pub-id pub-id-type="medline">31758076</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-019-54031-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC6874645</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref92">
        <label>92</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pavlidis</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Pentheroudakis</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Cancer of unknown primary site</article-title>
          <source>Lancet</source>
          <year>2012</year>
          <month>04</month>
          <day>14</day>
          <volume>379</volume>
          <issue>9824</issue>
          <fpage>1428</fpage>
          <lpage>35</lpage>
          <pub-id pub-id-type="doi">10.1016/S0140-6736(11)61178-1</pub-id>
          <pub-id pub-id-type="medline">22414598</pub-id>
          <pub-id pub-id-type="pii">S0140-6736(11)61178-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref93">
        <label>93</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mikolov</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Karafiát</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Burget</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Černocký</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Khudanpur</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Recurrent neural network based language model</article-title>
          <year>2010</year>
          <conf-name>Eleventh Annual Conference of the International Speech Communication Association</conf-name>
          <conf-date>September 26-30</conf-date>
          <conf-loc>Makuhari, Japan</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref94">
        <label>94</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gers</surname>
              <given-names>FA</given-names>
            </name>
            <name name-style="western">
              <surname>Schmidhuber</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Cummins</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Learning to forget: continual prediction with LSTM</article-title>
          <source>Neural Comput</source>
          <year>2000</year>
          <month>10</month>
          <volume>12</volume>
          <issue>10</issue>
          <fpage>2451</fpage>
          <lpage>71</lpage>
          <pub-id pub-id-type="doi">10.1162/089976600300015015</pub-id>
          <pub-id pub-id-type="medline">11032042</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref95">
        <label>95</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hripcsak</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Duke</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>NH</given-names>
            </name>
            <name name-style="western">
              <surname>Reich</surname>
              <given-names>CG</given-names>
            </name>
            <name name-style="western">
              <surname>Huser</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Schuemie</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Suchard</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>RW</given-names>
            </name>
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>ICK</given-names>
            </name>
            <name name-style="western">
              <surname>Rijnbeek</surname>
              <given-names>PR</given-names>
            </name>
            <name name-style="western">
              <surname>van der Lei</surname>
              <given-names>Johan</given-names>
            </name>
            <name name-style="western">
              <surname>Pratt</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Norén</surname>
              <given-names>G Niklas</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Stang</surname>
              <given-names>PE</given-names>
            </name>
            <name name-style="western">
              <surname>Madigan</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Ryan</surname>
              <given-names>PB</given-names>
            </name>
          </person-group>
          <article-title>Observational Health Data Sciences and Informatics (OHDSI): opportunities for observational researchers</article-title>
          <source>Stud Health Technol Inform</source>
          <year>2015</year>
          <volume>216</volume>
          <fpage>574</fpage>
          <lpage>8</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/26262116"/>
          </comment>
          <pub-id pub-id-type="medline">26262116</pub-id>
          <pub-id pub-id-type="pmcid">PMC4815923</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref96">
        <label>96</label>
        <nlm-citation citation-type="web">
          <article-title>cancer-prediction-on-fhir-rdf</article-title>
          <source>GitHub</source>
          <access-date>2021-05-10</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/fhircat/cancer-prediction-on-fhir-rdf">https://github.com/fhircat/cancer-prediction-on-fhir-rdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
