<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id>
      <journal-title>JMIR Medical Informatics</journal-title>
      <issn pub-type="epub">2291-9694</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v9i3e25635</article-id>
      <article-id pub-id-type="pmid">33646127</article-id>
      <article-id pub-id-type="doi">10.2196/25635</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Machine Learning Approach to Predict the Probability of Recurrence of Renal Cell Carcinoma After Surgery: Prediction Model Development Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Eysenbach</surname>
            <given-names>Gunther</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Zhang</surname>
            <given-names>Xiangzhou</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author">
          <name name-style="western">
            <surname>Kim</surname>
            <given-names>HyungMin</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2824-0535</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Lee</surname>
            <given-names>Sun Jung</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-1087-2051</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Park</surname>
            <given-names>So Jin</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-3449-7532</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Choi</surname>
            <given-names>In Young</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-2860-9411</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author" corresp="yes" equal-contrib="yes">
          <name name-style="western">
            <surname>Hong</surname>
            <given-names>Sung-Hoo</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <address>
            <institution>Department of Urology</institution>
            <institution>Seoul St. Mary’s Hospital</institution>
            <institution>College of Medicine, The Catholic University</institution>
            <addr-line>222, Banpo-daero, Seocho-gu</addr-line>
            <addr-line>Seoul</addr-line>
            <country>Republic of Korea</country>
            <phone>82 2 2258 6228</phone>
            <email>toomey@catholic.ac.kr</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-1952-4010</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Department of Medical Informatics</institution>
        <institution>College of Medicine</institution>
        <institution>The Catholic University</institution>
        <addr-line>Seoul</addr-line>
        <country>Republic of Korea</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Department of Biomedicine &#38; Health Sciences</institution>
        <institution>College of Medicine</institution>
        <institution>The Catholic University</institution>
        <addr-line>Seoul</addr-line>
        <country>Republic of Korea</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Department of Urology</institution>
        <institution>Seoul St. Mary’s Hospital</institution>
        <institution>College of Medicine, The Catholic University</institution>
        <addr-line>Seoul</addr-line>
        <country>Republic of Korea</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Sung-Hoo Hong <email>toomey@catholic.ac.kr</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>3</month>
        <year>2021</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>1</day>
        <month>3</month>
        <year>2021</year>
      </pub-date>
      <volume>9</volume>
      <issue>3</issue>
      <elocation-id>e25635</elocation-id>
      <history>
        <date date-type="received">
          <day>11</day>
          <month>12</month>
          <year>2020</year>
        </date>
        <date date-type="rev-request">
          <day>13</day>
          <month>1</month>
          <year>2021</year>
        </date>
        <date date-type="rev-recd">
          <day>23</day>
          <month>1</month>
          <year>2021</year>
        </date>
        <date date-type="accepted">
          <day>29</day>
          <month>1</month>
          <year>2021</year>
        </date>
      </history>
      <copyright-statement>©HyungMin Kim, Sun Jung Lee, So Jin Park, In Young Choi, Sung-Hoo Hong. Originally published in JMIR Medical Informatics (http://medinform.jmir.org), 01.03.2021.</copyright-statement>
      <copyright-year>2021</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on http://medinform.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://medinform.jmir.org/2021/3/e25635" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Renal cell carcinoma (RCC) has a high recurrence rate of 20% to 30% after nephrectomy for clinically localized disease, and more than 40% of patients eventually die of the disease, making regular monitoring and constant management of utmost importance.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>The objective of this study was to develop an algorithm that predicts the probability of recurrence of RCC within 5 and 10 years of surgery.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>Data from 6849 Korean patients with RCC were collected from eight tertiary care hospitals listed in the KOrean Renal Cell Carcinoma (KORCC) web-based database. To predict RCC recurrence, analytical data from 2814 patients were extracted from the database. Eight machine learning algorithms were used to predict the probability of RCC recurrence, and the results were compared.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Within 5 years of surgery, the highest area under the receiver operating characteristic curve (AUROC) was obtained from the naïve Bayes (NB) model, with a value of 0.836. Within 10 years of surgery, the highest AUROC was obtained from the NB model, with a value of 0.784.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>An algorithm was developed that predicts the probability of RCC recurrence within 5 and 10 years using the KORCC database, a large-scale RCC cohort in Korea. It is expected that the developed algorithm will help clinicians manage prognosis and establish customized treatment strategies for patients with RCC after surgery.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>renal cell carcinoma</kwd>
        <kwd>recurrence</kwd>
        <kwd>machine learning</kwd>
        <kwd>naïve Bayes</kwd>
        <kwd>algorithm</kwd>
        <kwd>cancer</kwd>
        <kwd>surgery</kwd>
        <kwd>web-based</kwd>
        <kwd>database</kwd>
        <kwd>prediction</kwd>
        <kwd>probability</kwd>
        <kwd>carcinoma</kwd>
        <kwd>kidney</kwd>
        <kwd>model</kwd>
        <kwd>development</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Renal cell carcinoma (RCC) accounts for 90% of malignant tumors in the kidney and is twice as common in men as in women [<xref ref-type="bibr" rid="ref1">1</xref>]. Kidney cancer, therefore, generally refers to RCC. It is the sixth most frequently diagnosed cancer in men and the 10th most frequently diagnosed cancer in women worldwide [<xref ref-type="bibr" rid="ref2">2</xref>]. According to the cancer statistics from the National Cancer Center, the number of new kidney cancer cases in Korea in 2017 was 5299, accounting for approximately 2.3% of the total of 232,255 cancer cases. Further, the incidence of kidney cancer per 100,000 people has been increasing since 1999 [<xref ref-type="bibr" rid="ref3">3</xref>]. RCC is one of the most lethal types of malignant tumors in urology, with approximately 20% to 30% of patients with RCC suffering from metastatic diseases, and more than 40% of patients eventually die of the disease [<xref ref-type="bibr" rid="ref4">4</xref>-<xref ref-type="bibr" rid="ref6">6</xref>]. The main treatment for RCC is radical nephrectomy; for small tumors, partial nephrectomy is performed to preserve kidney function [<xref ref-type="bibr" rid="ref7">7</xref>].</p>
      <p>RCC can be completely cured through full surgical resection if there is no evidence of preoperative metastatic disease. However, it has a high recurrence rate of 20% to 30% [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref9">9</xref>], and approximately 50% of recurrences occur within 2 years [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref10">10</xref>]. RCC recurrence is generally classified as early recurrence or late recurrence based on the 5-year threshold [<xref ref-type="bibr" rid="ref11">11</xref>]. Most recurrences occur during the early recurrence period (within 5 years) [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref12">12</xref>], whereas approximately 10% occur during the late recurrence period (after 5 years) [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref13">13</xref>].</p>
      <p>RCC is generally resistant to radiation and chemotherapy, making treatment of its recurrence difficult [<xref ref-type="bibr" rid="ref4">4</xref>]. Therefore, it is necessary to predict the probability of RCC recurrence so that risk factors can be managed in advance. The Memorial Sloan Kettering Cancer Center (MSKCC) in the United States developed a nomogram that predicts the probability of recurrence within 5 years using the symptoms and histology of 601 patients with kidney cancer who received surgical treatment in 2001 [<xref ref-type="bibr" rid="ref14">14</xref>]. Additionally, in 2005, a nomogram was developed to predict the recurrence probability within 5 years using the pathological stage, Fuhrman nuclear grade, tumor size, necrosis, vascular invasion, and clinical presentation variables of 701 patients with kidney cancer [<xref ref-type="bibr" rid="ref15">15</xref>]. Previous studies have used small-scale RCC cohorts from single institutions, and the data have included censored data, where the values of the observations were only partially known. If censored data are included, they can be applied in the Cox proportional hazards model, a standard statistical technique for modeling censored data, but they are difficult to apply to other machine learning (ML) techniques [<xref ref-type="bibr" rid="ref16">16</xref>].</p>
      <p>In this study, we used a multicenter, large-scale RCC cohort collected from eight tertiary care hospitals in Korea; we removed censored data and used only the fully observed data. ML focuses on building new predictive models by performing extensive searches on multiple models and parameters and then performing validation [<xref ref-type="bibr" rid="ref17">17</xref>]. The objective of this study was to develop an algorithm that could predict the recurrence probability of RCC after surgery within 5 and 10 years by applying eight representative ML algorithms to a large-scale Korean RCC cohort. Using the developed algorithm, clinicians can manage postoperative patient outcomes and establish personalized treatment strategies.</p>
    </sec>
    <sec sec-type="materials and methods">
      <title>Methods</title>
      <sec>
        <title>Study Population</title>
        <p>The data used in this study were obtained from a large-scale cohort of Korean patients with RCC assembled from the KOrean Renal Cell Carcinoma (KORCC) web-based database. It consisted of 206 variables, including demographic information such as age, height, and weight, as well as pathological information, including clinical stage, pathological stage, Fuhrman nuclear grade, and survival period [<xref ref-type="bibr" rid="ref18">18</xref>]. The study protocol was approved by the institutional review board of the Catholic University of Korea (IRB No. KC20ZIDI0966). The data of 6849 patients who participated in the KORCC study group as of July 1, 2015, were collected from eight tertiary hospitals.</p>
      </sec>
      <sec>
        <title>Variable Selection and Data Cleansing</title>
        <p>The <italic>t</italic> test for continuous variables and the chi-square test for categorical variables were used to explore variables that significantly affect recurrence. In both tests, variables with missing values were removed to ensure that the data used were complete and without missing values. At a significance level of <italic>P</italic>=.05, we first extracted 31 variables showing significant differences between the recurring and nonrecurring groups. Of the 31 variables extracted, 10 variables that had significant effects on recurrence in actual clinical trials were finally extracted based on the expert advice of a urologist. The final 10 selected variables were gender, age, BMI, smoking, pathological tumor stage, histological type, necrosis, lymphovascular invasion, capsular invasion, and Fuhrman nuclear grade.</p>
        <p>Several studies reported that age ≥60 years, Fuhrman nuclear grade ≥3, and pathological stage ≥pT2 were statistically associated with RCC recurrence [<xref ref-type="bibr" rid="ref19">19</xref>]. In addition, women had better prognoses after surgery than men [<xref ref-type="bibr" rid="ref20">20</xref>], and individuals with higher BMIs showed better prognoses than those with normal or lower BMIs [<xref ref-type="bibr" rid="ref21">21</xref>]. Furthermore, the prognoses of smokers were worse than those of nonsmokers [<xref ref-type="bibr" rid="ref22">22</xref>], and pathological variables such as histological type [<xref ref-type="bibr" rid="ref23">23</xref>], necrosis [<xref ref-type="bibr" rid="ref24">24</xref>], lymphovascular invasion [<xref ref-type="bibr" rid="ref11">11</xref>], and capsular invasion [<xref ref-type="bibr" rid="ref25">25</xref>] were all related to the recurrence of RCC.</p>
        <p>Next, we cleansed the data to present them in a form suitable for analysis. Of the 6849 patients, only 5281 patients who received surgical treatment were included in the analysis. Of those 5281 patients, 13 patients with recurrence after 10 years, 1079 lost to follow-up, and 1375 with missing values in 10 variables were excluded from the analysis. Finally, a subset of 2814 patients with values for 10 variables was available for analysis (<xref rid="figure1" ref-type="fig">Figure 1</xref>).</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Data generation process for analysis. KORCC: Korean Renal Cell Carcinoma.</p>
          </caption>
          <graphic xlink:href="medinform_v9i3e25635_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Dealing with the Imbalanced Data Set</title>
        <p>One of the most frequent problems in applying ML classification algorithms is data imbalance [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref27">27</xref>]. In the medical field, data asymmetry occurs between normal and abnormal classes because most patients are concentrated in the “normal” class, whereas relatively few—such as patients with cancer—are in the “abnormal” class. In this case, the ML algorithm attempts to improve the performance by predicting normal classes, in which most patients are concentrated, resulting in lower predictability of abnormal classes with small numbers of patients [<xref ref-type="bibr" rid="ref27">27</xref>]. However, from a research perspective, it is more important to predict abnormal classes; hence, it is necessary to deal with the imbalanced data.</p>
        <p>In this study, the synthetic minority oversampling technique (SMOTE) was applied to the training data set to solve the imbalance problem. SMOTE is an oversampling method that is widely used when ML is applied to data with high imbalance [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref29">29</xref>]. Before applying SMOTE, the ratio of patients in the recurrence group to patients in the nonrecurrence group in the training set was significantly asymmetrical—approximately 1:10; ML was applied after making the ratio of the two groups equal to 1:1 using SMOTE (<xref ref-type="table" rid="table1">Table 1</xref>). Because the volume of the data set was sufficiently large after SMOTE application, we verified the prediction model using the 20% hold-out validation method with the data partitioning of the training set and test set at 80:20 [<xref ref-type="bibr" rid="ref30">30</xref>].</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Distribution of data sets before and after synthetic minority oversampling technique application.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="80"/>
            <col width="210"/>
            <col width="250"/>
            <col width="0"/>
            <col width="210"/>
            <col width="250"/>
            <thead>
              <tr valign="top">
                <td rowspan="2">
                  <break/>
                </td>
                <td colspan="3">Training set (n=2251)</td>
                <td colspan="2">Test set (n=563)</td>
              </tr>
              <tr valign="top">
                <td>Recurrence group, n (%)</td>
                <td>Nonrecurrence group, n (%)</td>
                <td colspan="2">Recurrence group, n (%)</td>
                <td>Nonrecurrence group, n (%)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Before</td>
                <td>226 (10.04)</td>
                <td>2025 (89.96)</td>
                <td colspan="2">52 (9.24)</td>
                <td>511 (90.76)</td>
              </tr>
              <tr valign="top">
                <td>After</td>
                <td>2025 (50.00)</td>
                <td>2025 (50.00)</td>
                <td colspan="2">52 (9.24)</td>
                <td>511 (90.76)</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Statistical Analysis and ML Model Development</title>
        <p>In this study, we compared the performance of the following representative ML classification algorithms: kernel support vector machine (SVM) [<xref ref-type="bibr" rid="ref31">31</xref>], logistic regression [<xref ref-type="bibr" rid="ref32">32</xref>], decision tree [<xref ref-type="bibr" rid="ref33">33</xref>], k-nearest neighbor (KNN) [<xref ref-type="bibr" rid="ref34">34</xref>], naïve Bayes (NB) [<xref ref-type="bibr" rid="ref35">35</xref>], random forest [<xref ref-type="bibr" rid="ref36">36</xref>], AdaBoost [<xref ref-type="bibr" rid="ref36">36</xref>], and gradient boost [<xref ref-type="bibr" rid="ref37">37</xref>]. For each algorithm, we calculated four values: sensitivity, specificity, accuracy, and area under the receiver operating characteristic curve (AUROC). The algorithm with the highest performance was finally selected based on the AUROC value, which is one of the most important indicators for confirming the performance of a classification model [<xref ref-type="bibr" rid="ref38">38</xref>]. We used Python (version 3.7.6) for statistical analysis and algorithm development.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Characteristics and Distribution of Patients</title>
        <p>We compared the patient characteristics and distribution of each variable between the recurrence and nonrecurrence groups (<xref ref-type="table" rid="table2">Table 2</xref>).</p>
        <p>The mean age of patients in the recurrence group was higher than that of patients in the nonrecurrence group (58.4 years versus 55.4 years, respectively). The average BMIs of patients in the recurrence and nonrecurrence groups were 23.6 kg/m<sup>2</sup> and 24.7 kg/m<sup>2</sup>, respectively. The results show the same characteristics as those found in studies that have revealed better prognoses for obese patients [<xref ref-type="bibr" rid="ref21">21</xref>]. The proportion of smokers in the recurrence and nonrecurrence groups was 25.5% and 20.1%, respectively. The pathology stage—an important variable in predicting recurrence—showed that the proportion of patients with a pathological stage ≥pT2 was approximately 60.4% (168/278) in the recurrence group and 15.2% (386/2536) in the nonrecurrence group. Approximately 77.7% (216/278) of the patients in the recurrence group and 44.8% (1135/2536) of those in the nonrecurrence group had Fuhrman nuclear grades ≥3; thus, the recurrence group had higher Fuhrman nuclear grades. The distribution of each category of pathological variables is shown in <xref ref-type="table" rid="table2">Table 2</xref>.</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Baseline characteristics of patients (N=2814).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="330"/>
            <col width="0"/>
            <col width="290"/>
            <col width="0"/>
            <col width="350"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Variable</td>
                <td colspan="2">Recurrence group (n=278)</td>
                <td>Nonrecurrence group (n=2536)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="3">Age (years), mean (SD)</td>
                <td colspan="2">58.4 (11.9)</td>
                <td>55.4 (12.7)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">BMI (kg/m<sup>2</sup>), mean (SD)</td>
                <td colspan="2">23.6 (3.2)</td>
                <td>24.7 (3.3)</td>
              </tr>
              <tr valign="top">
                <td colspan="6">
                  <bold>Gender, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Male</td>
                <td colspan="2">212 (76.3)</td>
                <td colspan="2">1811 (71.4)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Female</td>
                <td colspan="2">66 (23.7)</td>
                <td colspan="2">725 (28.6)</td>
              </tr>
              <tr valign="top">
                <td colspan="6">
                  <bold>Smoking, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Nonsmoker</td>
                <td colspan="2">207 (74.5)</td>
                <td colspan="2">2026 (79.9)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Current smoker</td>
                <td colspan="2">71 (25.5)</td>
                <td colspan="2">510 (20.1)</td>
              </tr>
              <tr valign="top">
                <td colspan="6">
                  <bold>Pathological tumor stage, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>1a</td>
                <td colspan="2">50 (18.0)</td>
                <td colspan="2">1663 (65.6)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>1b</td>
                <td colspan="2">60 (21.6)</td>
                <td colspan="2">487 (19.2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>2a</td>
                <td colspan="2">30 (10.8)</td>
                <td colspan="2">106 (4.2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>2b</td>
                <td colspan="2">12 (4.3)</td>
                <td colspan="2">29 (1.1)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>3a</td>
                <td colspan="2">82 (29.5)</td>
                <td colspan="2">201 (7.9)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>3b</td>
                <td colspan="2">34 (12.2)</td>
                <td colspan="2">36 (1.4)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>3c</td>
                <td colspan="2">1 (0.4)</td>
                <td colspan="2">3 (0.1)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>4</td>
                <td colspan="2">9 (3.2)</td>
                <td colspan="2">11 (0.4)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Histologic type, n (%)</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Clear cell</td>
                <td colspan="2">242 (87.1)</td>
                <td colspan="2">2243 (88.4)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Papillary</td>
                <td colspan="2">14 (5.0)</td>
                <td colspan="2">44 (1.7)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Chromophobe</td>
                <td colspan="2">4 (1.4)</td>
                <td colspan="2">180 (7.1)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Collecting duct</td>
                <td colspan="2">5 (1.8)</td>
                <td colspan="2">4 (0.2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Unclassified</td>
                <td colspan="2">5 (1.8)</td>
                <td colspan="2">15 (0.6)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Multilocular cystic</td>
                <td colspan="2">0 (0.0)</td>
                <td colspan="2">19 (0.7)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Mixed</td>
                <td colspan="2">6 (2.2)</td>
                <td colspan="2">24 (0.9)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Xp11.2 translocation</td>
                <td colspan="2">1 (0.4)</td>
                <td colspan="2">3 (0.1)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Clear cell papillary</td>
                <td colspan="2">1 (0.4)</td>
                <td colspan="2">4 (0.2)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Necrosis, n (%)</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>No</td>
                <td colspan="2">143 (51.4)</td>
                <td colspan="2">2272 (89.6)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Microscopic</td>
                <td colspan="2">30 (10.8)</td>
                <td colspan="2">126 (5.0)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Macroscopic</td>
                <td colspan="2">105 (37.8)</td>
                <td colspan="2">138 (5.4)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Lymphovascular invasion, n (%)</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>No</td>
                <td colspan="2">200 (71.9)</td>
                <td colspan="2">2436 (96.1)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Yes</td>
                <td colspan="2">78 (28.1)</td>
                <td colspan="2">100 (3.9)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Capsular invasion, n (%)</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>No</td>
                <td colspan="2">148 (53.2)</td>
                <td colspan="2">2114 (83.4)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Yes</td>
                <td colspan="2">130 (46.8)</td>
                <td colspan="2">422 (16.6)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Fuhrman nuclear grade, n (%)</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>1</td>
                <td colspan="2">5 (1.8)</td>
                <td colspan="2">108 (4.3)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>2</td>
                <td colspan="2">57 (20.5)</td>
                <td colspan="2">1293 (51.0)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>3</td>
                <td colspan="2">141 (50.7)</td>
                <td colspan="2">1008 (39.7)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>4</td>
                <td colspan="2">75 (27.0)</td>
                <td colspan="2">127 (5.0)</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Prediction Model Performance</title>
        <p>We trained eight ML algorithms on the training data set and calculated the sensitivity, specificity, accuracy, and AUROC values using the test data set (<xref ref-type="table" rid="table3">Table 3</xref>). The NB algorithm showed higher performance than the other algorithms, with an AUROC of 0.836 within 5 years and 0.784 within 10 years. The NB approach calculates the conditional probability, which is the likelihood that a conclusion will be observed based on the evidence given [<xref ref-type="bibr" rid="ref35">35</xref>]. The NB algorithm is simple and fast [<xref ref-type="bibr" rid="ref39">39</xref>] and has proven effective in text classification and medical diagnosis [<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref41">41</xref>]. However, the NB approach has a limitation in that its prediction probability becomes zero when a new value that is not in the training data set is entered; Laplace smoothing is a means of solving this problem [<xref ref-type="bibr" rid="ref42">42</xref>]. The predictive model we developed also had a problem in that the probability value became zero when a new type of data that was not in the training data set was entered; hence, the algorithm was optimized by adjusting the α value—a parameter in Laplace smoothing (<xref ref-type="table" rid="table4">Table 4</xref>).</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Diagnostic performance of machine learning algorithms for the prediction of renal cell carcinoma recurrence.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="290"/>
            <col width="90"/>
            <col width="80"/>
            <col width="90"/>
            <col width="80"/>
            <col width="90"/>
            <col width="80"/>
            <col width="90"/>
            <col width="80"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Algorithm (parameter name) and parameter value (in 5 years, in 10 years)</td>
                <td colspan="2">Sensitivity</td>
                <td colspan="2">Specificity</td>
                <td colspan="2">Accuracy</td>
                <td colspan="2">AUROC<sup>a</sup></td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <break/>
                </td>
                <td>5-year</td>
                <td>10-year</td>
                <td>5-year</td>
                <td>10-year</td>
                <td>5-year</td>
                <td>10-year</td>
                <td>5-year</td>
                <td>10-year</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="2">Kernel SVM<sup>b,c</sup></td>
                <td>0.733</td>
                <td>0.673</td>
                <td>0.805</td>
                <td>0.853</td>
                <td>0.800</td>
                <td>0.837</td>
                <td>0.769</td>
                <td>0.763</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Logistic regression<sup>c</sup></td>
                <td>0.644</td>
                <td>0.692</td>
                <td>0.839</td>
                <td>0.816</td>
                <td>0.823</td>
                <td>0.805</td>
                <td>0.741</td>
                <td>0.754</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Decision tree<sup>c</sup></td>
                <td>0.533</td>
                <td>0.442</td>
                <td>0.866</td>
                <td>0.869</td>
                <td>0.839</td>
                <td>0.829</td>
                <td>0.700</td>
                <td>0.656</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>KNN<sup>d</sup> (n-neighbors)</bold>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>(100, 100)<sup>c</sup></td>
                <td>0.556</td>
                <td>0.519</td>
                <td>0.905</td>
                <td>0.898</td>
                <td>0.877</td>
                <td>0.863</td>
                <td>0.730</td>
                <td>0.709</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>(10, 10)</td>
                <td>0.467</td>
                <td>0.426</td>
                <td>0.947</td>
                <td>0.928</td>
                <td>0.909</td>
                <td>0.881</td>
                <td>0.707</td>
                <td>0.675</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>(50, 50)</td>
                <td>0.511</td>
                <td>0.461</td>
                <td>0.931</td>
                <td>0.922</td>
                <td>0.898</td>
                <td>0.879</td>
                <td>0.722</td>
                <td>0.692</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>(200, 200)</td>
                <td>0.556</td>
                <td>0.481</td>
                <td>0.899</td>
                <td>0.902</td>
                <td>0.871</td>
                <td>0.863</td>
                <td>0.727</td>
                <td>0.691</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>NB<sup>e</sup> (alpha)</bold>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>(10, 100)<sup>c</sup></td>
                <td>0.822</td>
                <td>0.731</td>
                <td>0.850</td>
                <td>0.828</td>
                <td>0.848</td>
                <td>0.819</td>
                <td>0.836</td>
                <td>0.784</td>
              </tr>
              <tr valign="top">
                <td colspan="2"><bold>Random forest (number of trees</bold>)</td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>(5, 5)<sup>c</sup></td>
                <td>0.578</td>
                <td>0.500</td>
                <td>0.858</td>
                <td>0.853</td>
                <td>0.835</td>
                <td>0.821</td>
                <td>0.718</td>
                <td>0.677</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>(10, 10)</td>
                <td>0.511</td>
                <td>0.423</td>
                <td>0.866</td>
                <td>0.861</td>
                <td>0.837</td>
                <td>0.821</td>
                <td>0.688</td>
                <td>0.642</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>(50, 50)</td>
                <td>0.511</td>
                <td>0.442</td>
                <td>0.875</td>
                <td>0.861</td>
                <td>0.846</td>
                <td>0.822</td>
                <td>0.693</td>
                <td>0.652</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>(100, 100)</td>
                <td>0.511</td>
                <td>0.462</td>
                <td>0.864</td>
                <td>0.861</td>
                <td>0.835</td>
                <td>0.824</td>
                <td>0.687</td>
                <td>0.661</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>AdaBoost (number of trees)</bold>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>(50, 200)<sup>c</sup></td>
                <td>0.733</td>
                <td>0.692</td>
                <td>0.815</td>
                <td>0.810</td>
                <td>0.809</td>
                <td>0.800</td>
                <td>0.774</td>
                <td>0.751</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>(10, 10)</td>
                <td>0.600</td>
                <td>0.577</td>
                <td>0.895</td>
                <td>0.845</td>
                <td>0.871</td>
                <td>0.821</td>
                <td>0.747</td>
                <td>0.711</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>(50, 50)</td>
                <td>0.733</td>
                <td>0.673</td>
                <td>0.815</td>
                <td>0.824</td>
                <td>0.809</td>
                <td>0.810</td>
                <td>0.774</td>
                <td>0.748</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>(100, 100)</td>
                <td>0.711</td>
                <td>0.692</td>
                <td>0.835</td>
                <td>0.802</td>
                <td>0.825</td>
                <td>0.792</td>
                <td>0.773</td>
                <td>0.747</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>(200, 200)</td>
                <td>0.711</td>
                <td>0.692</td>
                <td>0.837</td>
                <td>0.810</td>
                <td>0.826</td>
                <td>0.800</td>
                <td>0.774</td>
                <td>0.751</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Gradient boost (number of trees)</bold>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>(50, 100)<sup>c</sup></td>
                <td>0.688</td>
                <td>0.635</td>
                <td>0.819</td>
                <td>0.826</td>
                <td>0.809</td>
                <td>0.808</td>
                <td>0.754</td>
                <td>0.730</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>(10, 10)</td>
                <td>0.756</td>
                <td>0.596</td>
                <td>0.667</td>
                <td>0.849</td>
                <td>0.674</td>
                <td>0.825</td>
                <td>0.711</td>
                <td>0.723</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>(50, 50)</td>
                <td>0.688</td>
                <td>0.615</td>
                <td>0.819</td>
                <td>0.826</td>
                <td>0.809</td>
                <td>0.806</td>
                <td>0.754</td>
                <td>0.721</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>(100, 100)</td>
                <td>0.555</td>
                <td>0.635</td>
                <td>0.823</td>
                <td>0.826</td>
                <td>0.805</td>
                <td>0.808</td>
                <td>0.711</td>
                <td>0.730</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>(200, 200)</td>
                <td>0.533</td>
                <td>0.558</td>
                <td>0.848</td>
                <td>0.832</td>
                <td>0.823</td>
                <td>0.806</td>
                <td>0.691</td>
                <td>0.695</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>AUROC: area under the receiver operating characteristic curve.</p>
            </fn>
            <fn id="table3fn2">
              <p><sup>b</sup>SVM: support vector machine.</p>
            </fn>
            <fn id="table3fn3">
              <p><sup>c</sup>Final algorithms selected by adjusting parameters.</p>
            </fn>
            <fn id="table3fn4">
              <p><sup>d</sup>KNN: k-nearest neighbor.</p>
            </fn>
            <fn id="table3fn5">
              <p><sup>e</sup>NB: naïve Bayes.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>Performance according to the α value in the naïve Bayes model.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="160"/>
            <col width="100"/>
            <col width="110"/>
            <col width="100"/>
            <col width="110"/>
            <col width="100"/>
            <col width="110"/>
            <col width="100"/>
            <col width="110"/>
            <thead>
              <tr valign="top">
                <td rowspan="2">α value</td>
                <td colspan="2">Sensitivity</td>
                <td colspan="2">Specificity</td>
                <td colspan="2">Accuracy</td>
                <td colspan="2">AUROC<sup>a</sup></td>
              </tr>
              <tr valign="top">
                <td>5-year</td>
                <td>10-year</td>
                <td>5-year</td>
                <td>10-year</td>
                <td>5-year</td>
                <td>10-year</td>
                <td>5-year</td>
                <td>10-year</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>0 (no smoothing)</td>
                <td>0.800</td>
                <td>0.731</td>
                <td>0.848</td>
                <td>0.828</td>
                <td>0.844</td>
                <td>0.819</td>
                <td>0.824</td>
                <td>0.779</td>
              </tr>
              <tr valign="top">
                <td>1</td>
                <td>0.822</td>
                <td>0.731</td>
                <td>0.848</td>
                <td>0.828</td>
                <td>0.846</td>
                <td>0.819</td>
                <td>0.835</td>
                <td>0.779</td>
              </tr>
              <tr valign="top">
                <td>10</td>
                <td>0.822</td>
                <td>0.731</td>
                <td>0.850</td>
                <td>0.834</td>
                <td>0.848</td>
                <td>0.824</td>
                <td>0.836</td>
                <td>0.782</td>
              </tr>
              <tr valign="top">
                <td>20</td>
                <td>0.800</td>
                <td>0.731</td>
                <td>0.850</td>
                <td>0.834</td>
                <td>0.846</td>
                <td>0.824</td>
                <td>0.825</td>
                <td>0.782</td>
              </tr>
              <tr valign="top">
                <td>30</td>
                <td>0.800</td>
                <td>0.731</td>
                <td>0.852</td>
                <td>0.834</td>
                <td>0.848</td>
                <td>0.824</td>
                <td>0.826</td>
                <td>0.782</td>
              </tr>
              <tr valign="top">
                <td>100</td>
                <td>0.800</td>
                <td>0.731</td>
                <td>0.854</td>
                <td>0.840</td>
                <td>0.850</td>
                <td>0.828</td>
                <td>0.827</td>
                <td>0.784</td>
              </tr>
              <tr valign="top">
                <td>200</td>
                <td>0.756</td>
                <td>0.692</td>
                <td>0.860</td>
                <td>0.845</td>
                <td>0.852</td>
                <td>0.831</td>
                <td>0.807</td>
                <td>0.769</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table4fn1">
              <p><sup>a</sup>AUROC: area under the receiver operating characteristic curve.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>For predictions within 5 years, the AUROC was found to be 0.836 when α=10, which was the highest performance compared with that before smoothing was applied (α= 0, AUROC 0.824). For predictions within 10 years, the AUROC was 0.784 when α=100, which was the highest performance compared with that before smoothing was applied (α=0, AUROC 0.779). When comparing the area by drawing the ROC curve of the prediction algorithm within 5 and 10 years, the NB curve line was close to the upper left corner, which means that the area for that algorithm was the widest (<xref rid="figure2" ref-type="fig">Figures 2</xref> and <xref rid="figure3" ref-type="fig">3</xref>).</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Receiver operating characteristic (ROC) curves of recurrence prediction algorithms within 5 years. KNN: k-nearest neighbor; SVM: support vector machine.</p>
          </caption>
          <graphic xlink:href="medinform_v9i3e25635_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Receiver operating characteristic (ROC) curves of recurrence prediction algorithms within 10 years. KNN: k-nearest neighbor; SVM: support vector machine.</p>
          </caption>
          <graphic xlink:href="medinform_v9i3e25635_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>In this study, we developed an algorithm to predict the probability of RCC recurrence within 10 years by selecting 10 variables that significantly affect recurrence. The AUROC of the algorithm was 0.84 for models of recurrence within 5 years and 0.79 for models of recurrence within 10 years. Our proposed algorithm achieved better prediction performance than the previously developed 5-year prediction algorithm by MSKCC, which yielded AUROCs of 0.74 [<xref ref-type="bibr" rid="ref14">14</xref>] and 0.82 [<xref ref-type="bibr" rid="ref15">15</xref>].</p>
        <p>In the previous studies, 66 recurrences in 601 patients [<xref ref-type="bibr" rid="ref14">14</xref>] and 72 recurrences in 701 patients [<xref ref-type="bibr" rid="ref15">15</xref>] were used to form the data set for analysis. Because the data were collected from a single institution, the scale was small, and the data included censored data. The methods that can be applied to analyze censored data are limited. Therefore, in previous studies, an algorithm was developed using the Cox proportional hazards model—the most representative survival analysis method—and its performance was presented.</p>
        <p>Because the results of previous studies were based on a single institutional analysis, the characteristics of patients in various regions were likely not reflected, meaning biased results may have been obtained. Thus, a data set composed of data from eight institutions in various regions of Korea was used in this study. In our data, 278 out of 2814 patients experienced RCC recurrence, and censored data were not included. We attempted to improve the prediction performance using more diverse and significant variables than those used by the prediction algorithms in previous studies. Finally, we developed a prediction algorithm by applying ML techniques that are typically used in classification tasks. Because we used large-scale data that sufficiently reflect the characteristics of patients with RCC in Korea, the proposed algorithm achieved stable results with high accuracy and low bias.</p>
        <p>To the best of our knowledge, this is the first study to predict the recurrence of RCC within 10 years after surgery using ML techniques. The recurrence of most cancers is typically within 5 years. Because RCC has a late recurrence [<xref ref-type="bibr" rid="ref12">12</xref>], it is vital to predict the late recurrence in advance and establish a personalized treatment strategy for managing the prognosis of patients with RCC. Thus, our study makes an important contribution by accurately predicting the likelihood of late recurrence of RCC.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>We utilized the data of patients with RCC recurrence after 1 to 10 years in the recurrence prediction model within 10 years. However, in several studies, a difference between variables that affect early recurrence and late recurrence was observed [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref43">43</xref>]. Therefore, the prediction models for 1 to 5 years and 5 to 10 years should be distinct from each other and should be constructed using different combinations of variables. However, despite being a large cohort representing the whole of Korea, it was difficult to create a single model, as only 23 cases occurred after 5 to 10 years. Therefore, in this study, we developed a predictive model by integrating both groups within 10 years. Hence, the algorithm for within 10 years seems to have lower performance than the model for within 5 years because of the heterogeneity between the 1- to 5-year recurrence group and the 5- to 10-year recurrence group. We plan to develop additional stable and accurate models to predict late recurrence when data are collected after 5 to 10 years.</p>
        <p>Furthermore, we used large-scale cohort data showing the characteristics of patients with RCC in Korea. Therefore, the algorithm we developed exhibits stable performance when applied to Korean patients with RCC. However, patients with RCC have different demographic and clinical characteristics; hence, the performance may be reduced when applied to different ethnicities [<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref45">45</xref>].</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>Using the KORCC database, a large-scale cohort of RCC in Korea, we developed an algorithm to predict the probability of RCC recurrence after surgery using a representative ML technique. Among the eight ML algorithms, the NB algorithm showed the best diagnostic performance in both the 5-year model and the 10-year model in terms of the AUROC. The developed algorithm can help clinicians establish postoperative prognosis management and personalized treatment strategies for patients with RCC.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group/>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AUROC</term>
          <def>
            <p>area under the receiver operating characteristic curve</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">KNN</term>
          <def>
            <p>k-nearest neighbor</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">KORCC</term>
          <def>
            <p>KOrean Renal Cell Carcinoma</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">ML</term>
          <def>
            <p>machine learning</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">MSKCC</term>
          <def>
            <p>Memorial Sloan Kettering Cancer Center</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">NB</term>
          <def>
            <p>naïve Bayes</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">RCC</term>
          <def>
            <p>renal cell carcinoma</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">SMOTE</term>
          <def>
            <p>synthetic minority oversampling technique</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">SVM</term>
          <def>
            <p>support vector machine</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This study was supported by the R&#38;D Performance Creation Promotion Project 2019 of Seoul St Mary's Hospital. We thank the KOrean Renal Cell Carcinoma (KORCC) group for assisting us in analyzing the data.</p>
    </ack>
    <fn-group>
      <fn fn-type="con">
        <p>HMK contributed to the work as the first author. SJL and SJP contributed to data preparation and discussion. IYC and S-HH equally supervised the entire process as corresponding authors.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Choueiri</surname>
              <given-names>TK</given-names>
            </name>
            <name name-style="western">
              <surname>Motzer</surname>
              <given-names>RJ</given-names>
            </name>
          </person-group>
          <article-title>Systemic Therapy for Metastatic Renal-Cell Carcinoma</article-title>
          <source>N Engl J Med</source>
          <year>2017</year>
          <month>01</month>
          <day>26</day>
          <volume>376</volume>
          <issue>4</issue>
          <fpage>354</fpage>
          <lpage>366</lpage>
          <pub-id pub-id-type="doi">10.1056/nejmra1601333</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Capitanio</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Bensalah</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Bex</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Boorjian</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Bray</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Coleman</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Gore</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Wood</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Russo</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Epidemiology of Renal Cell Carcinoma</article-title>
          <source>European Urology</source>
          <year>2019</year>
          <month>01</month>
          <volume>75</volume>
          <issue>1</issue>
          <fpage>74</fpage>
          <lpage>84</lpage>
          <pub-id pub-id-type="doi">10.1016/j.eururo.2018.08.036</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hong</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Won</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>YR</given-names>
            </name>
            <name name-style="western">
              <surname>Jung</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kong</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>ES</given-names>
            </name>
          </person-group>
          <article-title>Cancer Statistics in Korea: Incidence, Mortality, Survival, and Prevalence in 2017</article-title>
          <source>Cancer Res Treat</source>
          <year>2020</year>
          <month>4</month>
          <volume>52</volume>
          <issue>2</issue>
          <fpage>335</fpage>
          <lpage>350</lpage>
          <pub-id pub-id-type="doi">10.4143/crt.2020.206</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chin</surname>
              <given-names>AI</given-names>
            </name>
            <name name-style="western">
              <surname>Lam</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Figlin</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>Belldegrun</surname>
              <given-names>AS</given-names>
            </name>
          </person-group>
          <article-title>Surveillance strategies for renal cell carcinoma patients following nephrectomy</article-title>
          <source>Rev Urol</source>
          <year>2006</year>
          <volume>8</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>7</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/16985554"/>
          </comment>
          <pub-id pub-id-type="medline">16985554</pub-id>
          <pub-id pub-id-type="pmcid">PMC1471767</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jemal</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Murray</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ward</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Samuels</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Tiwari</surname>
              <given-names>RC</given-names>
            </name>
            <name name-style="western">
              <surname>Ghafoor</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Feuer</surname>
              <given-names>EJ</given-names>
            </name>
            <name name-style="western">
              <surname>Thun</surname>
              <given-names>MJ</given-names>
            </name>
          </person-group>
          <article-title>Cancer statistics, 2005</article-title>
          <source>CA Cancer J Clin</source>
          <year>2005</year>
          <volume>55</volume>
          <issue>1</issue>
          <fpage>10</fpage>
          <lpage>30</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://onlinelibrary.wiley.com/resolve/openurl?genre=article&#38;sid=nlm:pubmed&#38;issn=0007-9235&#38;date=2005&#38;volume=55&#38;issue=1&#38;spage=10"/>
          </comment>
          <pub-id pub-id-type="doi">10.3322/canjclin.55.1.10</pub-id>
          <pub-id pub-id-type="medline">15661684</pub-id>
          <pub-id pub-id-type="pii">55/1/10</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Janzen</surname>
              <given-names>NK</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>HL</given-names>
            </name>
            <name name-style="western">
              <surname>Figlin</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>Belldegrun</surname>
              <given-names>AS</given-names>
            </name>
          </person-group>
          <article-title>Surveillance after radical or partial nephrectomy for localized renal cell carcinoma and management of recurrent disease</article-title>
          <source>Urol Clin North Am</source>
          <year>2003</year>
          <month>11</month>
          <volume>30</volume>
          <issue>4</issue>
          <fpage>843</fpage>
          <lpage>52</lpage>
          <pub-id pub-id-type="doi">10.1016/s0094-0143(03)00056-9</pub-id>
          <pub-id pub-id-type="medline">14680319</pub-id>
          <pub-id pub-id-type="pii">S0094-0143(03)00056-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jang</surname>
              <given-names>HA</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>JW</given-names>
            </name>
            <name name-style="western">
              <surname>Byun</surname>
              <given-names>SS</given-names>
            </name>
            <name name-style="western">
              <surname>Hong</surname>
              <given-names>SH</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>YJ</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>YH</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>KS</given-names>
            </name>
            <name name-style="western">
              <surname>Cho</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Cheon</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kang</surname>
              <given-names>SH</given-names>
            </name>
          </person-group>
          <article-title>Oncologic and Functional Outcomes after Partial Nephrectomy Versus Radical Nephrectomy in T1b Renal Cell Carcinoma: A Multicenter, Matched Case-Control Study in Korean Patients</article-title>
          <source>Cancer Res Treat</source>
          <year>2016</year>
          <month>04</month>
          <volume>48</volume>
          <issue>2</issue>
          <fpage>612</fpage>
          <lpage>20</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.doi.org/10.4143/crt.2014.122"/>
          </comment>
          <pub-id pub-id-type="doi">10.4143/crt.2014.122</pub-id>
          <pub-id pub-id-type="medline">26044158</pub-id>
          <pub-id pub-id-type="pii">crt.2014.122</pub-id>
          <pub-id pub-id-type="pmcid">PMC4843725</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tyson</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>SS</given-names>
            </name>
          </person-group>
          <article-title>Optimal Surveillance Strategies After Surgery for Renal Cell Carcinoma</article-title>
          <source>J Natl Compr Canc Netw</source>
          <year>2017</year>
          <month>06</month>
          <volume>15</volume>
          <issue>6</issue>
          <fpage>835</fpage>
          <lpage>840</lpage>
          <pub-id pub-id-type="doi">10.6004/jnccn.2017.0102</pub-id>
          <pub-id pub-id-type="medline">28596262</pub-id>
          <pub-id pub-id-type="pii">15/6/835</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>van der Mijn</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Al Hussein Al Awamlh</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Islam Khan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Posada-Calderon</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Oromendia</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Fainberg</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Alshak</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Elahjji</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Pierce</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Taylor</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Gudas</surname>
              <given-names>LJ</given-names>
            </name>
            <name name-style="western">
              <surname>Nanus</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Molina</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Del Pizzo</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Scherr</surname>
              <given-names>DS</given-names>
            </name>
          </person-group>
          <article-title>Validation of risk factors for recurrence of renal cell carcinoma: Results from a large single-institution series</article-title>
          <source>PLoS One</source>
          <year>2019</year>
          <volume>14</volume>
          <issue>12</issue>
          <fpage>e0226285</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0226285"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0226285</pub-id>
          <pub-id pub-id-type="medline">31815952</pub-id>
          <pub-id pub-id-type="pii">PONE-D-19-21440</pub-id>
          <pub-id pub-id-type="pmcid">PMC6901215</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Quinlan</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Davis</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Poyet</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Perera</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bolton</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Lawrentschuk</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Renal Cell Carcinoma Follow-Up - Is it Time to Abandon Ultrasound?</article-title>
          <source>Curr Urol</source>
          <year>2019</year>
          <month>09</month>
          <volume>13</volume>
          <issue>1</issue>
          <fpage>19</fpage>
          <lpage>24</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.karger.com?DOI=10.1159/000499299"/>
          </comment>
          <pub-id pub-id-type="doi">10.1159/000499299</pub-id>
          <pub-id pub-id-type="medline">31579200</pub-id>
          <pub-id pub-id-type="pii">cur-0013-0019</pub-id>
          <pub-id pub-id-type="pmcid">PMC6771069</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Acar</surname>
              <given-names>Ö</given-names>
            </name>
            <name name-style="western">
              <surname>Şanlı</surname>
              <given-names>Ö</given-names>
            </name>
          </person-group>
          <article-title>Surgical Management of Local Recurrences of Renal Cell Carcinoma</article-title>
          <source>Surg Res Pract</source>
          <year>2016</year>
          <volume>2016</volume>
          <fpage>2394942</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1155/2016/2394942"/>
          </comment>
          <pub-id pub-id-type="doi">10.1155/2016/2394942</pub-id>
          <pub-id pub-id-type="medline">26925458</pub-id>
          <pub-id pub-id-type="pmcid">PMC4746394</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Park</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Baik</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Ku</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Kwak</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Late recurrence of renal cell carcinoma &#62;5 years after surgery: clinicopathological characteristics and prognosis</article-title>
          <source>BJU Int</source>
          <year>2012</year>
          <month>12</month>
          <volume>110</volume>
          <issue>11 Pt B</issue>
          <fpage>E553</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.1111/j.1464-410X.2012.11246.x</pub-id>
          <pub-id pub-id-type="medline">22578274</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kirkali</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Van Poppel</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>A critical analysis of surgery for kidney cancer with vena cava invasion</article-title>
          <source>Eur Urol</source>
          <year>2007</year>
          <month>09</month>
          <volume>52</volume>
          <issue>3</issue>
          <fpage>658</fpage>
          <lpage>62</lpage>
          <pub-id pub-id-type="doi">10.1016/j.eururo.2007.05.009</pub-id>
          <pub-id pub-id-type="medline">17548146</pub-id>
          <pub-id pub-id-type="pii">S0302-2838(07)00710-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kattan</surname>
              <given-names>M W</given-names>
            </name>
            <name name-style="western">
              <surname>Reuter</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Motzer</surname>
              <given-names>R J</given-names>
            </name>
            <name name-style="western">
              <surname>Katz</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Russo</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>A postoperative prognostic nomogram for renal cell carcinoma</article-title>
          <source>J Urol</source>
          <year>2001</year>
          <month>07</month>
          <volume>166</volume>
          <issue>1</issue>
          <fpage>63</fpage>
          <lpage>7</lpage>
          <pub-id pub-id-type="medline">11435824</pub-id>
          <pub-id pub-id-type="pii">S0022-5347(05)66077-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sorbellini</surname>
              <given-names>Maximiliano</given-names>
            </name>
            <name name-style="western">
              <surname>Kattan</surname>
              <given-names>Michael W</given-names>
            </name>
            <name name-style="western">
              <surname>Snyder</surname>
              <given-names>Mark E</given-names>
            </name>
            <name name-style="western">
              <surname>Reuter</surname>
              <given-names>Victor</given-names>
            </name>
            <name name-style="western">
              <surname>Motzer</surname>
              <given-names>Robert</given-names>
            </name>
            <name name-style="western">
              <surname>Goetzl</surname>
              <given-names>Manlio</given-names>
            </name>
            <name name-style="western">
              <surname>McKiernan</surname>
              <given-names>James</given-names>
            </name>
            <name name-style="western">
              <surname>Russo</surname>
              <given-names>Paul</given-names>
            </name>
          </person-group>
          <article-title>A postoperative prognostic nomogram predicting recurrence for patients with conventional clear cell renal cell carcinoma</article-title>
          <source>J Urol</source>
          <year>2005</year>
          <month>01</month>
          <volume>173</volume>
          <issue>1</issue>
          <fpage>48</fpage>
          <lpage>51</lpage>
          <pub-id pub-id-type="doi">10.1097/01.ju.0000148261.19532.2c</pub-id>
          <pub-id pub-id-type="medline">15592023</pub-id>
          <pub-id pub-id-type="pii">S0022-5347(05)60765-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zupan</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Demsar</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kattan</surname>
              <given-names>MW</given-names>
            </name>
            <name name-style="western">
              <surname>Beck</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bratko</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Machine learning for survival analysis: a case study on recurrence of prostate cancer</article-title>
          <source>Artif Intell Med</source>
          <year>2000</year>
          <month>08</month>
          <volume>20</volume>
          <issue>1</issue>
          <fpage>59</fpage>
          <lpage>75</lpage>
          <pub-id pub-id-type="doi">10.1016/s0933-3657(00)00053-1</pub-id>
          <pub-id pub-id-type="medline">11185421</pub-id>
          <pub-id pub-id-type="pii">S0933-3657(00)00053-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mani</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ozdas</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Aliferis</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Varol</surname>
              <given-names>HA</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Carnevale</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Romano-Keeler</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Nian</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Weitkamp</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Medical decision support using machine learning for early detection of late-onset neonatal sepsis</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2014</year>
          <volume>21</volume>
          <issue>2</issue>
          <fpage>326</fpage>
          <lpage>36</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/24043317"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/amiajnl-2013-001854</pub-id>
          <pub-id pub-id-type="medline">24043317</pub-id>
          <pub-id pub-id-type="pii">amiajnl-2013-001854</pub-id>
          <pub-id pub-id-type="pmcid">PMC3932458</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Byun</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hong</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kook</surname>
              <given-names>HR</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>HH</given-names>
            </name>
            <name name-style="western">
              <surname>Kwak</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Ku</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Jeong</surname>
              <given-names>CW</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>JY</given-names>
            </name>
            <name name-style="western">
              <surname>Hong</surname>
              <given-names>SH</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Hwang</surname>
              <given-names>EC</given-names>
            </name>
            <name name-style="western">
              <surname>Kwon</surname>
              <given-names>TG</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Kang</surname>
              <given-names>SH</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>SH</given-names>
            </name>
            <name name-style="western">
              <surname>Chung</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>The establishment of KORCC (KOrean Renal Cell Carcinoma) database</article-title>
          <source>Investig Clin Urol</source>
          <year>2016</year>
          <month>01</month>
          <volume>57</volume>
          <issue>1</issue>
          <fpage>50</fpage>
          <lpage>7</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.icurology.org/DOIx.php?id=10.4111/icu.2016.57.1.50"/>
          </comment>
          <pub-id pub-id-type="doi">10.4111/icu.2016.57.1.50</pub-id>
          <pub-id pub-id-type="medline">26966726</pub-id>
          <pub-id pub-id-type="pmcid">PMC4778757</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>SH</given-names>
            </name>
            <name name-style="western">
              <surname>Son</surname>
              <given-names>HS</given-names>
            </name>
            <name name-style="western">
              <surname>Cho</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Yoo</surname>
              <given-names>DS</given-names>
            </name>
            <name name-style="western">
              <surname>Kang</surname>
              <given-names>SH</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>SY</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Jeon</surname>
              <given-names>SH</given-names>
            </name>
          </person-group>
          <article-title>Which Patients Should We Follow up beyond 5 Years after Definitive Therapy for Localized Renal Cell Carcinoma?</article-title>
          <source>Cancer Res Treat</source>
          <year>2015</year>
          <month>07</month>
          <volume>47</volume>
          <issue>3</issue>
          <fpage>489</fpage>
          <lpage>94</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.doi.org/10.4143/crt.2014.013"/>
          </comment>
          <pub-id pub-id-type="doi">10.4143/crt.2014.013</pub-id>
          <pub-id pub-id-type="medline">25622589</pub-id>
          <pub-id pub-id-type="pii">crt.2014.013</pub-id>
          <pub-id pub-id-type="pmcid">PMC4506106</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fukushima</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Saito</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Yasuda</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Tanaka</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Patil</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Cotta</surname>
              <given-names>BH</given-names>
            </name>
            <name name-style="western">
              <surname>Patel</surname>
              <given-names>SH</given-names>
            </name>
            <name name-style="western">
              <surname>Master</surname>
              <given-names>VA</given-names>
            </name>
            <name name-style="western">
              <surname>Derweesh</surname>
              <given-names>IH</given-names>
            </name>
            <name name-style="western">
              <surname>Fujii</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Female Gender Predicts Favorable Prognosis in Patients With Non-metastatic Clear Cell Renal Cell Carcinoma Undergoing Curative Surgery: Results From the International Marker Consortium for Renal Cancer (INMARC)</article-title>
          <source>Clin Genitourin Cancer</source>
          <year>2020</year>
          <month>04</month>
          <volume>18</volume>
          <issue>2</issue>
          <fpage>111</fpage>
          <lpage>116.e1</lpage>
          <pub-id pub-id-type="doi">10.1016/j.clgc.2019.10.027</pub-id>
          <pub-id pub-id-type="medline">32001181</pub-id>
          <pub-id pub-id-type="pii">S1558-7673(19)30331-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Choi</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Jeong</surname>
              <given-names>BC</given-names>
            </name>
            <name name-style="western">
              <surname>Seo</surname>
              <given-names>SI</given-names>
            </name>
            <name name-style="western">
              <surname>Jeon</surname>
              <given-names>SS</given-names>
            </name>
            <name name-style="western">
              <surname>Choi</surname>
              <given-names>HY</given-names>
            </name>
            <name name-style="western">
              <surname>Adami</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>JE</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>HM</given-names>
            </name>
          </person-group>
          <article-title>Body mass index and survival in patients with renal cell carcinoma: a clinical-based cohort and meta-analysis</article-title>
          <source>Int J Cancer</source>
          <year>2013</year>
          <month>02</month>
          <day>01</day>
          <volume>132</volume>
          <issue>3</issue>
          <fpage>625</fpage>
          <lpage>34</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1002/ijc.27639"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/ijc.27639</pub-id>
          <pub-id pub-id-type="medline">22610826</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Qi</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Song</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dong</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Kong</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Xue</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>The impact of smoking on survival in renal cell carcinoma: a systematic review and meta-analysis</article-title>
          <source>Tumour Biol</source>
          <year>2014</year>
          <month>07</month>
          <volume>35</volume>
          <issue>7</issue>
          <fpage>6633</fpage>
          <lpage>40</lpage>
          <pub-id pub-id-type="doi">10.1007/s13277-014-1862-8</pub-id>
          <pub-id pub-id-type="medline">24699995</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yoo</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>You</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Jeong</surname>
              <given-names>IG</given-names>
            </name>
            <name name-style="western">
              <surname>Song</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Hong</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Hong</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Ahn</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Histologic subtype needs to be considered after partial nephrectomy in patients with pathologic T1a renal cell carcinoma: papillary vs. clear cell renal cell carcinoma</article-title>
          <source>J Cancer Res Clin Oncol</source>
          <year>2017</year>
          <month>09</month>
          <volume>143</volume>
          <issue>9</issue>
          <fpage>1845</fpage>
          <lpage>1851</lpage>
          <pub-id pub-id-type="doi">10.1007/s00432-017-2430-6</pub-id>
          <pub-id pub-id-type="medline">28451753</pub-id>
          <pub-id pub-id-type="pii">10.1007/s00432-017-2430-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Abel</surname>
              <given-names>EJ</given-names>
            </name>
            <name name-style="western">
              <surname>Raman</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Shapiro</surname>
              <given-names>DD</given-names>
            </name>
            <name name-style="western">
              <surname>Chan</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Allen</surname>
              <given-names>GO</given-names>
            </name>
            <name name-style="western">
              <surname>Patil</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Master</surname>
              <given-names>VA</given-names>
            </name>
          </person-group>
          <article-title>Defining individual recurrence risk following surgery for high risk non-metastatic renal cell carcinoma</article-title>
          <source>J Clin Oncol</source>
          <year>2018</year>
          <month>02</month>
          <day>20</day>
          <volume>36</volume>
          <issue>6_suppl</issue>
          <fpage>664</fpage>
          <lpage>664</lpage>
          <pub-id pub-id-type="doi">10.1200/jco.2018.36.6_suppl.664</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ha</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>KW</given-names>
            </name>
            <name name-style="western">
              <surname>Jung</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Byun</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kwak</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Chung</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hwang</surname>
              <given-names>EC</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Kwon</surname>
              <given-names>TG</given-names>
            </name>
            <name name-style="western">
              <surname>Kang</surname>
              <given-names>SH</given-names>
            </name>
            <name name-style="western">
              <surname>Hong</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Renal capsular invasion is a prognostic biomarker in localized clear cell renal cell carcinoma</article-title>
          <source>Sci Rep</source>
          <year>2018</year>
          <month>01</month>
          <day>09</day>
          <volume>8</volume>
          <issue>1</issue>
          <fpage>202</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41598-017-18466-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-017-18466-9</pub-id>
          <pub-id pub-id-type="medline">29317731</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-017-18466-9</pub-id>
          <pub-id pub-id-type="pmcid">PMC5760639</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ali</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Shamsuddin</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Ralescu</surname>
              <given-names>AL</given-names>
            </name>
          </person-group>
          <article-title>Classification with class imbalance problem: A review</article-title>
          <source>Int J Adv Soft Comput Appl</source>
          <year>2015</year>
          <volume>7</volume>
          <issue>3</issue>
          <fpage>176</fpage>
          <lpage>204</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://home.ijasca.com/data/documents/13IJASCA-070301_Pg176-204_Classification-with-class-imbalance-problem_A-Review.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>SC</given-names>
            </name>
          </person-group>
          <article-title>A learning method for the class imbalance problem with medical data sets</article-title>
          <source>Comput Biol Med</source>
          <year>2010</year>
          <month>05</month>
          <volume>40</volume>
          <issue>5</issue>
          <fpage>509</fpage>
          <lpage>18</lpage>
          <pub-id pub-id-type="doi">10.1016/j.compbiomed.2010.03.005</pub-id>
          <pub-id pub-id-type="medline">20347072</pub-id>
          <pub-id pub-id-type="pii">S0010-4825(10)00040-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Alghamdi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Al-Mallah</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Keteyian</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Brawner</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Ehrman</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Sakr</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Predicting diabetes mellitus using SMOTE and ensemble machine learning approach: The Henry Ford ExercIse Testing (FIT) project</article-title>
          <source>PLoS One</source>
          <year>2017</year>
          <volume>12</volume>
          <issue>7</issue>
          <fpage>e0179805</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0179805"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0179805</pub-id>
          <pub-id pub-id-type="medline">28738059</pub-id>
          <pub-id pub-id-type="pii">PONE-D-17-07353</pub-id>
          <pub-id pub-id-type="pmcid">PMC5524285</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Blagus</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Lusa</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Joint use of over- and under-sampling techniques and cross-validation for the development and assessment of prediction models</article-title>
          <source>BMC Bioinformatics</source>
          <year>2015</year>
          <month>11</month>
          <day>04</day>
          <volume>16</volume>
          <fpage>363</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcbioinformatics.biomedcentral.com/articles/10.1186/s12859-015-0784-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12859-015-0784-9</pub-id>
          <pub-id pub-id-type="medline">26537827</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12859-015-0784-9</pub-id>
          <pub-id pub-id-type="pmcid">PMC4634915</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Foster</surname>
              <given-names>KR</given-names>
            </name>
            <name name-style="western">
              <surname>Koprowski</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Skufca</surname>
              <given-names>JD</given-names>
            </name>
          </person-group>
          <article-title>Machine learning, medical diagnosis, and biomedical engineering research - commentary</article-title>
          <source>Biomed Eng Online</source>
          <year>2014</year>
          <month>07</month>
          <day>05</day>
          <volume>13</volume>
          <fpage>94</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://biomedical-engineering-online.biomedcentral.com/articles/10.1186/1475-925X-13-94"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1475-925X-13-94</pub-id>
          <pub-id pub-id-type="medline">24998888</pub-id>
          <pub-id pub-id-type="pii">1475-925X-13-94</pub-id>
          <pub-id pub-id-type="pmcid">PMC4105825</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Ke</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tsai</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>SVM and SVM Ensembles in Breast Cancer Prediction</article-title>
          <source>PLoS One</source>
          <year>2017</year>
          <volume>12</volume>
          <issue>1</issue>
          <fpage>e0161501</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0161501"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0161501</pub-id>
          <pub-id pub-id-type="medline">28060807</pub-id>
          <pub-id pub-id-type="pii">PONE-D-16-10440</pub-id>
          <pub-id pub-id-type="pmcid">PMC5217832</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chin</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Logistic regression for disease classification using microarray data: model selection in a large p and small n case</article-title>
          <source>Bioinformatics</source>
          <year>2007</year>
          <month>08</month>
          <day>01</day>
          <volume>23</volume>
          <issue>15</issue>
          <fpage>1945</fpage>
          <lpage>51</lpage>
          <pub-id pub-id-type="doi">10.1093/bioinformatics/btm287</pub-id>
          <pub-id pub-id-type="medline">17540680</pub-id>
          <pub-id pub-id-type="pii">btm287</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Song</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Decision tree methods: applications for classification and prediction</article-title>
          <source>Shanghai Arch Psychiatry</source>
          <year>2015</year>
          <month>04</month>
          <day>25</day>
          <volume>27</volume>
          <issue>2</issue>
          <fpage>130</fpage>
          <lpage>5</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/26120265"/>
          </comment>
          <pub-id pub-id-type="doi">10.11919/j.issn.1002-0829.215044</pub-id>
          <pub-id pub-id-type="medline">26120265</pub-id>
          <pub-id pub-id-type="pii">sap-27-02-130</pub-id>
          <pub-id pub-id-type="pmcid">PMC4466856</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Deng</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Cheng</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Zong</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Efficient kNN classification algorithm for big data</article-title>
          <source>Neurocomputing</source>
          <year>2016</year>
          <month>06</month>
          <volume>195</volume>
          <fpage>143</fpage>
          <lpage>148</lpage>
          <pub-id pub-id-type="doi">10.1016/j.neucom.2015.08.112</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Subbalakshmi</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Ramesh</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Chinna Rao</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Decision Support in Heart Disease Prediction System using Naive Bayes</article-title>
          <source>Indian J Comput Sci Eng</source>
          <year>2011</year>
          <volume>2</volume>
          <issue>2</issue>
          <fpage>170</fpage>
          <lpage>176</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.ijcse.com/docs/IJCSE11-02-02-56.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chan</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Paelinckx</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Evaluation of Random Forest and Adaboost tree-based ensemble classification and spectral band selection for ecotope mapping using airborne hyperspectral imagery</article-title>
          <source>Remote Sensing of Environment</source>
          <year>2008</year>
          <month>6</month>
          <volume>112</volume>
          <issue>6</issue>
          <fpage>2999</fpage>
          <lpage>3011</lpage>
          <pub-id pub-id-type="doi">10.1016/j.rse.2008.02.011</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Application of eXtreme gradient boosting trees in the construction of credit risk assessment models for financial institutions</article-title>
          <source>Applied Soft Computing</source>
          <year>2018</year>
          <month>12</month>
          <volume>73</volume>
          <fpage>914</fpage>
          <lpage>920</lpage>
          <pub-id pub-id-type="doi">10.1016/j.asoc.2018.09.029</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <collab>Jin Huang</collab>
            <name name-style="western">
              <surname>Ling</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Using AUC and accuracy in evaluating learning algorithms</article-title>
          <source>IEEE Trans Knowl Data Eng</source>
          <year>2005</year>
          <month>03</month>
          <volume>17</volume>
          <issue>3</issue>
          <fpage>299</fpage>
          <lpage>310</lpage>
          <pub-id pub-id-type="doi">10.1109/tkde.2005.50</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rennie</surname>
              <given-names>J.D</given-names>
            </name>
            <name name-style="western">
              <surname>Shih</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Teevan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Karger</surname>
              <given-names>D.R</given-names>
            </name>
          </person-group>
          <article-title>Tackling the Poor Assumptions of Naive Bayes Text Classifiers Jason</article-title>
          <year>2003</year>
          <conf-name>Proc 20th Int Conf Mach Learn. Published online</conf-name>
          <conf-date>2003</conf-date>
          <conf-loc>Washington DC</conf-loc>
          <fpage>616</fpage>
          <lpage>623</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rish</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>An empirical study of the naive Bayes classifier</article-title>
          <year>2001</year>
          <conf-name>IJCAI 2001 Workshop on empirical methods in artificial intelligence</conf-name>
          <conf-date>2001</conf-date>
          <conf-loc>Seattle, USA</conf-loc>
          <fpage>4863</fpage>
          <lpage>4869</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hellerstein</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Jayram</surname>
              <given-names>TS</given-names>
            </name>
            <name name-style="western">
              <surname>Rish</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Recognizing end-user transactions in performance management</article-title>
          <year>2000</year>
          <conf-name>Proceedings of the Seventeenth National Conference on Artificial Intelligence and Twelfth Conference on on Innovative Applications of Artificial Intelligence</conf-name>
          <conf-date>2000</conf-date>
          <conf-loc>Austin, Texas, USA</conf-loc>
          <fpage>596</fpage>
          <lpage>602</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cherian</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Bindu</surname>
              <given-names>M.S</given-names>
            </name>
          </person-group>
          <article-title>Heart Disease Prediction Using Naïve Bayes Algorithm and Laplace Smoothing Technique</article-title>
          <source>Int J Comput Sci Trends Technol</source>
          <year>2017</year>
          <volume>5</volume>
          <issue>2</issue>
          <fpage>68</fpage>
          <lpage>73</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href=" http://www.ijcstjournal.org/volume-5/issue-2/IJCST-V5I2P13.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Adamy</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Chong</surname>
              <given-names>KT</given-names>
            </name>
            <name name-style="western">
              <surname>Chade</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Costaras</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Russo</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Kaag</surname>
              <given-names>MG</given-names>
            </name>
            <name name-style="western">
              <surname>Bernstein</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Motzer</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Russo</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Clinical characteristics and outcomes of patients with recurrence 5 years after nephrectomy for localized renal cell carcinoma</article-title>
          <source>J Urol</source>
          <year>2011</year>
          <month>02</month>
          <volume>185</volume>
          <issue>2</issue>
          <fpage>433</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.1016/j.juro.2010.09.100</pub-id>
          <pub-id pub-id-type="medline">21167521</pub-id>
          <pub-id pub-id-type="pii">S0022-5347(10)04758-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chow</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Shuch</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Linehan</surname>
              <given-names>WM</given-names>
            </name>
            <name name-style="western">
              <surname>Devesa</surname>
              <given-names>SS</given-names>
            </name>
          </person-group>
          <article-title>Racial disparity in renal cell carcinoma patient survival according to demographic and clinical characteristics</article-title>
          <source>Cancer</source>
          <year>2013</year>
          <month>01</month>
          <day>15</day>
          <volume>119</volume>
          <issue>2</issue>
          <fpage>388</fpage>
          <lpage>94</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1002/cncr.27690"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/cncr.27690</pub-id>
          <pub-id pub-id-type="medline">23147245</pub-id>
          <pub-id pub-id-type="pmcid">PMC3538913</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Olshan</surname>
              <given-names>AF</given-names>
            </name>
            <name name-style="western">
              <surname>Kuo</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Meyer</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Nielsen</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Purdue</surname>
              <given-names>MP</given-names>
            </name>
            <name name-style="western">
              <surname>Rathmell</surname>
              <given-names>WK</given-names>
            </name>
          </person-group>
          <article-title>Racial difference in histologic subtype of renal cell carcinoma</article-title>
          <source>Cancer Med</source>
          <year>2013</year>
          <month>10</month>
          <volume>2</volume>
          <issue>5</issue>
          <fpage>744</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1002/cam4.110"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/cam4.110</pub-id>
          <pub-id pub-id-type="medline">24403240</pub-id>
          <pub-id pub-id-type="pmcid">PMC3892806</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
