<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id>
      <journal-title>JMIR Medical Informatics</journal-title>
      <issn pub-type="epub">2291-9694</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v8i10e21798</article-id>
      <article-id pub-id-type="pmid">33084589</article-id>
      <article-id pub-id-type="doi">10.2196/21798</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>AutoScore: A Machine Learning–Based Automatic Clinical Score Generator and Its Application to Mortality Prediction Using Electronic Health Records</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Eysenbach</surname>
            <given-names>Gunther</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Li</surname>
            <given-names>Jinfeng</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Adly</surname>
            <given-names>Mahmoud</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Adly</surname>
            <given-names>Afnan</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author">
          <name name-style="western">
            <surname>Xie</surname>
            <given-names>Feng</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0215-667X</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Chakraborty</surname>
            <given-names>Bibhas</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-7366-0478</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Ong</surname>
            <given-names>Marcus Eng Hock</given-names>
          </name>
          <degrees>MBBS, MPH</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff4" ref-type="aff">4</xref>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7874-7612</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Goldstein</surname>
            <given-names>Benjamin Alan</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-5261-3632</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>Nan</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Programme in Health Services and Systems Research</institution>
            <institution>Duke-NUS Medical School</institution>
            <addr-line>8 College Road</addr-line>
            <addr-line>Singapore, 169857</addr-line>
            <country>Singapore</country>
            <phone>65 65767372</phone>
            <email>liu.nan@duke-nus.edu.sg</email>
          </address>
          <xref rid="aff5" ref-type="aff">5</xref>
          <xref rid="aff6" ref-type="aff">6</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-3610-4883</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Programme in Health Services and Systems Research</institution>
        <institution>Duke-NUS Medical School</institution>
        <addr-line>Singapore</addr-line>
        <country>Singapore</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Department of Statistics and Applied Probability</institution>
        <institution>National University of Singapore</institution>
        <addr-line>Singapore</addr-line>
        <country>Singapore</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Department of Biostatistics &#38; Bioinformatics</institution>
        <institution>Duke University</institution>
        <addr-line>Durham, NC</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Department of Emergency Medicine</institution>
        <institution>Singapore General Hospital</institution>
        <addr-line>Singapore</addr-line>
        <country>Singapore</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>Health Services Research Centre</institution>
        <institution>Singapore Health Services</institution>
        <addr-line>Singapore</addr-line>
        <country>Singapore</country>
      </aff>
      <aff id="aff6">
        <label>6</label>
        <institution>Institute of Data Science</institution>
        <institution>National University of Singapore</institution>
        <addr-line>Singapore</addr-line>
        <country>Singapore</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Nan Liu <email>liu.nan@duke-nus.edu.sg</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>10</month>
        <year>2020</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>21</day>
        <month>10</month>
        <year>2020</year>
      </pub-date>
      <volume>8</volume>
      <issue>10</issue>
      <elocation-id>e21798</elocation-id>
      <history>
        <date date-type="received">
          <day>25</day>
          <month>6</month>
          <year>2020</year>
        </date>
        <date date-type="rev-request">
          <day>14</day>
          <month>7</month>
          <year>2020</year>
        </date>
        <date date-type="rev-recd">
          <day>25</day>
          <month>7</month>
          <year>2020</year>
        </date>
        <date date-type="accepted">
          <day>27</day>
          <month>7</month>
          <year>2020</year>
        </date>
      </history>
      <copyright-statement>©Feng Xie, Bibhas Chakraborty, Marcus Eng Hock Ong, Benjamin Alan Goldstein, Nan Liu. Originally published in JMIR Medical Informatics (http://medinform.jmir.org), 21.10.2020.</copyright-statement>
      <copyright-year>2020</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on http://medinform.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="http://medinform.jmir.org/2020/10/e21798/" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Risk scores can be useful in clinical risk stratification and accurate allocations of medical resources, helping health providers improve patient care. Point-based scores are more understandable and explainable than other complex models and are now widely used in clinical decision making. However, the development of the risk scoring model is nontrivial and has not yet been systematically presented, with few studies investigating methods of clinical score generation using electronic health records.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study aims to propose AutoScore, a machine learning–based automatic clinical score generator consisting of 6 modules for developing interpretable point-based scores. Future users can employ the AutoScore framework to create clinical scores effortlessly in various clinical applications.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We proposed the AutoScore framework comprising 6 modules that included variable ranking, variable transformation, score derivation, model selection, score fine-tuning, and model evaluation. To demonstrate the performance of AutoScore, we used data from the Beth Israel Deaconess Medical Center to build a scoring model for mortality prediction and then compared the data with other baseline models using the receiver operating characteristic analysis. A software package in R 3.5.3 (R Foundation) was also developed to demonstrate the implementation of AutoScore.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Implemented on the data set with 44,918 individual admission episodes of intensive care, the AutoScore-created scoring models performed comparably well as other standard methods (ie, logistic regression, stepwise regression, least absolute shrinkage and selection operator, and random forest) in terms of predictive accuracy and model calibration but required fewer predictors and presented high interpretability and accessibility. The nine-variable, AutoScore-created, point-based scoring model achieved an area under the curve (AUC) of 0.780 (95% CI 0.764-0.798), whereas the model of logistic regression with 24 variables had an AUC of 0.778 (95% CI 0.760-0.795). Moreover, the AutoScore framework also drives the clinical research continuum and automation with its integration of all necessary modules.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>We developed an easy-to-use, machine learning–based automatic clinical score generator, AutoScore; systematically presented its structure; and demonstrated its superiority (predictive performance and interpretability) over other conventional methods using a benchmark database. AutoScore will emerge as a potential scoring tool in various medical applications.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>clinical decision making</kwd>
        <kwd>machine learning</kwd>
        <kwd>prognosis</kwd>
        <kwd>clinical prediction rule</kwd>
        <kwd>electronic health records</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Risk-scoring models are sparse models with integer point scores, which are used pervasively throughout medicine for risk stratification [<xref ref-type="bibr" rid="ref1">1</xref>]. Risk-scoring models have been developed to determine which patients are at most risk of adverse events or worsening health conditions. Accurate identification of patients at risk can be useful for appropriate allocations of medical resources [<xref ref-type="bibr" rid="ref2">2</xref>-<xref ref-type="bibr" rid="ref4">4</xref>]. Risk-scoring models have been traditionally developed in 1 of 2 ways: through expert opinions or consensus, such as the Sepsis-related Organ Failure Assessment [<xref ref-type="bibr" rid="ref5">5</xref>] score and the National Early Warning Score [<xref ref-type="bibr" rid="ref6">6</xref>], and through the analysis of conventional cohort studies, such as the History, Electrocardiogram, Age, Risk factors, and Troponin score [<xref ref-type="bibr" rid="ref7">7</xref>] and the Charlson Comorbidity Index [<xref ref-type="bibr" rid="ref8">8</xref>]. Both approaches are labor-intensive and are not easy to update over time, which reveals the need for a flexible and fast approach to deriving risk-scoring models.</p>
      <p>At present, the increasing popularity of electronic health records (EHRs) [<xref ref-type="bibr" rid="ref9">9</xref>] creates an opportunity to take advantage of its growing quantity and diversity of data for creating novel risk models with both domain expert–curated approaches and advanced machine learning solutions. Although EHRs are rich data sources, numerous data items are collected in a nonsystematic way related to clinical use, leading to a bevy of irrelevant and redundant information. Therefore, variable selection, the process of determining a subset of relevant and discriminative variables for model development [<xref ref-type="bibr" rid="ref10">10</xref>], plays an essential role in the development of a risk model. In risk models, more variables do not necessarily lead to better performance [<xref ref-type="bibr" rid="ref11">11</xref>]. Moreover, irrelevant and redundant information can adversely affect model interpretability and accessibility, especially in the clinical context. A typical but time-intensive approach for variable selection uses domain knowledge obtained from literature reviews and consultation with experts; however, the literature may not always be available, and the expert’s interpretation could be biased. Analytic approaches exist, such as stepwise methods (eg, forward and backward) and regularization (eg, the least absolute shrinkage and selection operator [LASSO]). However, when data sets are large enough, these methods do not often achieve a sparse solution. Thus, there is an unmet need to develop a parsimonious model with easy access to validation in the context of EHRs.</p>
      <p>Model complexity not only affects model efficiency but also impacts transparency and interpretability [<xref ref-type="bibr" rid="ref12">12</xref>] in clinical practice. Although machine learning often has greater predictive accuracy than simpler models, it has 2 key shortcomings. First, machine learning is harder to implement in real-world settings where many EHR systems can only accept regression or point-based approaches [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref14">14</xref>]. Second, it has lower explainability due to its black box nature. Clinicians may not accept black box models due to various reasons such as lack of external validation and the involvement of complex mathematical computation. Sullivan et al [<xref ref-type="bibr" rid="ref15">15</xref>] suggested that the multivariable mathematical models are relatively complex, and the calculation should be simplified to allow application of models even without a computer, making these complex statistical models useful to clinical practitioners. Churpek et al [<xref ref-type="bibr" rid="ref4">4</xref>] also suggested that a simple and parsimonious model can be applied at the bedside and easily validated across different hospitals. Thus, point-based scoring models are more favored in the medical context and are still widely used in clinical decision making. However, as developing a scoring model is nontrivial, there is a need to automate the process of score generation to cater to the increasingly diversified patient population and large-scale EHRs.</p>
      <p>To tackle these problems and systematically present a robust and generic method for developing risk-scoring models, we proposed AutoScore, an automatic clinical score generator, by combining machine learning and regression modeling. The proposed AutoScore framework can automatically generate parsimonious sparse-score risk models (ie, risk scores), which can be easily implemented and validated in clinical practice. In this study, we implemented our proposed AutoScore framework to build an actual risk-scoring model for inpatient mortality prediction.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>AutoScore for Automatic Score Generation</title>
        <p>In this paper, we proposed the AutoScore, a novel framework for automating the development of a clinical scoring model for predefined outcomes and systematically presented its structure. AutoScore consists of 6 modules: variable ranking with machine learning, variable transformation, score derivation, model selection, domain knowledge–based score fine-tuning, and model evaluation. In our demonstration, the full data set was randomly split into a nonoverlapping training set (70%), validation set (10%; if downstream parameter tuning is needed), and test set (20%). The training set was used to derive the scores. The validation set was used for intermediate performance evaluation and parameter selection, which were elaborated in Module 4. The test set acted as an unseen data set and was used to generate the metrics of final model performance in Module 6. In real-world clinical applications, users can set up training, validation, and test sets accordingly instead of random splitting. <xref rid="figure1" ref-type="fig">Figure 1</xref> illustrates the framework of AutoScore, and details of its 6 modules are elaborated as follows.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Flowchart of the AutoScore framework. ROC: receiver operating characteristic.</p>
          </caption>
          <graphic xlink:href="medinform_v8i10e21798_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <sec>
          <title>Module 1: Variable Ranking With Machine Learning</title>
          <p>The first step in the AutoScore framework is variable ranking. We use random forest (RF) [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref17">17</xref>], an ensemble machine learning algorithm, to identify the top-ranking predictors for subsequent score generation. RF consists of multiple tree-structured classifiers (decision trees). Each of the trees is grown using a classification and regression tree [<xref ref-type="bibr" rid="ref18">18</xref>] to maximum size, without pruning, and trained on a bootstrap sample and a random subset of all variables. Each tree sees only a subset of variables and part of the observations by resampling, which guarantees that the trees are decorrelated and, therefore, less prone to overfitting [<xref ref-type="bibr" rid="ref19">19</xref>]. For the classification task, the Gini index is used to determine the optimal split. For each node <inline-graphic xlink:href="medinform_v8i10e21798_fig6.png" mimetype="image" xlink:type="simple"/>

          
          
          of a decision tree <inline-graphic xlink:href="medinform_v8i10e21798_fig7.png" mimetype="image" xlink:type="simple"/>, the Gini index can be defined as follows:</p>
          <graphic xlink:href="medinform_v8i10e21798_fig8.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          <p>where <italic>p<sub>r</sub></italic> refers to the fraction of training samples from the <italic>r</italic><sup>th</sup> class in the node<inline-graphic xlink:href="medinform_v8i10e21798_fig6.png" mimetype="image" xlink:type="simple"/> and 
         
       <italic> R=2</italic> in binary classification. In addition to outcome prediction, RF ranks variables on the basis of their predictive importance [<xref ref-type="bibr" rid="ref20">20</xref>]. The mean decrease impurity is the measurement of variable importance, calculated by the total decrease in node impurities from splitting on the variable. The importance measurement of a variable <italic>X<sub>m</sub></italic> is the weighted total of impurity decreases<italic>
          
          w(<inline-graphic xlink:href="medinform_v8i10e21798_fig6.png" mimetype="image" xlink:type="simple"/>)ΔGini(<inline-graphic xlink:href="medinform_v8i10e21798_fig6.png" mimetype="image" xlink:type="simple"/>)</italic> for all nodes <inline-graphic xlink:href="medinform_v8i10e21798_fig6.png" mimetype="image" xlink:type="simple"/><italic>,</italic> averaged over all trees [<xref ref-type="bibr" rid="ref21">21</xref>]:</p>
          <graphic xlink:href="medinform_v8i10e21798_fig13.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          <p>Where <italic>w(<inline-graphic xlink:href="medinform_v8i10e21798_fig6.png" mimetype="image" xlink:type="simple"/>)</italic> is the proportional weight <italic>N<sub><inline-graphic xlink:href="medinform_v8i10e21798_fig6.png" mimetype="image" xlink:type="simple"/></sub>/ N</italic> of samples reaching node <inline-graphic xlink:href="medinform_v8i10e21798_fig6.png" mimetype="image" xlink:type="simple"/>, v(<inline-graphic xlink:href="medinform_v8i10e21798_fig6.png" mimetype="image" xlink:type="simple"/>) is the variable in the split of the node <inline-graphic xlink:href="medinform_v8i10e21798_fig6.png" mimetype="image" xlink:type="simple"/>, <italic>ΔGini(<inline-graphic xlink:href="medinform_v8i10e21798_fig6.png" mimetype="image" xlink:type="simple"/>)</italic> is the total impurity decrease after the split of the node<inline-graphic xlink:href="medinform_v8i10e21798_fig6.png" mimetype="image" xlink:type="simple"/>; and <italic>N<sub><inline-graphic xlink:href="medinform_v8i10e21798_fig7.png" mimetype="image" xlink:type="simple"/></sub></italic>
    
    
    
    
    
    is the number of decision trees in the RF model. 
    
    
    
    Then, <italic>Imp(X<sub>m</sub>)</italic>
    
    

    
    will be used for variable ranking for each <italic>X<sub>m</sub></italic>.
    

    
    
    </p>
          <p>An advantage of using RF as the variable ranker over other methods such as backward stepwise regression or LASSO is that as a nonparametric model, RF is able to rank variables on the basis of their nonlinear and heterogeneous effects. In the AutoScore framework, the final list of variables is decided by the ranking, in addition to the parameter <italic>m</italic>, which is the number of final selected variables. Parameter <italic>m</italic> can be chosen case by case in accordance with clinical preference, expert knowledge, or the needs of real-world applications. Moreover, an optimized number of variables can be determined through grid search and performance validation, which will be elaborated in Module 4.</p>
        </sec>
        <sec>
          <title>Module 2: Variable Transformation</title>
          <p>After variable selection, all selected variables are preprocessed for variable transformation, that is, continuous variables are converted into categorical variables. Creating categorical variables allows for the modeling of nonlinear effects. In AutoScore, the maximum number of categories (eg, <italic>K</italic>=5) for each variable is predefined to ensure its usability. For a categorical variable, if the original number of categories (<italic>L</italic>) exceeds the predefined maximum number (ie, <italic>L</italic>&#62;<italic>K</italic>), several excess categories need to be combined, and <italic>K'</italic> is the number of categories of the transformed variable where <italic>K'</italic>≤<italic>L</italic>. Unlike categorical variables, to develop a point-based score, continuous variables will be stratified by specific quantiles into <italic>K</italic> categories (in our study, <italic>K</italic>=5). We set the quantiles as 0%, <italic>k</italic><sub>1</sub>%, <italic>k</italic><sub>2</sub>%, <italic>k</italic><sub>3</sub>%, <italic>k</italic><sub>4</sub>%, and 100%. The values of <italic>k</italic><sub>1</sub>, <italic>k</italic><sub>2</sub>, <italic>k</italic><sub>3</sub>, and <italic>k</italic><sub>4</sub> can be set in accordance with the distributions of the variables. In our study, we set the default values as follows: <italic>k</italic><sub>1</sub>=5, <italic>k</italic><sub>2</sub>=20, <italic>k</italic><sub>3</sub>=80, and <italic>k</italic><sub>4</sub>=95, which were appropriate for most variables (such as common vital signs and laboratory test results), especially those with normal or near-normal distributions.</p>
        </sec>
        <sec>
          <title>Module 3: Score Derivation by Weighting and Normalization</title>
          <p>With the selected and transformed variables, we created a risk score to predict the outcome, in which each category of an individual variable is weighted and given an integer point. As the default setting, we used logistic regression for score weighting, with which the points can be easily interpreted.</p>
          <graphic xlink:href="medinform_v8i10e21798_fig20.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          <p>Where <italic>β<sub>0</sub></italic> is the intercept, <italic>β<sub>1</sub></italic>. . . <italic>β<sub>m</sub></italic> are the coefficients for each category, <italic>X<sub>1</sub></italic>. . . <italic>X<sub>m</sub></italic> are the predictive variables, and <italic>Y</italic> is the binary outcome.</p>
          <p>Multivariable logistic regression is performed to determine regression coefficients. On the basis of the results, the category of each variable with the lowest <italic>β</italic> coefficient is set as the reference. Next, multivariable logistic regression is performed again with adjusted reference categories to ensure that there are no negative coefficients. Subsequently, all coefficients <italic>β</italic> obtained from the second-round logistic regression are divided by the lowest <italic>β</italic> of all variables to ensure that all of the points are larger than one, that is, 
          <italic>
          β<sub>new</sub> = β/β<sub>lowest</sub></italic>. The final weighted points for each category were rounded as <italic>
          
          β<sub>score</sub> = round(β<sub>new</sub>)</italic>. 
          
          
          
          
          With <italic>β<sub>score</sub></italic>, we can obtain a scoring table where each category of a variable is given certain points. The total score is computed by summing up all points. To satisfy the need for specific clinical applications, we can set the ceiling value for the total score and normalize the score breakdowns, divided by a common denominator.</p>
        </sec>
        <sec>
          <title>Module 4: Model Selection and Parameter Determination</title>
          <p>The number of variables (<italic>m</italic>) is a critical parameter for controlling model complexity in the scoring model. A model is considered parsimonious when it is both sparse (using the least number of variables possible) and possesses a good prediction accuracy. To cope with the trade-off between accuracy and complexity, different parameter <italic>m</italic> will be examined on the validation set and a parsimony plot (ie, model performance vs complexity) will be plotted, to which the user can refer for deciding the trade-off in deriving the risk scores. The best parameter <italic>m</italic> is determined when <italic>m</italic> continues to increment and the prediction performance is no longer improving significantly, as shown in the parsimony plot. After confirming the parameter <italic>m</italic>, the final list of variables will be determined on the basis of the ranking obtained from Module 1. Modules 2 and 3 will be reimplemented to generate the initial scoring model.</p>
        </sec>
        <sec>
          <title>Module 5: Fine-Tuning Cutoff Points in the Variable Transformation</title>
          <p>Domain knowledge is essential in guiding risk model development. For continuous variables, the variable transformation (Module 2) is a data-driven process, in which domain knowledge is not integrated. In this module, the automatically generated cutoff values for each continuous variable can be fine-tuned by combining, rounding, and adjusting according to the standard clinical norm. The fine-tuning process endows the final risk scores with orderliness, professionality, and acceptability. After adjusting the cutoffs to convert continuous variables into categorical variables, Modules 2 and 3 will be implemented again to create an updated score table.</p>
        </sec>
        <sec>
          <title>Module 6: Predictive Performance Evaluation</title>
          <p>The performance of the score is evaluated on the basis of the receiver operating characteristic (ROC) analysis. The intermediate evaluation based on the validation set provides information for model optimization (eg, Modules 4 and 5). For the final model evaluation based on the unseen test set, the area under the ROC curve (AUC) acts as the primary metric. In addition, sensitivity, specificity, positive predictive value (PPV), and negative predictive value (NPV) are calculated under the optimal cutoffs, defined as the points nearest to the upper-left corner of the ROC curves. Performance metrics under different cutoffs are also compared to evaluate the predictive performance. In the demonstration, we included cutoffs, by which the sensitivity or specificity could reach about 95% to satisfy certain needs in clinical settings.</p>
        </sec>
      </sec>
      <sec>
        <title>Software Package</title>
        <p>We have introduced all the 6 major modules of the AutoScore framework, with which clinical risk scores can be developed using specific patient cohorts and outcomes. We further created the AutoScore software suite [<xref ref-type="bibr" rid="ref22">22</xref>] (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendices 1</xref> and <xref ref-type="supplementary-material" rid="app2">2</xref>) under the R 3.5.3 (R Foundation) programming environment to demonstrate its capability and to facilitate its implementation and validation in other applications. Given a new data set, the AutoScore tool can be conveniently implemented to generate a point-based clinical scoring model to predict the outcome, with the minimum manual processes for data processing, parameter tuning, and model fine-tuning.</p>
      </sec>
      <sec>
        <title>Clinical Study Design</title>
        <p>We conducted a retrospective analysis of data from the Beth Israel Deaconess Medical Center (BIDMC) to demonstrate the usability of our proposed AutoScore framework. BIDMC is a teaching hospital at the Harvard Medical School in Boston. It has 673 inpatient beds and receives about 55,000 emergency department visits annually. We aimed to implement AutoScore to automatically generate point-based scores for risk prediction of inpatient mortality and compared AutoScore-created scoring models with several baseline models.</p>
        <sec>
          <title>Data Collection and Cohort</title>
          <p>The BIDMC data set was obtained from the Medical Information Mart for Intensive Care III [<xref ref-type="bibr" rid="ref23">23</xref>] database compiled by the Massachusetts Institute of Technology Laboratory for Computational Physiology. A total of 58,976 BIDMC admission encounters from 2001 to 2012 were recorded in this database. All inpatient encounters for which the patient aged 18 to 90 years were included in our study cohort. The admission episodes during which patients died within 24 hours after the intensive care unit (ICU) admission or missed more than 50% of the features were excluded. A flowchart of cohort formation is shown in <xref rid="figure2" ref-type="fig">Figure 2</xref>.</p>
          <fig id="figure2" position="float">
            <label>Figure 2</label>
            <caption>
              <p>Flowchart of the study cohort formation. BIDMC: Beth Israel Deaconess Medical Center.</p>
            </caption>
            <graphic xlink:href="medinform_v8i10e21798_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Variables and Clinical Outcome</title>
          <p>The primary outcome in this study was inpatient mortality, defined as deaths that occurred during the hospital stay. In the BIDMC data set, we extracted patients’ first-day variables during their ICU stay. We previously demonstrated that demographic features, vital signs, and laboratory tests were highly related to inpatient mortality [<xref ref-type="bibr" rid="ref24">24</xref>]. Similar results were also reported in other studies [<xref ref-type="bibr" rid="ref25">25</xref>]. Thus, the predictor variables included age, sex, race, type of insurance, heart rate (beats/min), respiration rate (breaths/min), peripheral capillary oxygen saturation (SpO<sub>2</sub>; %), diastolic blood pressure (mm Hg), systolic blood pressure (mm Hg), mean arterial pressure (MAP; mm Hg), temperature (°C), bicarbonate (mmol/L), creatinine (μmol/L), potassium (mmol/L), sodium (mmol/L), hemoglobin (g/dL), glucose (mg/dL), blood urea nitrogen (BUN; mg/dL), platelet (thousand per microliter), lactate (mmol/L), anion gap (mEq/L), hematocrit (%), chloride (mEq/L), and white blood cells (thousand per microliter). As there were multiple sets of vital signs or laboratory data collected in the ICU, the mean values were used in this study.</p>
        </sec>
        <sec>
          <title>Baseline Models Versus AutoScore</title>
          <p>To evaluate the performance of AutoScore, we compared it with several standard predictive models. The first model was built with logistic regression by using all available variables from the training data set without variable selection. The second model was built using stepwise multivariable logistic regression [<xref ref-type="bibr" rid="ref26">26</xref>]. It built a regression model with variable selection using the Akaike information criterion (AIC). Backward selection began with all the variables and removed the least significant one at each step following the declined AIC until none met the criterion. It penalized models with a large number of variables for a simple and parsimonious model. The third baseline model was built with LASSO [<xref ref-type="bibr" rid="ref27">27</xref>], which is another popular method used in clinical modeling. It is a regression-based method that performs regularization for variable selection to improve both the predictive accuracy and interpretability of the statistical model. Its regularization rate was optimized through 10-fold cross-validation in our study. The last two baseline models were built using RF. We created both a full RF model using all available variables and an RF model using the AutoScore-selected variables. The parameters were selected according to the suggestions in previous literature [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref29">29</xref>], where <italic>ntree</italic>=100 and <italic>mtry</italic>=<italic>m</italic><sup>1/2</sup> (<italic>ntree</italic>: the number of trees grown; <italic>mtry</italic>: the number of variables randomly sampled as candidates at each split).</p>
        </sec>
      </sec>
      <sec>
        <title>Statistical Analysis and Model Evaluation</title>
        <p>Data were analyzed using R 3.5.3 (R Foundation). The baseline characteristics of the data set are described. In the descriptive summaries, frequencies and percentages were reported for categorical variables, whereas means and SDs were reported for continuous variables. We compared patients with and without inpatient mortality using a two-tailed Student <italic>t</italic> test for continuous variables and the χ<sup>2</sup> test for categorical variables. During the analysis, values of vital signs or laboratory tests were considered as outliers if they were beyond the normal range on the basis of domain knowledge. All detected outliers were set as missing values, which were subsequently imputed with the median values that were computed from the training set.</p>
        <p>We compared the AutoScore-created scoring model with several baseline models to evaluate their predictive accuracy and interpretability. The test set was used to generate the metrics of model performance, and its bootstrapped samples were applied to calculate 95% CIs. Predictive accuracy was compared on the basis of ROC analysis and AUC values. Model interpretability was assessed by its complexity (eg, the number of variables included and the level of model nonlinearity) and its inherent explainability of the internal interaction. Model calibration was evaluated using the calibration belt plot test [<xref ref-type="bibr" rid="ref30">30</xref>]. In addition, the distribution and observed mortality rate for each aggregated score were plotted for displaying its discriminative power.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Baseline Characteristics of the Study Cohort</title>
        <p>In this study, a total of 44,918 individual ICU admission episodes from the BIDMC data set were selected (<xref rid="figure2" ref-type="fig">Figure 2</xref>). Of all eligible episodes, 8.8% (3958/44,918) of the episodes had an outcome, that is, inpatient mortality. Summary baseline characteristics are shown in <xref ref-type="table" rid="table1">Table 1</xref>, and the distributions of other clinical continuous variables are shown in <xref ref-type="table" rid="table2">Table 2</xref>. In this cohort, the mean age was 62.5 (SD 16.5) years, 57.4% (25,788/44,918) were male, 84.9% (38,138/44,918) admissions were emergent, and the ethnic compositions were complex (31,889/44,918, 71.0% White; 4399/44,918, 9.8% African; 1625/44,918, 3.6% Hispanic; 1034/44,918, 2.3% Asian; and 5971/44,918, 13.3% others or unknown). We noticed that patients were admitted into different ICUs, which included Coronary Care Unit (CCU), Cardiac Surgery Recovery Unit (CSRU), Medical Intensive Care Unit (MICU), Surgical Intensive Care Unit (SICU), and Trauma Surgical Intensive Care Unit (TSICU). The average length of stay for all admission episodes was 4.19 (SD 6.11) days. Compared with the patients who survived to discharge, patients who died in hospitals were older, had a higher chance of emergency admission, had a longer length of stay, and a higher probability of being admitted to the MICU and paying by Medicare.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Description of the study cohort (N=44,918).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="230"/>
            <col width="220"/>
            <col width="220"/>
            <col width="220"/>
            <col width="0"/>
            <col width="80"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Variables</td>
                <td>All episodes (N=44,918)</td>
                <td>Live discharged (n=40,960)</td>
                <td>Inpatient mortality (n=3958)</td>
                <td colspan="2"><italic>P</italic> value</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="2">Age (years), mean (SD)</td>
                <td>62.5 (16.5)</td>
                <td>62.0 (16.6)</td>
                <td>68.5 (14.7)</td>
                <td colspan="2">&#60;.001</td>
              </tr>
              <tr valign="top">
                <td colspan="6">
                  <bold>Gender, n (</bold>
                  <bold>%)</bold>
                </td>
                <td>.04</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Male</td>
                <td>25,788 (57.4)</td>
                <td>23,578 (57.6)</td>
                <td>2210 (55.8)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Female</td>
                <td>19,130 (42.6)</td>
                <td>17,382 (42.4)</td>
                <td>1748 (44.2)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td colspan="6">
                  <bold>Admission</bold>
                  <bold>type, n (%)</bold>
                </td>
                <td>&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Emergency</td>
                <td>38,138 (84.9)</td>
                <td>34,339 (83.8)</td>
                <td>3799 (96.0)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Elective</td>
                <td>6780 (15.1)</td>
                <td>6621 (16.2)</td>
                <td>159 (4.0)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td colspan="6">
                  <bold>Ethnicity, n</bold>
                  <bold>(%)</bold>
                </td>
                <td>&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>White</td>
                <td>31,889 (71.0)</td>
                <td>29,148 (71.2)</td>
                <td>2741 (69.3)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Hispanic</td>
                <td>1625 (3.6)</td>
                <td>1539 (3.8)</td>
                <td>86 (2.2)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Asian</td>
                <td>1034 (2.3)</td>
                <td>933 (2.3)</td>
                <td>101 (2.6)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>African</td>
                <td>4399 (9.8)</td>
                <td>4110 (10.0)</td>
                <td>289 (7.3)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Others or unknown</td>
                <td>5971 (13.3)</td>
                <td>5230 (12.8)</td>
                <td>741 (18.7)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td colspan="6">
                  <bold>Insurance, n</bold>
                  <bold>(%)</bold>
                </td>
                <td>&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Government</td>
                <td>1326 (3.0)</td>
                <td>1258 (3.1)</td>
                <td>68 (1.7)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Medicaid</td>
                <td>4176 (9.3)</td>
                <td>3896 (9.5)</td>
                <td>280 (7.1)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Medicare</td>
                <td>23,878 (53.2)</td>
                <td>21,283 (52.0)</td>
                <td>2595 (65.6)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Private</td>
                <td>15,031 (33.5)</td>
                <td>14,063 (34.3)</td>
                <td>968 (24.5)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Self-pay</td>
                <td>507 (1.1)</td>
                <td>460 (1.1)</td>
                <td>47 (1.2)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td colspan="6">
                  <bold>ICU<sup>a</sup></bold>
                  <bold>type, n</bold>
                  <bold>(%)</bold>
                </td>
                <td>&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>CCU<sup>b</sup></td>
                <td>6445 (14.3)</td>
                <td>5907 (14.4)</td>
                <td>538 (13.6)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>CSRU<sup>c</sup></td>
                <td>8284 (18.4)</td>
                <td>8031 (19.6)</td>
                <td>253 (6.4)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>MICU<sup>d</sup></td>
                <td>17,490 (38.9)</td>
                <td>15,420 (37.6)</td>
                <td>2070 (52.3)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>SICU<sup>e</sup></td>
                <td>7320 (16.3)</td>
                <td>6649 (16.2)</td>
                <td>671 (17.0)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>TSICU<sup>f</sup></td>
                <td>5379 (12.0)</td>
                <td>4953 (12.1)</td>
                <td>426 (10.8)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td colspan="2">Length of stay (days), mean (SD)</td>
                <td>4.19 (6.11)</td>
                <td>3.87 (5.75)</td>
                <td>7.57 (8.36)</td>
                <td colspan="2">&#60;.001</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>ICU: intensive care unit.</p>
            </fn>
            <fn id="table1fn2">
              <p><sup>b</sup>CCU: coronary care unit.</p>
            </fn>
            <fn id="table1fn3">
              <p><sup>c</sup>CSRU: cardiac surgery recovery unit.</p>
            </fn>
            <fn id="table1fn4">
              <p><sup>d</sup>MICU: medical intensive care unit.</p>
            </fn>
            <fn id="table1fn5">
              <p><sup>e</sup>SICU: surgical intensive care unit.</p>
            </fn>
            <fn id="table1fn6">
              <p><sup>f</sup>TSICU: trauma surgical intensive care unit.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Distribution of clinical variables in the study cohort.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="700"/>
            <col width="300"/>
            <thead>
              <tr valign="top">
                <td>Variables</td>
                <td>Values, median (IQR)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Age (years)</td>
                <td>64.4 (51.9-75.9)</td>
              </tr>
              <tr valign="top">
                <td>Heart rate (beats/min)</td>
                <td>84.4 (74.5- 95.2)</td>
              </tr>
              <tr valign="top">
                <td>Systolic blood pressure (mm Hg)</td>
                <td>116.7 (107.1-129.5)</td>
              </tr>
              <tr valign="top">
                <td>Diastolic blood pressure (mm Hg)</td>
                <td>60 (53.7-67.4)</td>
              </tr>
              <tr valign="top">
                <td>Mean arterial pressure (mm Hg)</td>
                <td>76.9 (70.7-84.9)</td>
              </tr>
              <tr valign="top">
                <td>Respiration rate (breaths/min)</td>
                <td>18.0 (15.9-20.6)</td>
              </tr>
              <tr valign="top">
                <td>Temperature (°C)</td>
                <td>36.8 (36.5-37.2)</td>
              </tr>
              <tr valign="top">
                <td>Peripheral capillary oxygen saturation (SpO<sub>2</sub>; %)</td>
                <td>97.6 (96.2-98.7)</td>
              </tr>
              <tr valign="top">
                <td>Glucose (mg/dL)</td>
                <td>129.0 (111.3-154.3)</td>
              </tr>
              <tr valign="top">
                <td>Anion gap (mEq/L)</td>
                <td>13.5 (12-16)</td>
              </tr>
              <tr valign="top">
                <td>Bicarbonate (mmol/L)</td>
                <td>24.0 (21.5-26.5)</td>
              </tr>
              <tr valign="top">
                <td>Creatinine (μmol/L)</td>
                <td>0.95 (0.7-1.4)</td>
              </tr>
              <tr valign="top">
                <td>Chloride (mEq/L)</td>
                <td>105 (101.5-108)</td>
              </tr>
              <tr valign="top">
                <td>Lactate (mmol/L)</td>
                <td>1.8 (1.7-2.0)</td>
              </tr>
              <tr valign="top">
                <td>Hemoglobin (g/dL)</td>
                <td>10.9 (9.6-12.3)</td>
              </tr>
              <tr valign="top">
                <td>Hematocrit (%)</td>
                <td>32.3 (28.8-36.4)</td>
              </tr>
              <tr valign="top">
                <td>Platelet (thousand per microliter)</td>
                <td>208.5 (153.5-276.5)</td>
              </tr>
              <tr valign="top">
                <td>Potassium (mmol/L)</td>
                <td>4.2 (3.8-4.5)</td>
              </tr>
              <tr valign="top">
                <td>Blood urea nitrogen (mg/dL)</td>
                <td>18.0 (12.5-29.5)</td>
              </tr>
              <tr valign="top">
                <td>Sodium (mmol/L)</td>
                <td>138.5 (136-140.5)</td>
              </tr>
              <tr valign="top">
                <td>White blood cells (thousand per microliter)</td>
                <td>10.7 (8.0-14.3)</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Comparison of Selected Variables</title>
        <p><xref ref-type="table" rid="table3">Table 3</xref> depicts the comparison of selected variables in the final model with different methods. The stepwise regression selected 22 variables, whereas the LASSO algorithm selected 17 variables after parameter tuning by 10-fold cross-validation. AutoScore selected a predefined number (<italic>m</italic>) of variables, and parameter <italic>m</italic> was optimized by a parsimony plot (ie, model performance vs complexity) on the validation set. As shown in part (a) of <xref rid="figure3" ref-type="fig">Figure 3</xref>, we chose 9 variables as the parsimonious choice as it achieved a good balance in the parsimony plot. When more variables were added to the scoring model, the performance was not markedly improved. Nine and 12 were selected as the number of variables in the demonstration. Users can also choose another parameter <italic>m</italic> if other restrictions or clinical preferences exist in real-life application scenarios. As seen from <xref ref-type="table" rid="table3">Table 3</xref>, the selected variables of AutoScore mostly coincided with those of the stepwise regression and LASSO. Notably, AutoScore generated a more parsimonious selection and sparse solution, catering to user preference and practical need.</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Selected variables by AutoScore and other baseline models.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="300"/>
            <col width="270"/>
            <col width="150"/>
            <col width="140"/>
            <col width="140"/>
            <thead>
              <tr valign="top">
                <td>Variables</td>
                <td>Stepwise</td>
                <td>LASSO</td>
                <td>AutoScore (<italic>m</italic>=12)<sup>a</sup></td>
                <td>AutoScore (<italic>m</italic>=9)<sup>a</sup></td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Age (years)</td>
                <td>✔<sup>b</sup></td>
                <td>✔</td>
                <td>✔</td>
                <td>✔</td>
              </tr>
              <tr valign="top">
                <td>Ethnicity</td>
                <td>✔</td>
                <td>✔</td>
                <td>—<sup>c</sup></td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td>Insurance</td>
                <td>✔</td>
                <td>✔</td>
                <td>—</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td>Gender</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td>Heart rate</td>
                <td>✔</td>
                <td>✔</td>
                <td>✔</td>
                <td>✔</td>
              </tr>
              <tr valign="top">
                <td>Systolic blood pressure</td>
                <td>✔</td>
                <td>✔</td>
                <td>✔</td>
                <td>✔</td>
              </tr>
              <tr valign="top">
                <td>Diastolic blood pressure</td>
                <td>✔</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td>Mean arterial pressure</td>
                <td>✔</td>
                <td>✔</td>
                <td>—</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td>Respiration rate</td>
                <td>✔</td>
                <td>✔</td>
                <td>✔</td>
                <td>✔</td>
              </tr>
              <tr valign="top">
                <td>Temperature</td>
                <td>✔</td>
                <td>✔</td>
                <td>✔</td>
                <td>✔</td>
              </tr>
              <tr valign="top">
                <td>SpO<sub>2</sub><sup>d</sup></td>
                <td>✔</td>
                <td>✔</td>
                <td>✔</td>
                <td>✔</td>
              </tr>
              <tr valign="top">
                <td>Glucose</td>
                <td>✔</td>
                <td>✔</td>
                <td>✔</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td>Anion gap</td>
                <td>✔</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td>Bicarbonate</td>
                <td>✔</td>
                <td>✔</td>
                <td>✔</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td>Creatinine</td>
                <td>✔</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td>Chloride</td>
                <td>✔</td>
                <td>✔</td>
                <td>—</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td>Hematocrit</td>
                <td>✔</td>
                <td>✔</td>
                <td>—</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td>Hemoglobin</td>
                <td>✔</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td>Lactate</td>
                <td>✔</td>
                <td>✔</td>
                <td>✔</td>
                <td>✔</td>
              </tr>
              <tr valign="top">
                <td>Platelet</td>
                <td>✔</td>
                <td>✔</td>
                <td>✔</td>
                <td>✔</td>
              </tr>
              <tr valign="top">
                <td>Potassium</td>
                <td>✔</td>
                <td>✔</td>
                <td>—</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td>BUN<sup>e</sup></td>
                <td>✔</td>
                <td>—</td>
                <td>✔</td>
                <td>✔</td>
              </tr>
              <tr valign="top">
                <td>Sodium</td>
                <td>—</td>
                <td>✔</td>
                <td>—</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td>White blood cells</td>
                <td>✔</td>
                <td>—</td>
                <td>✔</td>
                <td>—</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>Parameter <italic>m</italic> is the number of variables included in the AutoScore model.</p>
            </fn>
            <fn id="table3fn2">
              <p><sup>b</sup>Tick mark represents that this variable is included by the corresponding method.</p>
            </fn>
            <fn id="table3fn3">
              <p><sup>c</sup>This variable is not included by the corresponding method.</p>
            </fn>
            <fn id="table3fn4">
              <p><sup>d</sup>SpO<sub>2</sub>: peripheral capillary oxygen saturation.</p>
            </fn>
            <fn id="table3fn5">
              <p><sup>e</sup>BUN: blood urea nitrogen.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Model performance versus complexity for the implementation of the AutoScore on (a) the validation set and (b) the test set. The area under the curve reflects the discrimination performance, whereas the number of variables represents the complexity of the model.</p>
          </caption>
          <graphic xlink:href="medinform_v8i10e21798_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Scoring Models by AutoScore</title>
        <p>The nine-variable AutoScore-created scoring model of inpatient mortality for the BIDMC data set is tabulated in <xref ref-type="table" rid="table4">Table 4</xref>. Age, heart rate, respiration rate, systolic blood pressure, SpO<sub>2</sub>, temperature, BUN, platelet, and lactate levels were selected into the final models. The final score summed up from 9 breakdowns ranged from 0 to 162. We used the test set to evaluate the property of this nine-variable point-based score. Part (a) of <xref rid="figure4" ref-type="fig">Figure 4</xref> depicts the distribution of episodes at different score intervals, which is a near-normal distribution. Most patients had a risk score from 21 to 50, and very few patients had scores under 10 or above 80. As seen in part (b) of <xref rid="figure4" ref-type="fig">Figure 4</xref>, the observed mortality rate increased as our risk scores grew on the test set. The observed mortality rate was about 10% for a score of 50, whereas the mortality rate was over 50% for scores above 90. In terms of different breakdowns of the score, when age was lower than 30 years, its corresponding risk was the lowest; when it was higher than 85 years, the risk was the highest. Similarly, when the reported temperature was between 36.5°C and 37.5°C, the corresponding risk was the lowest, and when it was lower than 36°C, the risk was the highest. In addition, some variables, such as age, SpO<sub>2</sub>, and BUN, have larger score values, indicating more significant contributions to the risk.</p>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>A nine-variable AutoScore-created scoring model for inpatient mortality.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="570"/>
            <col width="400"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Variables and interval<sup>a</sup></td>
                <td>Point</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="3">
                  <bold>Age (years)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>&#60;30</td>
                <td>0</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>30-48</td>
                <td>5</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>48-78</td>
                <td>14</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>78-85</td>
                <td>22</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>≥85</td>
                <td>24</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Heart rate (beats/min)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>&#60;62</td>
                <td>1</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>62-72</td>
                <td>0</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>72-98</td>
                <td>1</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>98-112</td>
                <td>8</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>≥112</td>
                <td>13</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Respiration rate (breaths/min)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>&#60;12</td>
                <td>3</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>12-16</td>
                <td>0</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>16-22</td>
                <td>4</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>≥22</td>
                <td>12</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Systolic blood pressure (mm Hg)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>&#60;90</td>
                <td>15</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>90-100</td>
                <td>8</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>100-130</td>
                <td>0</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>130-150</td>
                <td>1</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>≥150</td>
                <td>3</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Temperature (°C)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>&#60;36</td>
                <td>12</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>36-36.5</td>
                <td>3</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>36.5-37.5</td>
                <td>0</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>37.5-38</td>
                <td>5</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>≥38</td>
                <td>9</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>SpO<sub>2</sub><sup>b</sup>(%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>&#60;85</td>
                <td>25</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>85-90</td>
                <td>13</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>90-95</td>
                <td>4</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>≥95</td>
                <td>0</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Platelet (thousand per microliter)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>&#60;80</td>
                <td>17</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>80-150</td>
                <td>3</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>150-300</td>
                <td>0</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>300-450</td>
                <td>3</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>≥450</td>
                <td>5</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Blood urea nitrogen (mg/dL)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>&#60;7.5</td>
                <td>0</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>7.5-12</td>
                <td>2</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>12-35</td>
                <td>9</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>35-70</td>
                <td>19</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>≥70</td>
                <td>23</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Lactate (mmol/L)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>&#60;1</td>
                <td>0</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>1-2.5</td>
                <td>2</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>2.5-4</td>
                <td>8</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>≥4</td>
                <td>21</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table4fn1">
              <p><sup>a</sup>Interval (q<sub>1</sub>-q<sub>2</sub>) represents q<sub>1</sub> ≤<italic>x</italic>&#60;q<sub>2</sub>.</p>
            </fn>
            <fn id="table4fn2">
              <p><sup>b</sup>SpO<sub>2</sub>: peripheral capillary oxygen saturation.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>(a) Number of cases and (b) observed mortality rate, versus different score intervals obtained by the nine-variable AutoScore model.</p>
          </caption>
          <graphic xlink:href="medinform_v8i10e21798_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Comparison of Predictive Performance</title>
        <p>The results of mortality prediction, as assessed by the ROC analysis on the unseen test set, are reported in <xref ref-type="table" rid="table5">Table 5</xref>. The scoring models generated by AutoScore showed promising discriminatory capability in predicting inpatient mortality. The 12-variable AutoScore model achieved an AUC of 0.789 (95% CI 0.773-0.802) with a sensitivity of 71.7% (95% CI 68.5%-74.7%) and a specificity of 71.7% (95% CI 70.7%-72.7%) under the optimal threshold (score=130). When we compromised on accuracy for parsimony, the nine-variable AutoScore model achieved a slightly lower AUC of 0.780 (95% CI 0.764-0.798) with a sensitivity of 63.7% (95% CI 60.3%-67.1%) and a specificity of 77.2% (95% CI 76.3%-78.2%) under the optimal threshold (score=48). In comparison, the performance of the 24-variable full logistic regression, the 22-variable stepwise regression, the 17-variable LASSO models, the nine-variable RF model, and the 24-variable full RF model achieved AUC values of 0.778 (95% CI 0.760-0.795), 0.778 (95% CI 0.760-0.795), 0.772 (95% CI 0.755-0.790), 0.785 (95% CI 0.768-0.801), and 0.809 (95% CI 0.794-0.825), respectively. <xref ref-type="table" rid="table5">Table 5</xref> presents the performance metrics that were calculated under different score cutoffs. Besides the optimal cutoffs, other cutoffs by which the sensitivity or specificity could reach approximately 95% were also evaluated.</p>
        <table-wrap position="float" id="table5">
          <label>Table 5</label>
          <caption>
            <p>Performance of the AutoScore and other baseline models.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="190"/>
            <col width="50"/>
            <col width="90"/>
            <col width="180"/>
            <col width="180"/>
            <col width="140"/>
            <col width="140"/>
            <thead>
              <tr valign="bottom">
                <td colspan="2">Methods, AUC<sup>a</sup> (95% CI)</td>
                <td>
                  <italic>m</italic>
                  <sup>b</sup>
                </td>
                <td>Threshold</td>
                <td>Sensitivity (%), 95% CI</td>
                <td>Specificity (%), 95% CI</td>
                <td>PPV<sup>c</sup> (%), 95% CI</td>
                <td>NPV<sup>d</sup> (%), 95% CI</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="8">
                  <bold>AutoScore (<italic>m</italic><sup>b</sup>=9)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>0.780 (0.764-0.798)</td>
                <td>9</td>
                <td>48<sup>e</sup></td>
                <td>63.7 (60.3-67.1)</td>
                <td>77.2 (76.3-78.2)</td>
                <td>20.9 (19.8-22.0)</td>
                <td>95.8 (95.4-96.1)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>N/A<sup>f</sup></td>
                <td>N/A</td>
                <td>30<sup>g</sup></td>
                <td>95.7 (94.3-97.2)</td>
                <td>25.1 (24.2-26.0)</td>
                <td>10.8 (10.6-10.9)</td>
                <td>98.4 (97.9-98.9)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>N/A</td>
                <td>N/A</td>
                <td>64<sup>h</sup></td>
                <td>28.8 (25.7-32.0)</td>
                <td>95.5 (95.0-95.9)</td>
                <td>37.6 (34.2-41.0)</td>
                <td>93.4 (93.2-93.7)</td>
              </tr>
              <tr valign="top">
                <td colspan="8">
                  <bold>AutoScore (<italic>m</italic><sup>b</sup>=12)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>0.789 (0.773-0.802)</td>
                <td>12</td>
                <td>130<sup>e</sup></td>
                <td>71.7 (68.5-74.7)</td>
                <td>71.7 (70.7-72.7)</td>
                <td>19.3 (18.4-20.1)</td>
                <td>96.4 (96.0-96.8)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>N/A</td>
                <td>N/A</td>
                <td>95<sup>g</sup></td>
                <td>93.7 (92.0-95.3)</td>
                <td>34.5 (33.4-35.6)</td>
                <td>11.9 (11.6-12.1)</td>
                <td>98.3 (97.8-98.7)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>N/A</td>
                <td>N/A</td>
                <td>180<sup>h</sup></td>
                <td>32.0 (28.8-35.3)</td>
                <td>94.8 (94.3-95.2)</td>
                <td>36.6 (33.4-39.9)</td>
                <td>93.7 (93.4-94.0)</td>
              </tr>
              <tr valign="top">
                <td colspan="8">
                  <bold>Full logistic regression</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>0.778 (0.760-0.795)</td>
                <td>24</td>
                <td>0.085<sup>e</sup></td>
                <td>68.6 (65.4-71.8)</td>
                <td>72.8 (71.8-73.7)</td>
                <td>19.2 (18.3-20.1)</td>
                <td>96.1 (95.7-96.5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>N/A</td>
                <td>N/A</td>
                <td>0.028<sup>g</sup></td>
                <td>95.2 (93.5-96.6)</td>
                <td>25.3 (24.4-26.3)</td>
                <td>10.7 (10.5-10.9)</td>
                <td>98.3 (97.7-98.8)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>N/A</td>
                <td>N/A</td>
                <td>0.24<sup>h</sup></td>
                <td>27.9 (24.5-31.3)</td>
                <td>95.1 (94.7-95.6)</td>
                <td>35.0 (31.7-38.6)</td>
                <td>93.3 (93.0-93.6)</td>
              </tr>
              <tr valign="top">
                <td colspan="8">
                  <bold>Stepwise regression</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>0.778 (0.760-0.795)</td>
                <td>22</td>
                <td>0.096<sup>e</sup></td>
                <td>65.0 (61.6-68.5)</td>
                <td>76.9 (76.0-77.8)</td>
                <td>21.0 (19.9-22.0)</td>
                <td>95.9 (95.5-96.3)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>N/A</td>
                <td>N/A</td>
                <td>0.028<sup>g</sup></td>
                <td>95.1 (93.5-96.5)</td>
                <td>25.0 (24.1-26.1)</td>
                <td>10.7 (10.5-10.9)</td>
                <td>98.2 (97.6-98.7)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>N/A</td>
                <td>N/A</td>
                <td>0.24<sup>h</sup></td>
                <td>28.4 (25.1-31.7)</td>
                <td>95.2 (94.7-95.6)</td>
                <td>35.7 (32.2-39.1)</td>
                <td>93.4 (93.1-93.7)</td>
              </tr>
              <tr valign="top">
                <td colspan="8">
                  <bold>LASSO<sup>i</sup></bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>0.772 (0.755-0.790)</td>
                <td>17</td>
                <td>–2.47<sup>e</sup></td>
                <td>73.4 (70.2-76.4)</td>
                <td>68.1 (67.1-69.2)</td>
                <td>17.8 (17.0-18.6)</td>
                <td>96.4 (96.0-96.8)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>N/A</td>
                <td>N/A</td>
                <td>–3.34<sup>g</sup></td>
                <td>95.2 (93.7-96.5)</td>
                <td>25.1 (24.1-26.1)</td>
                <td>10.7 (10.5-10.9)</td>
                <td>98.2 (97.7-98.7)</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>N/A</td>
                <td>N/A</td>
                <td>–1.27<sup>h</sup></td>
                <td>28.4 (25.2-31.8)</td>
                <td>95.2 (94.7-95.7)</td>
                <td>36.0 (32.6-39.5)</td>
                <td>93.4 (93.1-93.7)</td>
              </tr>
              <tr valign="top">
                <td colspan="8">
                  <bold>Random forest(<italic>m</italic><sup>b</sup>=9)<sup>j</sup></bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>0.785 (0.768-0.801)</td>
                <td>9</td>
                <td>0.085<sup>e</sup></td>
                <td>74.2 (71.1-77.0)</td>
                <td>69.4 (68.4-70.4)</td>
                <td>18.6 (17.8-19.4)</td>
                <td>96.6 (96.2-97.0)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>N/A</td>
                <td>N/A</td>
                <td>0.015<sup>g</sup></td>
                <td>94.2 (92.5-95.7)</td>
                <td>30.1 (29.1-31.1)</td>
                <td>11.3 (11.1-11.5)</td>
                <td>98.2 (97.7-98.7)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>N/A</td>
                <td>N/A</td>
                <td>0.3<sup>h</sup></td>
                <td>30.5 (27.4-34.0)</td>
                <td>94.8 (94.4-95.3)</td>
                <td>35.7 (32.5-39.0)</td>
                <td>93.5 (93.3-93.8)</td>
              </tr>
              <tr valign="top">
                <td colspan="8">
                  <bold>Full random forest</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>0.809 (0.794-0.825)</td>
                <td>24</td>
                <td>0.115<sup>e</sup></td>
                <td>73.1 (69.9-76.2)</td>
                <td>75.4 (74.5-76.3)</td>
                <td>21.9 (20.9-22.9)</td>
                <td>96.8 (96.4-97.1)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>N/A</td>
                <td>N/A</td>
                <td>0.025<sup>g</sup></td>
                <td>94.4 (92.8-95.9)</td>
                <td>37.9 (36.9-38.9)</td>
                <td>12.5 (12.3-12.8)</td>
                <td>98.6 (98.2-99.0)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>N/A</td>
                <td>N/A</td>
                <td>0.285<sup>h</sup></td>
                <td>34.1 (30.6-37.5)</td>
                <td>95.1 (94.6-95.5)</td>
                <td>39.4 (36.2-42.9)</td>
                <td>93.9 (93.6-94.2)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table5fn1">
              <p><sup>a</sup>AUC: the area under the ROC curve.</p>
            </fn>
            <fn id="table5fn2">
              <p><sup>b</sup>Number of variables in the model.</p>
            </fn>
            <fn id="table5fn3">
              <p><sup>c</sup>PPV: positive predictive value.</p>
            </fn>
            <fn id="table5fn4">
              <p><sup>d</sup>NPV: negative predictive value.</p>
            </fn>
            <fn id="table5fn5">
              <p><sup>e</sup>Optimal cutoff values, defined as the points nearest to the upper-left corner of the ROC curves.</p>
            </fn>
            <fn id="table5fn6">
              <p><sup>f</sup>N/A: not applicable.</p>
            </fn>
            <fn id="table5fn7">
              <p><sup>g</sup>Cutoff values by which the sensitivity could reach about 95%.</p>
            </fn>
            <fn id="table5fn8">
              <p><sup>h</sup>Cutoff values by which the specificity could reach about 95%.</p>
            </fn>
            <fn id="table5fn9">
              <p><sup>i</sup>LASSO: least absolute shrinkage and selection operator.</p>
            </fn>
            <fn id="table5fn10">
              <p><sup>j</sup>AutoScore-based variable selection was implemented beforehand, where the same set of variables were selected as the AutoScore (<italic>m</italic>=9).</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>As illustrated in <xref rid="figure5" ref-type="fig">Figure 5</xref>, our nine-variable AutoScore model remained well calibrated, and all parts of the calibration belt showed a good fit under both 80% and 95% CIs. In comparison, other models displayed varying degrees of underestimation or overestimation. Two RF models performed the worst in the calibration test, followed by the stepwise regression and LASSO models. On the contrary, the AutoScore and logistic regression perform relatively well in terms of model calibration.</p>
        <fig id="figure5" position="float">
          <label>Figure 5</label>
          <caption>
            <p>Calibration belts (at 80% and 95% confidence levels) for (a) a nine-variable AutoScore-created model, (b) a 12-variable AutoScore-created model, (c) a full logistic regression model, (d) a stepwise regression model, (e) the LASSO model, (f) a nine-variable random forest model, and (g) a full random forest model.</p>
          </caption>
          <graphic xlink:href="medinform_v8i10e21798_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>In this study, we developed AutoScore, a framework of automatic clinical score creation, and tested it in a large clinical data set. The scoring models generated by AutoScore were comparable with other standard methods (ie, logistic regression, stepwise regression, LASSO, RF model) in terms of predictive performance and model calibration. More importantly, the AutoScore-created scoring models showed superiority in interpretability and accessibility, as they were point-based scores with fewer variables used. In clinical practice, point-based scores have the advantage of easy implementation and, thus, can be widely utilized and validated in different circumstances and health care settings. The novelty of our study was the development of a generic, scalable, and robust methodology for automatically generating a point-based scoring model, which has been demonstrated by deriving an actual scoring model of inpatient mortality with a large benchmark EHR data set.</p>
        <p>The proposed AutoScore has several advantages in creating risk prediction models. First, the machine learning–based variable ranking or selection can efficiently filter out redundant information. The importance of including variable selection in the development of predictive models has been demonstrated in many studies. In a study by Zhao et al [<xref ref-type="bibr" rid="ref31">31</xref>], variable selection removed noninformative variables from the clinical predictive model. Bagherzadeh-Khiabani et al [<xref ref-type="bibr" rid="ref32">32</xref>] demonstrated that the use of variable selection could improve the performance of clinical prediction models. Sanchez-Pinto et al [<xref ref-type="bibr" rid="ref11">11</xref>] also provided evidence of modern tree-based methods of variable selection with better parsimony in large data sets. Liu et al [<xref ref-type="bibr" rid="ref33">33</xref>] demonstrated that machine learning–based variable selection was promising for discovering a few relevant and significant variables in the prediction of adverse cardiac events. Second, the module of variable transformation could improve the fit of models. Several studies [<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref35">35</xref>] have reported U-shaped nonlinearity between continuous variables and health-related outcomes. According to expert opinion, the value of vital signs or laboratory tests is usually considered as an abnormal value if it is beyond a healthy normal range. Besides, the categorization of continuous variables remains to be a dominant practice in epidemiological studies [<xref ref-type="bibr" rid="ref36">36</xref>]. Discretizing features requires a smaller memory footprint, simplifies model interpretation, and can be applied directly by a human expert in routine care [<xref ref-type="bibr" rid="ref37">37</xref>]. In addition, categorization creates a natural way to handle missing values, where the missing values can be treated as an extra category. This missing-indicator method has the appealing property that all available information can be used in the analyses [<xref ref-type="bibr" rid="ref38">38</xref>]. Third, we use a parsimony plot (model performance vs complexity) to determine the appropriate number of variables (<italic>m</italic>), balancing the trade-off between performance and sparsity [<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref40">40</xref>]. We value the model parsimony as the most desirable characteristic, as there is a real-world cost associated with mapping numerous variables, maintaining complex algorithms, and replicating it in different settings. This parsimony-driven parameter tuning process can be performed in an independent validation set (ie, 10% randomly selected samples from the entire data set in this study), as shown in <xref rid="figure3" ref-type="fig">Figure 3</xref>. It also shows a similar trend on the basis of the unseen test set, illustrating the effectiveness and consistency of parsimony-driven tuning for determining the number of necessary variables.</p>
        <p>Furthermore, the scoring models created by the AutoScore framework are interpretable and clinically practical. The output of AutoScore is a point-based scoring model, based on addition, subtraction, and multiplication of a few sparse numbers, facilitating quick stratification without the need for a computing system. Doctors can easily understand how risk models make predictions in a transparent manner. Although numerous machine learning models, such as neural networks [<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref42">42</xref>] and ensemble learning models [<xref ref-type="bibr" rid="ref43">43</xref>,<xref ref-type="bibr" rid="ref44">44</xref>], have been developed to complement traditional regression models, most of them are black boxes that do not explain their predictions in a way that humans can understand. In our study, the nine-variable RF model was performed as accurately as our nine-variable AutoScore (AUC 0.785 vs 0.780). However, it is challenging to explain the prediction made by the RF model, which consists of 100 different decision trees together. The lack of transparency of predictive models could lead to severe consequences in patient care. Vellido [<xref ref-type="bibr" rid="ref12">12</xref>] suggested that these models with low explainability are unlikely to become part of routine clinical and health care practice as providing care is a highly sensitive task. Rudin [<xref ref-type="bibr" rid="ref45">45</xref>] also suggested designing models that are inherently interpretable rather than explaining black box models and doubted the blind belief in the myth of the accuracy-interpretability trade-off.</p>
      </sec>
      <sec>
        <title>Relationship With Previous Work</title>
        <p>Researchers have previously created several scoring models for predicting mortality, such as the Modified Early Warning Score [<xref ref-type="bibr" rid="ref46">46</xref>], the VitalPAC Early Warning Score [<xref ref-type="bibr" rid="ref47">47</xref>], and the Acute Physiology And Chronic Health Evaluation [<xref ref-type="bibr" rid="ref48">48</xref>], mainly utilizing vital signs to predict mortality for hospitalized patients. However, they were designed by hand subjectively from expert opinions and domain knowledge, which hindered their generalization and dynamic evolution. Considering the disparate EHR systems among various health care settings, these scoring models may not work well because of the diversity among routinely collected information. As the characteristics of the population evolve, the adjustment and updating of risk scores are needed, which are time-consuming and inflexible [<xref ref-type="bibr" rid="ref49">49</xref>]. In contrast, our AutoScore framework is adaptive and flexible; it can generate scoring models automatically, given an evolving EHR system. A user-friendly and easy-to-use R package of AutoScore [<xref ref-type="bibr" rid="ref22">22</xref>] has been developed to facilitate the creation of scoring systems in diverse contexts, satisfying the increasing need for the development of specific predictive scores in various health care settings.</p>
        <p>Similar to our AutoScore framework, Zhang et al [<xref ref-type="bibr" rid="ref50">50</xref>] presented a tutorial on building a scoring system from several steps. However, the tutorial did not integrate some vital components such as variable ranking or selection and several crucial tuning processes inherently into the process of score generation. In comparison, our AutoScore framework includes all essential modules, driving the clinical continuum of 6 modules and realizing the automation. Although users may benefit from the built-in automation of AutoScore for developing a clinical score, domain knowledge is equally important in building the scoring models, as suggested in many studies [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref51">51</xref>]. In AutoScore, domain knowledge can be involved in 2 ways: (1) the variable can be preselected by expert opinion before implementing the AutoScore and (2) domain knowledge can be used to fine-tune the risk scores and determine clinically valid cutoff values in variable transformation.</p>
      </sec>
      <sec>
        <title>Future Research and Limitations</title>
        <p>Although the proposed AutoScore framework is comprehensively and systematically presented, improvements can still be made. Each module of the AutoScore can be improved using advanced algorithms and enhanced methodologies. For example, in the module of variable ranking, various established machine learning methods can potentially be integrated into the AutoScore framework. In variable transformation, the means of categorization may be customized according to its distribution, provided a handful of clinical variables such as SpO<sub>2</sub> that may not be subject to a near-normal distribution. Furthermore, the application of AutoScore is not limited to its application to large-scale EHR data [<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref52">52</xref>]. AutoScore can be readily implemented in small-scale observational cohort studies. Beyond health care applications, AutoScore is potentially applicable to other high-stakes prediction applications such as criminal justice and finance, where highly interpretable predictive models are needed.</p>
        <p>This study has several limitations. First, the data set used in this study was on the basis of EHR data with routinely collected vital and laboratory test variables. Some relevant variables were not available in this analysis. For example, health utilization, such as intubation and resuscitation, has been proven to be predictive of overall mortality. Second, given the limitation in data availability, the clinical scores built with AutoScore in this study are not perfect for real-world implementation. This clinical study was primarily designed to demonstrate the effectiveness of the AutoScore framework in building risk scores. Third, this was a retrospective analysis. To further prove its clinical practicability, prospective validation of the scoring model is needed. Finally, this was the initial development of AutoScore, where only selected methods were integrated into the framework, leaving opportunities for further development with more sophisticated and state-of-the-art algorithms.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>We developed an easy-to-use, machine learning–based automatic clinical score generator, AutoScore, to conveniently build scoring models and demonstrated its usability with a clinical study on mortality prediction. Using a benchmark data set, we showed that the scoring models derived with the AutoScore framework achieved satisfactory predictive performance and proved its superiority over several conventional methods for risk model development. The AutoScore framework integrates both the advantage of machine learning in strong discriminative power and the merit of point-based scores in its excellent accessibility and interpretability. Our proposed AutoScore framework can be readily used to generate clinical scores in various medical applications, such as early warning systems and risk predictions of mortality, hospital readmissions, and adverse cardiac events. In the future, advanced machine learning algorithms and methodologies could improve individual modules of AutoScore and provide AutoScore with more robust predictive capability or broader applicability in various types of data.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>AutoScore R package (version 0.1).</p>
        <media xlink:href="medinform_v8i10e21798_app1.zip" xlink:title="ZIP File  (Zip Archive), 943 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>AutoScore R package (version 0.1) source codes.</p>
        <media xlink:href="medinform_v8i10e21798_app2.zip" xlink:title="ZIP File  (Zip Archive), 687 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AIC</term>
          <def>
            <p>Akaike information criterion</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">AUC</term>
          <def>
            <p>area under the curve</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">BIDMC</term>
          <def>
            <p>Beth Israel Deaconess Medical Center</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">BUN</term>
          <def>
            <p>blood urea nitrogen</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">CCU</term>
          <def>
            <p>coronary care unit</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">CSRU</term>
          <def>
            <p>cardiac surgery recovery unit</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">EHR</term>
          <def>
            <p>electronic health record</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">ICU</term>
          <def>
            <p>intensive care unit</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">LASSO</term>
          <def>
            <p>least absolute shrinkage and selection operator</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">MAP</term>
          <def>
            <p>mean arterial pressure</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">MICU</term>
          <def>
            <p>medical intensive care unit</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb12">NPV</term>
          <def>
            <p>negative predictive value</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb13">PPV</term>
          <def>
            <p>positive predictive value</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb14">RF</term>
          <def>
            <p>random forest</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb15">ROC</term>
          <def>
            <p>receiver operating characteristic</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb16">SICU</term>
          <def>
            <p>surgical intensive care unit</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb17">TSICU</term>
          <def>
            <p>trauma surgical intensive care unit</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This study was supported by the Singapore National Medical Research Council under the PULSES Center Grant.</p>
    </ack>
    <fn-group>
      <fn fn-type="con">
        <p>NL conceived and supervised the study. FX and NL developed the AutoScore algorithm and wrote the first draft of the manuscript. FX analyzed the data. FX, BC, MO, BG, and NL made substantial contributions to the interpretation of results, algorithm improvement, and critical revision of the manuscript. All authors have read and approved the final manuscript.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Chiovaro</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>O'Neil</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kansagara</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Quiñones</surname>
              <given-names>AR</given-names>
            </name>
            <name name-style="western">
              <surname>Freeman</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Motu'apuaka</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Slatore</surname>
              <given-names>CG</given-names>
            </name>
          </person-group>
          <article-title>Early warning system scores for clinical deterioration in hospitalized patients: a systematic review</article-title>
          <source>Ann Am Thorac Soc</source>
          <year>2014</year>
          <month>11</month>
          <volume>11</volume>
          <issue>9</issue>
          <fpage>1454</fpage>
          <lpage>65</lpage>
          <pub-id pub-id-type="doi">10.1513/AnnalsATS.201403-102OC</pub-id>
          <pub-id pub-id-type="medline">25296111</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>GB</given-names>
            </name>
            <name name-style="western">
              <surname>Prytherch</surname>
              <given-names>DR</given-names>
            </name>
            <name name-style="western">
              <surname>Meredith</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Schmidt</surname>
              <given-names>PE</given-names>
            </name>
            <name name-style="western">
              <surname>Featherstone</surname>
              <given-names>PI</given-names>
            </name>
          </person-group>
          <article-title>The ability of the national early warning score (NEWS) to discriminate patients at risk of early cardiac arrest, unanticipated intensive care unit admission, and death</article-title>
          <source>Resuscitation</source>
          <year>2013</year>
          <month>04</month>
          <volume>84</volume>
          <issue>4</issue>
          <fpage>465</fpage>
          <lpage>70</lpage>
          <pub-id pub-id-type="doi">10.1016/j.resuscitation.2012.12.016</pub-id>
          <pub-id pub-id-type="medline">23295778</pub-id>
          <pub-id pub-id-type="pii">S0300-9572(13)00002-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Brady</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>de Souza</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>The HEART score: a guide to its application in the emergency department</article-title>
          <source>Turk J Emerg Med</source>
          <year>2018</year>
          <month>06</month>
          <volume>18</volume>
          <issue>2</issue>
          <fpage>47</fpage>
          <lpage>51</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2452-2473(18)30111-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.tjem.2018.04.004</pub-id>
          <pub-id pub-id-type="medline">29922729</pub-id>
          <pub-id pub-id-type="pii">S2452-2473(18)30111-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC6005932</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Churpek</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Yuen</surname>
              <given-names>TC</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>SY</given-names>
            </name>
            <name name-style="western">
              <surname>Meltzer</surname>
              <given-names>DO</given-names>
            </name>
            <name name-style="western">
              <surname>Hall</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Edelson</surname>
              <given-names>DP</given-names>
            </name>
          </person-group>
          <article-title>Derivation of a cardiac arrest prediction model using ward vital signs</article-title>
          <source>Crit Care Med</source>
          <year>2012</year>
          <month>07</month>
          <volume>40</volume>
          <issue>7</issue>
          <fpage>2102</fpage>
          <lpage>8</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/22584764"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/CCM.0b013e318250aa5a</pub-id>
          <pub-id pub-id-type="medline">22584764</pub-id>
          <pub-id pub-id-type="pmcid">PMC3378796</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vincent</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Moreno</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Takala</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Willatts</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>De Mendonça</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bruining</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Reinhart</surname>
              <given-names>CK</given-names>
            </name>
            <name name-style="western">
              <surname>Suter</surname>
              <given-names>PM</given-names>
            </name>
            <name name-style="western">
              <surname>Thijs</surname>
              <given-names>LG</given-names>
            </name>
          </person-group>
          <article-title>The SOFA (sepsis-related organ failure assessment) score to describe organ dysfunction/failure</article-title>
          <source>Intensive Care Med</source>
          <year>1996</year>
          <month>07</month>
          <volume>22</volume>
          <issue>7</issue>
          <fpage>707</fpage>
          <lpage>10</lpage>
          <pub-id pub-id-type="doi">10.1007/BF01709751</pub-id>
          <pub-id pub-id-type="medline">8844239</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>NEWSDIG: The national early warning score development and implementation group</article-title>
          <source>Clin Med (Lond)</source>
          <year>2012</year>
          <month>12</month>
          <volume>12</volume>
          <issue>6</issue>
          <fpage>501</fpage>
          <lpage>3</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/23342400"/>
          </comment>
          <pub-id pub-id-type="doi">10.7861/clinmedicine.12-6-501</pub-id>
          <pub-id pub-id-type="medline">23342400</pub-id>
          <pub-id pub-id-type="pmcid">PMC5922584</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Six</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Backus</surname>
              <given-names>BE</given-names>
            </name>
            <name name-style="western">
              <surname>Kelder</surname>
              <given-names>JC</given-names>
            </name>
          </person-group>
          <article-title>Chest pain in the emergency room: value of the HEART score</article-title>
          <source>Neth Heart J</source>
          <year>2008</year>
          <month>06</month>
          <volume>16</volume>
          <issue>6</issue>
          <fpage>191</fpage>
          <lpage>6</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/18665203"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/BF03086144</pub-id>
          <pub-id pub-id-type="medline">18665203</pub-id>
          <pub-id pub-id-type="pmcid">PMC2442661</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Charlson</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Pompei</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Ales</surname>
              <given-names>KL</given-names>
            </name>
            <name name-style="western">
              <surname>MacKenzie</surname>
              <given-names>CR</given-names>
            </name>
          </person-group>
          <article-title>A new method of classifying prognostic comorbidity in longitudinal studies: development and validation</article-title>
          <source>J Chronic Dis</source>
          <year>1987</year>
          <volume>40</volume>
          <issue>5</issue>
          <fpage>373</fpage>
          <lpage>83</lpage>
          <pub-id pub-id-type="doi">10.1016/0021-9681(87)90171-8</pub-id>
          <pub-id pub-id-type="medline">3558716</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Goldstein</surname>
              <given-names>BA</given-names>
            </name>
            <name name-style="western">
              <surname>Navar</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Pencina</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Ioannidis</surname>
              <given-names>JP</given-names>
            </name>
          </person-group>
          <article-title>Opportunities and challenges in developing risk prediction models with electronic health records data: a systematic review</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2017</year>
          <month>01</month>
          <volume>24</volume>
          <issue>1</issue>
          <fpage>198</fpage>
          <lpage>208</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/27189013"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocw042</pub-id>
          <pub-id pub-id-type="medline">27189013</pub-id>
          <pub-id pub-id-type="pii">ocw042</pub-id>
          <pub-id pub-id-type="pmcid">PMC5201180</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Heinze</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Wallisch</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Dunkler</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Variable selection - a review and recommendations for the practicing statistician</article-title>
          <source>Biom J</source>
          <year>2018</year>
          <month>05</month>
          <volume>60</volume>
          <issue>3</issue>
          <fpage>431</fpage>
          <lpage>49</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29292533"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/bimj.201700067</pub-id>
          <pub-id pub-id-type="medline">29292533</pub-id>
          <pub-id pub-id-type="pmcid">PMC5969114</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sanchez-Pinto</surname>
              <given-names>LN</given-names>
            </name>
            <name name-style="western">
              <surname>Venable</surname>
              <given-names>LR</given-names>
            </name>
            <name name-style="western">
              <surname>Fahrenbach</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Churpek</surname>
              <given-names>MM</given-names>
            </name>
          </person-group>
          <article-title>Comparison of variable selection methods for clinical predictive modeling</article-title>
          <source>Int J Med Inform</source>
          <year>2018</year>
          <month>08</month>
          <volume>116</volume>
          <fpage>10</fpage>
          <lpage>7</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29887230"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2018.05.006</pub-id>
          <pub-id pub-id-type="medline">29887230</pub-id>
          <pub-id pub-id-type="pii">S1386-5056(18)30581-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC6003624</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vellido</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>The importance of interpretability and visualization in machine learning for applications in medicine and health care</article-title>
          <source>Neural Comput Applic</source>
          <year>2019</year>
          <month>02</month>
          <day>4</day>
          <fpage>-</fpage>
          <comment>epub ahead of print</comment>
          <pub-id pub-id-type="doi">10.1007/s00521-019-04051-w</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>O'Brien</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Goldstein</surname>
              <given-names>BA</given-names>
            </name>
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Phelan</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lambert</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Bedoya</surname>
              <given-names>AD</given-names>
            </name>
            <name name-style="western">
              <surname>Steorts</surname>
              <given-names>RC</given-names>
            </name>
          </person-group>
          <article-title>Development, implementation, and evaluation of an in-hospital optimized early warning score for patient deterioration</article-title>
          <source>MDM Policy Pract</source>
          <year>2020</year>
          <volume>5</volume>
          <issue>1</issue>
          <fpage>2381468319899663</fpage>
          <pub-id pub-id-type="doi">10.1177/2381468319899663</pub-id>
          <pub-id pub-id-type="medline">31976373</pub-id>
          <pub-id pub-id-type="pii">10.1177_2381468319899663</pub-id>
          <pub-id pub-id-type="pmcid">PMC6956604</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Low</surname>
              <given-names>LL</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>KH</given-names>
            </name>
            <name name-style="western">
              <surname>Ong</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Jing</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Thumboo</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>FAM-FACE-SG: a score for risk stratification of frequent hospital admitters</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2017</year>
          <month>04</month>
          <day>8</day>
          <volume>17</volume>
          <issue>1</issue>
          <fpage>35</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/s12911-017-0441-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12911-017-0441-5</pub-id>
          <pub-id pub-id-type="medline">28390405</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12911-017-0441-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC5385059</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sullivan</surname>
              <given-names>LM</given-names>
            </name>
            <name name-style="western">
              <surname>Massaro</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>D'Agostino</surname>
              <given-names>RB</given-names>
            </name>
          </person-group>
          <article-title>Presentation of multivariate data for clinical use: the Framingham study risk score functions</article-title>
          <source>Stat Med</source>
          <year>2004</year>
          <month>05</month>
          <day>30</day>
          <volume>23</volume>
          <issue>10</issue>
          <fpage>1631</fpage>
          <lpage>60</lpage>
          <pub-id pub-id-type="doi">10.1002/sim.1742</pub-id>
          <pub-id pub-id-type="medline">15122742</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tin</surname>
              <given-names>KH</given-names>
            </name>
          </person-group>
          <article-title>Random Decision Forests</article-title>
          <year>1995</year>
          <conf-name>International Conference on Document Analysis and Recognition</conf-name>
          <conf-date>August 14-16, 1995</conf-date>
          <conf-loc>Montreal, Quebec, Canada</conf-loc>
          <pub-id pub-id-type="doi">10.1109/icdar.1995.598994</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Flaxman</surname>
              <given-names>AD</given-names>
            </name>
            <name name-style="western">
              <surname>Vahdatpour</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Green</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>James</surname>
              <given-names>SL</given-names>
            </name>
            <name name-style="western">
              <surname>Murray</surname>
              <given-names>CJ</given-names>
            </name>
            <collab>Population Health Metrics Research Consortium (PHMRC)</collab>
          </person-group>
          <article-title>Random forests for verbal autopsy analysis: multisite validation study using clinical diagnostic gold standards</article-title>
          <source>Popul Health Metr</source>
          <year>2011</year>
          <month>08</month>
          <day>4</day>
          <volume>9</volume>
          <fpage>29</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://pophealthmetrics.biomedcentral.com/articles/10.1186/1478-7954-9-29"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1478-7954-9-29</pub-id>
          <pub-id pub-id-type="medline">21816105</pub-id>
          <pub-id pub-id-type="pii">1478-7954-9-29</pub-id>
          <pub-id pub-id-type="pmcid">PMC3160922</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Breiman</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Friedman</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Stone</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Olshen</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <source>Classification and Regression Trees</source>
          <year>1984</year>
          <publisher-loc>New York, USA</publisher-loc>
          <publisher-name>Taylor &#38; Francis</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Biau</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Analysis of a random forests model</article-title>
          <source>J Mach Learn Res</source>
          <year>2012</year>
          <volume>13</volume>
          <fpage>1063</fpage>
          <lpage>95</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Genuer</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Poggi</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Tuleau-Malot</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Variable selection using random forests</article-title>
          <source>Pattern Recogn Letters</source>
          <year>2010</year>
          <month>10</month>
          <volume>31</volume>
          <issue>14</issue>
          <fpage>2225</fpage>
          <lpage>36</lpage>
          <pub-id pub-id-type="doi">10.1016/j.patrec.2010.03.014</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Louppe</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Wehenkel</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Sutera</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Geurts</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Understanding Variable Importances in Forests of Randomized Trees</article-title>
          <source>Advances in Neural Information Processing Systems</source>
          <year>2013</year>
          <conf-name>NIPS'13</conf-name>
          <conf-date>December 5-10, 2013</conf-date>
          <conf-loc>Lake Tahoe, Nevada</conf-loc>
          <fpage>431</fpage>
          <lpage>9</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="web">
          <article-title>AutoScore: A Machine Learning-Based Automatic Clinical Score Generator</article-title>
          <source>GitHub</source>
          <access-date>2020-09-28</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/nliulab/AutoScore">https://github.com/nliulab/AutoScore</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>AE</given-names>
            </name>
            <name name-style="western">
              <surname>Pollard</surname>
              <given-names>TJ</given-names>
            </name>
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Lehman</surname>
              <given-names>LH</given-names>
            </name>
            <name name-style="western">
              <surname>Feng</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ghassemi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Moody</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Szolovits</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Celi</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Mark</surname>
              <given-names>RG</given-names>
            </name>
          </person-group>
          <article-title>MIMIC-III, a freely accessible critical care database</article-title>
          <source>Sci Data</source>
          <year>2016</year>
          <month>05</month>
          <day>24</day>
          <volume>3</volume>
          <fpage>160035</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/27219127"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/sdata.2016.35</pub-id>
          <pub-id pub-id-type="medline">27219127</pub-id>
          <pub-id pub-id-type="pii">sdata201635</pub-id>
          <pub-id pub-id-type="pmcid">PMC4878278</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>SX</given-names>
            </name>
            <name name-style="western">
              <surname>Ang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Low</surname>
              <given-names>LL</given-names>
            </name>
            <name name-style="western">
              <surname>Ho</surname>
              <given-names>AF</given-names>
            </name>
            <name name-style="western">
              <surname>Lam</surname>
              <given-names>SS</given-names>
            </name>
            <name name-style="western">
              <surname>Matchar</surname>
              <given-names>DB</given-names>
            </name>
            <name name-style="western">
              <surname>Ong</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Chakraborty</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Novel model for predicting inpatient mortality after emergency admission to hospital in Singapore: retrospective observational study</article-title>
          <source>BMJ Open</source>
          <year>2019</year>
          <month>09</month>
          <day>26</day>
          <volume>9</volume>
          <issue>9</issue>
          <fpage>e031382</fpage>
          <pub-id pub-id-type="doi">10.1136/bmjopen-2019-031382</pub-id>
          <pub-id pub-id-type="medline">31558458</pub-id>
          <pub-id pub-id-type="pii">bmjopen-2019-031382</pub-id>
          <pub-id pub-id-type="pmcid">PMC6773418</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Redfern</surname>
              <given-names>OC</given-names>
            </name>
            <name name-style="western">
              <surname>Pimentel</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Prytherch</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Meredith</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Clifton</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Tarassenko</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>GB</given-names>
            </name>
            <name name-style="western">
              <surname>Watkinson</surname>
              <given-names>PJ</given-names>
            </name>
          </person-group>
          <article-title>Predicting in-hospital mortality and unanticipated admissions to the intensive care unit using routinely collected blood tests and vital signs: development and validation of a multivariable model</article-title>
          <source>Resuscitation</source>
          <year>2018</year>
          <month>12</month>
          <volume>133</volume>
          <fpage>75</fpage>
          <lpage>81</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0300-9572(18)30909-2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.resuscitation.2018.09.021</pub-id>
          <pub-id pub-id-type="medline">30253229</pub-id>
          <pub-id pub-id-type="pii">S0300-9572(18)30909-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC6562198</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>James</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Witten</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Hastie</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Tibshirani</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <source>An Introduction to Statistical Learning: with Applications in R</source>
          <year>2013</year>
          <publisher-loc>New York, USA</publisher-loc>
          <publisher-name>Springer New York</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tibshirani</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Regression shrinkage and selection via the lasso</article-title>
          <source>J R Stat Soc Series B Stat Methodol</source>
          <year>2018</year>
          <month>12</month>
          <day>5</day>
          <volume>58</volume>
          <issue>1</issue>
          <fpage>267</fpage>
          <lpage>88</lpage>
          <pub-id pub-id-type="doi">10.1111/j.2517-6161.1996.tb02080.x</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Oshiro</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Perez</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Baranauskas</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>How Many Trees in a Random Forest?</article-title>
          <source>Machine Learning and Data Mining in Pattern Recognition</source>
          <year>2012</year>
          <volume>Berlin, Heidelberg</volume>
          <fpage>154</fpage>
          <lpage>168</lpage>
          <pub-id pub-id-type="doi">10.1007/978-3-642-31537-4_13</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Probst</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>To tune or not to tune the number of trees in random forest</article-title>
          <source>The Journal of Machine Learning Research</source>
          <year>2017</year>
          <volume>18</volume>
          <issue>1</issue>
          <fpage>6673</fpage>
          <lpage>6690</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nattino</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Finazzi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bertolini</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>A new test and graphical tool to assess the goodness of fit of logistic regression models</article-title>
          <source>Stat Med</source>
          <year>2016</year>
          <month>02</month>
          <day>28</day>
          <volume>35</volume>
          <issue>5</issue>
          <fpage>709</fpage>
          <lpage>20</lpage>
          <pub-id pub-id-type="doi">10.1002/sim.6744</pub-id>
          <pub-id pub-id-type="medline">26439593</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Henriksson</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Asker</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Boström</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Predictive modeling of structured electronic health records for adverse drug event detection</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2015</year>
          <volume>15</volume>
          <issue>Suppl 4</issue>
          <fpage>S1</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/1472-6947-15-S4-S1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1472-6947-15-S4-S1</pub-id>
          <pub-id pub-id-type="medline">26606038</pub-id>
          <pub-id pub-id-type="pii">1472-6947-15-S4-S1</pub-id>
          <pub-id pub-id-type="pmcid">PMC4660129</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bagherzadeh-Khiabani</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Ramezankhani</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Azizi</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Hadaegh</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Steyerberg</surname>
              <given-names>EW</given-names>
            </name>
            <name name-style="western">
              <surname>Khalili</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>A tutorial on variable selection for clinical prediction models: feature selection methods in data mining could improve the results</article-title>
          <source>J Clin Epidemiol</source>
          <year>2016</year>
          <month>03</month>
          <volume>71</volume>
          <fpage>76</fpage>
          <lpage>85</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jclinepi.2015.10.002</pub-id>
          <pub-id pub-id-type="medline">26475568</pub-id>
          <pub-id pub-id-type="pii">S0895-4356(15)00466-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Koh</surname>
              <given-names>ZX</given-names>
            </name>
            <name name-style="western">
              <surname>Goh</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Haaland</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Ting</surname>
              <given-names>BP</given-names>
            </name>
            <name name-style="western">
              <surname>Ong</surname>
              <given-names>ME</given-names>
            </name>
          </person-group>
          <article-title>Prediction of adverse cardiac events in emergency department patients with chest pain using machine learning for variable selection</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2014</year>
          <month>08</month>
          <day>23</day>
          <volume>14</volume>
          <fpage>75</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/1472-6947-14-75"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1472-6947-14-75</pub-id>
          <pub-id pub-id-type="medline">25150702</pub-id>
          <pub-id pub-id-type="pii">1472-6947-14-75</pub-id>
          <pub-id pub-id-type="pmcid">PMC4150554</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Salonia</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Abdollah</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Capitanio</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Suardi</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Briganti</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gallina</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Colombo</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Ferrari</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Castagna</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Rigatti</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Montorsi</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Serum sex steroids depict a nonlinear u-shaped association with high-risk prostate cancer at radical prostatectomy</article-title>
          <source>Clin Cancer Res</source>
          <year>2012</year>
          <month>07</month>
          <day>1</day>
          <volume>18</volume>
          <issue>13</issue>
          <fpage>3648</fpage>
          <lpage>57</lpage>
          <pub-id pub-id-type="doi">10.1158/1078-0432.CCR-11-2799</pub-id>
          <pub-id pub-id-type="medline">22589393</pub-id>
          <pub-id pub-id-type="pii">1078-0432.CCR-11-2799</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Mahara</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>A novel approach to determine two optimal cut-points of a continuous predictor with a U-shaped relationship to hazard ratio in survival data: simulation and application</article-title>
          <source>BMC Med Res Methodol</source>
          <year>2019</year>
          <month>05</month>
          <day>9</day>
          <volume>19</volume>
          <issue>1</issue>
          <fpage>96</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedresmethodol.biomedcentral.com/articles/10.1186/s12874-019-0738-4"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12874-019-0738-4</pub-id>
          <pub-id pub-id-type="medline">31072334</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12874-019-0738-4</pub-id>
          <pub-id pub-id-type="pmcid">PMC6507062</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mabikwa</surname>
              <given-names>OV</given-names>
            </name>
            <name name-style="western">
              <surname>Greenwood</surname>
              <given-names>DC</given-names>
            </name>
            <name name-style="western">
              <surname>Baxter</surname>
              <given-names>PD</given-names>
            </name>
            <name name-style="western">
              <surname>Fleming</surname>
              <given-names>SJ</given-names>
            </name>
          </person-group>
          <article-title>Assessing the reporting of categorised quantitative variables in observational epidemiological studies</article-title>
          <source>BMC Health Serv Res</source>
          <year>2017</year>
          <month>03</month>
          <day>14</day>
          <volume>17</volume>
          <issue>1</issue>
          <fpage>201</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmchealthservres.biomedcentral.com/articles/10.1186/s12913-017-2137-z"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12913-017-2137-z</pub-id>
          <pub-id pub-id-type="medline">28288628</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12913-017-2137-z</pub-id>
          <pub-id pub-id-type="pmcid">PMC5348776</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schellingerhout</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Heymans</surname>
              <given-names>MW</given-names>
            </name>
            <name name-style="western">
              <surname>de Vet</surname>
              <given-names>HC</given-names>
            </name>
            <name name-style="western">
              <surname>Koes</surname>
              <given-names>BW</given-names>
            </name>
            <name name-style="western">
              <surname>Verhagen</surname>
              <given-names>AP</given-names>
            </name>
          </person-group>
          <article-title>Categorizing continuous variables resulted in different predictors in a prognostic model for nonspecific neck pain</article-title>
          <source>J Clin Epidemiol</source>
          <year>2009</year>
          <month>08</month>
          <volume>62</volume>
          <issue>8</issue>
          <fpage>868</fpage>
          <lpage>74</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jclinepi.2008.10.010</pub-id>
          <pub-id pub-id-type="medline">19230604</pub-id>
          <pub-id pub-id-type="pii">S0895-4356(08)00322-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Donders</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>van der Heijden</surname>
              <given-names>GJ</given-names>
            </name>
            <name name-style="western">
              <surname>Stijnen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Moons</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Review: a gentle introduction to imputation of missing values</article-title>
          <source>J Clin Epidemiol</source>
          <year>2006</year>
          <month>10</month>
          <volume>59</volume>
          <issue>10</issue>
          <fpage>1087</fpage>
          <lpage>91</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jclinepi.2006.01.014</pub-id>
          <pub-id pub-id-type="medline">16980149</pub-id>
          <pub-id pub-id-type="pii">S0895-4356(06)00197-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Murtaugh</surname>
              <given-names>PA</given-names>
            </name>
          </person-group>
          <article-title>Methods of variable selection in regression modeling</article-title>
          <source>Commun Stat - Simul Comput</source>
          <year>2010</year>
          <month>12</month>
          <day>23</day>
          <volume>27</volume>
          <issue>3</issue>
          <fpage>711</fpage>
          <lpage>34</lpage>
          <pub-id pub-id-type="doi">10.1080/03610919808813505</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Austin</surname>
              <given-names>PC</given-names>
            </name>
            <name name-style="western">
              <surname>Tu</surname>
              <given-names>JV</given-names>
            </name>
          </person-group>
          <article-title>Bootstrap methods for developing predictive models</article-title>
          <source>Am Stat</source>
          <year>2004</year>
          <month>05</month>
          <volume>58</volume>
          <issue>2</issue>
          <fpage>131</fpage>
          <lpage>7</lpage>
          <pub-id pub-id-type="doi">10.1198/0003130043277</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rajkomar</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Oren</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Dai</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Hajaj</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Hardt</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Marcus</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Sundberg</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Yee</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Flores</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Duggan</surname>
              <given-names>GE</given-names>
            </name>
            <name name-style="western">
              <surname>Irvine</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Le</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Litsch</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Mossin</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Tansuwan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Wexler</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wilson</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ludwig</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Volchenboum</surname>
              <given-names>SL</given-names>
            </name>
            <name name-style="western">
              <surname>Chou</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Pearson</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Madabushi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>NH</given-names>
            </name>
            <name name-style="western">
              <surname>Butte</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Howell</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Cui</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Corrado</surname>
              <given-names>GS</given-names>
            </name>
            <name name-style="western">
              <surname>Dean</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Scalable and accurate deep learning with electronic health records</article-title>
          <source>NPJ Digit Med</source>
          <year>2018</year>
          <volume>1</volume>
          <fpage>18</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/31304302"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41746-018-0029-1</pub-id>
          <pub-id pub-id-type="medline">31304302</pub-id>
          <pub-id pub-id-type="pii">29</pub-id>
          <pub-id pub-id-type="pmcid">PMC6550175</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Thorsen-Meyer</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Nielsen</surname>
              <given-names>AB</given-names>
            </name>
            <name name-style="western">
              <surname>Nielsen</surname>
              <given-names>AP</given-names>
            </name>
            <name name-style="western">
              <surname>Kaas-Hansen</surname>
              <given-names>BS</given-names>
            </name>
            <name name-style="western">
              <surname>Toft</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Schierbeck</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Strøm</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Chmura</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Heimann</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Dybdahl</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Spangsege</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Hulsen</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Belling</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Brunak</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Perner</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Dynamic and explainable machine learning prediction of mortality in patients in the intensive care unit: a retrospective study of high-frequency data in electronic patient records</article-title>
          <source>Lancet Digit Health</source>
          <year>2020</year>
          <month>04</month>
          <volume>2</volume>
          <issue>4</issue>
          <fpage>e179</fpage>
          <lpage>91</lpage>
          <pub-id pub-id-type="doi">10.1016/s2589-7500(20)30018-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Klug</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Barash</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Bechler</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Resheff</surname>
              <given-names>YS</given-names>
            </name>
            <name name-style="western">
              <surname>Tron</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ironi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Soffer</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zimlichman</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Klang</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>A gradient boosting machine learning model for predicting early mortality in the emergency department triage: devising a nine-point triage score</article-title>
          <source>J Gen Intern Med</source>
          <year>2020</year>
          <month>01</month>
          <volume>35</volume>
          <issue>1</issue>
          <fpage>220</fpage>
          <lpage>7</lpage>
          <pub-id pub-id-type="doi">10.1007/s11606-019-05512-7</pub-id>
          <pub-id pub-id-type="medline">31677104</pub-id>
          <pub-id pub-id-type="pii">10.1007/s11606-019-05512-7</pub-id>
          <pub-id pub-id-type="pmcid">PMC6957629</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Spangler</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Hermansson</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Smekal</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Blomberg</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>A validation of machine learning-based risk scores in the prehospital setting</article-title>
          <source>PLoS One</source>
          <year>2019</year>
          <volume>14</volume>
          <issue>12</issue>
          <fpage>e0226518</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0226518"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0226518</pub-id>
          <pub-id pub-id-type="medline">31834920</pub-id>
          <pub-id pub-id-type="pii">PONE-D-19-25317</pub-id>
          <pub-id pub-id-type="pmcid">PMC6910679</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rudin</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Stop explaining black box machine learning models for high stakes decisions and use interpretable models instead</article-title>
          <source>Nat Mach Intell</source>
          <year>2019</year>
          <month>05</month>
          <day>13</day>
          <volume>1</volume>
          <issue>5</issue>
          <fpage>206</fpage>
          <lpage>15</lpage>
          <pub-id pub-id-type="doi">10.1038/s42256-019-0048-x</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Subbe</surname>
              <given-names>CP</given-names>
            </name>
            <name name-style="western">
              <surname>Kruger</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Rutherford</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Gemmel</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Validation of a modified early warning score in medical admissions</article-title>
          <source>QJM</source>
          <year>2001</year>
          <month>10</month>
          <volume>94</volume>
          <issue>10</issue>
          <fpage>521</fpage>
          <lpage>6</lpage>
          <pub-id pub-id-type="doi">10.1093/qjmed/94.10.521</pub-id>
          <pub-id pub-id-type="medline">11588210</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Prytherch</surname>
              <given-names>DR</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>GB</given-names>
            </name>
            <name name-style="western">
              <surname>Schmidt</surname>
              <given-names>PE</given-names>
            </name>
            <name name-style="western">
              <surname>Featherstone</surname>
              <given-names>PI</given-names>
            </name>
          </person-group>
          <article-title>ViEWS--towards a national early warning score for detecting adult inpatient deterioration</article-title>
          <source>Resuscitation</source>
          <year>2010</year>
          <month>08</month>
          <volume>81</volume>
          <issue>8</issue>
          <fpage>932</fpage>
          <lpage>7</lpage>
          <pub-id pub-id-type="doi">10.1016/j.resuscitation.2010.04.014</pub-id>
          <pub-id pub-id-type="medline">20637974</pub-id>
          <pub-id pub-id-type="pii">S0300-9572(10)00242-X</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zimmerman</surname>
              <given-names>JE</given-names>
            </name>
            <name name-style="western">
              <surname>Kramer</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>McNair</surname>
              <given-names>DS</given-names>
            </name>
            <name name-style="western">
              <surname>Malila</surname>
              <given-names>FM</given-names>
            </name>
          </person-group>
          <article-title>Acute physiology and chronic health evaluation (APACHE) IV: hospital mortality assessment for today's critically ill patients</article-title>
          <source>Crit Care Med</source>
          <year>2006</year>
          <month>05</month>
          <volume>34</volume>
          <issue>5</issue>
          <fpage>1297</fpage>
          <lpage>310</lpage>
          <pub-id pub-id-type="doi">10.1097/01.CCM.0000215112.84523.F0</pub-id>
          <pub-id pub-id-type="medline">16540951</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hendriksen</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Geersing</surname>
              <given-names>GJ</given-names>
            </name>
            <name name-style="western">
              <surname>Moons</surname>
              <given-names>KG</given-names>
            </name>
            <name name-style="western">
              <surname>de Groot</surname>
              <given-names>JA</given-names>
            </name>
          </person-group>
          <article-title>Diagnostic and prognostic prediction models</article-title>
          <source>J Thromb Haemost</source>
          <year>2013</year>
          <month>06</month>
          <volume>11</volume>
          <issue>Suppl 1</issue>
          <fpage>129</fpage>
          <lpage>41</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1111/jth.12262"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/jth.12262</pub-id>
          <pub-id pub-id-type="medline">23809117</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Khanal</surname>
              <given-names>MK</given-names>
            </name>
          </person-group>
          <article-title>Development of scoring system for risk stratification in clinical medicine: a step-by-step tutorial</article-title>
          <source>Ann Transl Med</source>
          <year>2017</year>
          <month>11</month>
          <volume>5</volume>
          <issue>21</issue>
          <fpage>436</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.21037/atm.2017.08.22"/>
          </comment>
          <pub-id pub-id-type="doi">10.21037/atm.2017.08.22</pub-id>
          <pub-id pub-id-type="medline">29201888</pub-id>
          <pub-id pub-id-type="pii">atm-05-21-436</pub-id>
          <pub-id pub-id-type="pmcid">PMC5690964</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Austin</surname>
              <given-names>PC</given-names>
            </name>
            <name name-style="western">
              <surname>Tu</surname>
              <given-names>JV</given-names>
            </name>
          </person-group>
          <article-title>Automated variable selection methods for logistic regression produced unstable models for predicting acute myocardial infarction mortality</article-title>
          <source>J Clin Epidemiol</source>
          <year>2004</year>
          <month>11</month>
          <volume>57</volume>
          <issue>11</issue>
          <fpage>1138</fpage>
          <lpage>46</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jclinepi.2004.04.003</pub-id>
          <pub-id pub-id-type="medline">15567629</pub-id>
          <pub-id pub-id-type="pii">S0895-4356(04)00111-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mahmoudi</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Kamdar</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Gonzales</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Singh</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Waljee</surname>
              <given-names>AK</given-names>
            </name>
          </person-group>
          <article-title>Use of electronic medical records in development and validation of risk prediction models of hospital readmission: systematic review</article-title>
          <source>Br Med J</source>
          <year>2020</year>
          <month>04</month>
          <day>8</day>
          <volume>369</volume>
          <fpage>m958</fpage>
          <pub-id pub-id-type="doi">10.1136/bmj.m958</pub-id>
          <pub-id pub-id-type="medline">32269037</pub-id>
          <pub-id pub-id-type="pmcid">PMC7249246</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
