<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id>
      <journal-title>JMIR Medical Informatics</journal-title>
      <issn pub-type="epub">2291-9694</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v9i12e25022</article-id>
      <article-id pub-id-type="pmid">34889756</article-id>
      <article-id pub-id-type="doi">10.2196/25022</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>On Missingness Features in Machine Learning Models for Critical Care: Observational Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Lovis</surname>
            <given-names>Christian</given-names>
          </name>
        </contrib>
        <contrib contrib-type="editor">
          <name>
            <surname>Hefner</surname>
            <given-names>Jennifer</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Maslove</surname>
            <given-names>David</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Che</surname>
            <given-names>Zhengping</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Weber</surname>
            <given-names>Griffin</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Singh</surname>
            <given-names>Janmajay</given-names>
          </name>
          <degrees>BTECH</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Fuji Xerox Co, Ltd</institution>
            <addr-line>6 Chome-1-1 Minatomirai</addr-line>
            <addr-line>Nishi Ward</addr-line>
            <addr-line>Yokohama, 220-0012</addr-line>
            <country>Japan</country>
            <phone>81 7041120526</phone>
            <email>janmajaysingh14@gmail.com</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6891-8182</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Sato</surname>
            <given-names>Masahiro</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0000-6341</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Ohkuma</surname>
            <given-names>Tomoko</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-5078-4814</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Fuji Xerox Co, Ltd</institution>
        <addr-line>Yokohama</addr-line>
        <country>Japan</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Janmajay Singh <email>janmajaysingh14@gmail.com</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>12</month>
        <year>2021</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>8</day>
        <month>12</month>
        <year>2021</year>
      </pub-date>
      <volume>9</volume>
      <issue>12</issue>
      <elocation-id>e25022</elocation-id>
      <history>
        <date date-type="received">
          <day>14</day>
          <month>10</month>
          <year>2020</year>
        </date>
        <date date-type="rev-request">
          <day>22</day>
          <month>11</month>
          <year>2020</year>
        </date>
        <date date-type="rev-recd">
          <day>17</day>
          <month>2</month>
          <year>2021</year>
        </date>
        <date date-type="accepted">
          <day>2</day>
          <month>9</month>
          <year>2021</year>
        </date>
      </history>
      <copyright-statement>©Janmajay Singh, Masahiro Sato, Tomoko Ohkuma. Originally published in JMIR Medical Informatics (https://medinform.jmir.org), 08.12.2021.</copyright-statement>
      <copyright-year>2021</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on https://medinform.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://medinform.jmir.org/2021/12/e25022" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Missing data in electronic health records is inevitable and considered to be nonrandom. Several studies have found that features indicating missing patterns (missingness) encode useful information about a patient’s health and advocate for their inclusion in clinical prediction models. But their effectiveness has not been comprehensively evaluated.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>The goal of the research is to study the effect of including informative missingness features in machine learning models for various clinically relevant outcomes and explore robustness of these features across patient subgroups and task settings.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>A total of 48,336 electronic health records from the 2012 and 2019 PhysioNet Challenges were used, and mortality, length of stay, and sepsis outcomes were chosen. The latter dataset was multicenter, allowing external validation. Gated recurrent units were used to learn sequential patterns in the data and classify or predict labels of interest. Models were evaluated on various criteria and across population subgroups evaluating discriminative ability and calibration.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Including missingness features generally improved model performance in retrospective tasks. The extent of improvement depended on the outcome of interest (improvements in area under the curve of the receiver operating characteristic [AUROC] ranged from 1.2% to 7.7%) and even on the patient subgroup. However, missingness features did not display utility in a simulated prospective setting, being outperformed (0.9% difference in AUROC) by the model relying only on pathological features. This was despite leading to earlier detection of disease (true positives), since including these features led to a concomitant rise in false positive detections.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>This study comprehensively evaluated effectiveness of missingness features on machine learning models. A detailed understanding of how these features affect model performance may lead to their informed use in clinical settings especially for administrative tasks like length of stay prediction where they present the greatest benefit. While missingness features, representative of health care processes, vary greatly due to intra- and interhospital factors, they may still be used in prediction models for clinically relevant outcomes. However, their use in prospective models producing frequent predictions needs to be explored further.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>electronic health records</kwd>
        <kwd>informative missingness</kwd>
        <kwd>machine learning</kwd>
        <kwd>missing data</kwd>
        <kwd>hospital mortality</kwd>
        <kwd>sepsis</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>The increasing availability of electronic health record (EHR) data collected from hospitals, especially from their intensive care units (ICU), has encouraged the development of various models for disease diagnosis [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref4">4</xref>]. Machine learning and specifically deep learning models, given their ability to adequately learn nonlinear representations and temporal patterns from large amounts of data, have been widely applied to capture complex physiological processes, and several works have demonstrated their usefulness [<xref ref-type="bibr" rid="ref5">5</xref>]. Most works use retrospective observational data to train supervised models for a variety of clinically important outcomes like mortality or sepsis. Some more recent works have also developed models more suited to actual clinical needs by evaluating models prospectively and using early warning scores as baselines [<xref ref-type="bibr" rid="ref6">6</xref>]. Models used to learn human physiological processes from EHRs tackle intrinsic problems in health care data, particularly that of irregular sampling and large amount of missing information [<xref ref-type="bibr" rid="ref7">7</xref>].</p>
        <p>Several methods have been developed to handle the inevitably large amount of missing data in EHRs. Simpler methods like incomplete record deletion (also called complete case analysis) propose to simply delete those records where any value is missing. Various imputation techniques ranging from simple mean imputation to sophisticated methods like multiple imputation with chained equations are also commonly used [<xref ref-type="bibr" rid="ref8">8</xref>]. More recently, deep learning models have been proposed to learn the underlying process generating the data as a method for better inferring missing values [<xref ref-type="bibr" rid="ref9">9</xref>]. A consensus regarding a best universal model to handle missing data does not exist in literature, and it is generally understood to depend heavily on the task and the nature of the data itself. However, a returning consideration in all studies on missing data is the nature of missingness. In Rubin [<xref ref-type="bibr" rid="ref10">10</xref>], missing data were classified into 3 categories: missing completely at random, missing at random, and missing not at random. The nature of missingness in EHRs has been generally understood to belong to the last category, missing not at random [<xref ref-type="bibr" rid="ref11">11</xref>]. This means that missing values cannot be inferred using observed values, subjecting all methods to problems of bias.</p>
        <p>Considering the inevitability of bias, methods seek to minimize it by considering imputed value uncertainty or developing more sophisticated processes to learn underlying distributions [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref12">12</xref>]. A returning simple yet effective motif in deep learning models for EHRs is to use informative missingness (IM) features. First introduced in Lin and Haug [<xref ref-type="bibr" rid="ref11">11</xref>], the method has repeatedly been shown to improve performance of health care models for a variety of outcomes [<xref ref-type="bibr" rid="ref13">13</xref>-<xref ref-type="bibr" rid="ref16">16</xref>]. A particularly efficient use was demonstrated in Lipton et al [<xref ref-type="bibr" rid="ref13">13</xref>], where simply augmenting zero-imputed data with corresponding binary missingness indicators greatly improved over the baseline model. The basic assumption underlying the use of IM features is that the inclusion of health care process variables like laboratory tests conducted or drugs prescribed provides important information about the state and evolution of a patient’s health. These variables are usually inputted to the model as binary indicators of observation/missingness, but some studies have also propounded modifying or augmenting this representation to include additional information such as time since last observation [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref18">18</xref>]. We use the term health care process variables interchangeably with IM features.</p>
        <p>This use of health care process variables as feasible features to model patient health is supported by studies spanning several decades and countries, indicating that test ordering behavior and drug prescriptions are associated with the underlying pathology. For example, Kristiansen et al [<xref ref-type="bibr" rid="ref19">19</xref>] established that the medical condition at hand was the strongest determinant of test ordering behavior, and Weiskopf et al [<xref ref-type="bibr" rid="ref20">20</xref>] and Rusanov et al [<xref ref-type="bibr" rid="ref21">21</xref>] found a statistically significant relationship between data completeness and patient health status, finding that those susceptible to adverse outcomes have more information collected. A recent study also highlighted that EHR data are observational and display a patient’s interactions with the health care system and thus any information from there can only serve as a proxy measure of the patient’s true state [<xref ref-type="bibr" rid="ref22">22</xref>]. They further found that the presence of laboratory test orders, regardless of other information like numerical test values, had a significant association with odds of 3-year survival. This suggests that laboratory test orders encode information separately from laboratory test results, as corroborated by Pivovarov et al [<xref ref-type="bibr" rid="ref23">23</xref>].</p>
        <p>Despite improvements in model performance on including IM features, their use is considered to have limited applicability. Missing information may occur due to several factors, not all of which pertain to patient pathology or a physician’s mental model of the diagnosis process. Within a hospital, some tests may be conducted following general guidelines or as standard practice for all patients regardless of underlying condition [<xref ref-type="bibr" rid="ref23">23</xref>]. Physicians also vary by years of experience and attitudes in coping with uncertainty, which has been shown to affect test ordering behavior [<xref ref-type="bibr" rid="ref24">24</xref>]. In addition, variations between hospitals (as test ordering may depend on resource constraints) and variations due to geographic separation (as ICU case-mix changes) are further exacerbated when making international comparisons [<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref26">26</xref>]. And while machine learning models rely on improved performance on chosen metrics as a justification for continued use of IM features, evaluation has mostly been on single-center data under retrospective task settings. Even where multicenter data are used, hospitals are often not geographically distinct, preventing the assessment of model generalization to different demographic mixes and practices. Also, only recently have some works evaluated their models prospectively, better reflecting real-world clinical utility, but evaluation metrics differ across studies, some choosing to use the concordance index (also called the area under the receiver operating characteristic curve [AUROC]) while others prefer the area under the precision-recall curve [<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref28">28</xref>].</p>
        <p>The ways in which use of IM features is supported and challenged create an apparent disjunction and cast doubts on their true usefulness. This was perhaps exemplified in the PhysioNet 2019 Challenge [<xref ref-type="bibr" rid="ref29">29</xref>] for early prediction of sepsis, which saw many submissions using some modification of IM features [<xref ref-type="bibr" rid="ref16">16</xref>-<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref31">31</xref>]. The challenge was designed to evaluate models on prospective prediction performance and used datasets from 3 geographically distinct hospital systems, one of which was never provided to the participants. While several models had reasonable performance on hospitals they had at least partial access to, scores dropped substantially on the third, unseen hospital. Models using more sophisticated modifications of IM features saw a larger drop than those using simple binary variables or no representation of health care processes.</p>
      </sec>
      <sec>
        <title>Objectives</title>
        <p>In this study we seek to empirically verify and understand the effect that including IM features has on health care machine learning models. We selected 3 common outcomes of interest, mortality, length-of-stay, and sepsis, and trained models for 2 task settings. The first, shared by all outcomes, is entire record classification where the model provides a prediction at the end of a patient’s ICU stay. The second is hourly prediction of label, and only the sepsis label is used for this task.</p>
        <p>We verify the effect of IM feature inclusion on performance, generalizability, and clinical utility of models in 3 steps. First, to get a comprehensive understanding of model performance, binary classification models for each of the outcomes were trained and evaluated using multiple metrics. Since class imbalance varies between outcomes, we could also evaluate model robustness. Second, for the sepsis outcome, since data from 2 distinct hospital systems were available, we could evaluate model generalizability and test whether that is affected by IM features. Third, again for the sepsis outcome, since labels for every hour of patient data were available, we trained a model for temporal prediction of sepsis. We evaluated this model on the hidden hospital system’s data in a simulated prospective manner, in the process understanding how the models would behave in an actual clinical setting and what differences in performance can be expected by including IM features.</p>
        <p>Finally, we hypothesized that health care processes vary across patient demographics and ICU types, which may result in varying missingness rates and patterns across subgroups. Previous works have shown how laboratory variation (and thus test ordering behavior) may vary based on these criteria; this was also seen in our data analysis [<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref33">33</xref>]. Thus, we were motivated to see model performances for different subgroups, as well as to study the different extent to which IM features improve model performance within a subgroup. Based on our data analysis, age and ICU type subgroups were chosen. Since testing was also done on the hidden hospital, we could see how generalization on subgroups is affected by including IM. We could also verify whether models can use IM features to capture the relationship between test ordering and patient pathophysiology despite intra- and interhospital variations.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <p>In this section we describe the datasets used for this study and the preprocessing pipeline. We also describe how outcomes of interest were defined. This is followed by an overview of the task settings and experiments with model implementation details.</p>
      <sec>
        <title>Datasets</title>
        <p>Data from the PhysioNet 2012 and 2019 Challenges were used for this study. From the PhysioNet 2012 [<xref ref-type="bibr" rid="ref34">34</xref>] dataset (P12), we used patient records from training set A and open test set B, each consisting of data from 4000 patients collected from 4 types of ICUs. Several patient outcomes are provided, of which we selected in-hospital death (mortality) and length of stay (number of days between patient’s admission to the ICU and end of hospitalization, LOS). We binarized the LOS outcome, setting 3 days as a heuristic decision threshold, similar to previous studies [<xref ref-type="bibr" rid="ref14">14</xref>]. The data consist of static patient descriptors as well as temporal variables representing patient vitals (low missingness) and values from laboratory tests conducted (high missingness). Imbalance ratios of mortality and LOS were different, at 13.9% and 6.5%, respectively, for set A and 14.2% and 7.0%, respectively, for set B. Since P12 was extracted from the MIMIC II (Multiparameter Intelligent Monitoring in Intensive Care) Clinical Database [<xref ref-type="bibr" rid="ref35">35</xref>], the data were from one hospital system only.</p>
        <p>The PhysioNet 2019 [<xref ref-type="bibr" rid="ref29">29</xref>] dataset (P19) comprised patient records from 3 geographically distinct US hospital systems. A total of 40,336 patient records, 20,336 from hospital A (set A) and 20,000 from hospital B (set B), from 2 ICU types were used. Data from hospital C were not available for download. Since the challenge was aimed at model development for early prediction of sepsis, a corresponding binary label is provided for every hour of the patient’s record. Labeling was done in accordance with the Third International Consensus Definitions for Sepsis and Septic Shock (Sepsis-3) criteria [<xref ref-type="bibr" rid="ref36">36</xref>]. It is important to note that to facilitate training models for early prediction, patients who eventually developed sepsis were labeled as such starting 6 hours before a confirmed diagnosis. More details about the definition of the sepsis label may be found in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. Available variables in the dataset are similar to those in P12, describing static as well as temporal patient features with varying missingness. The cohort from hospital A consisted of 8.8% of patients who developed sepsis while it was 5.7% for hospital B. Due to the cohort selection procedure followed by Reyna et al [<xref ref-type="bibr" rid="ref29">29</xref>], few patients have sepsis from the start of ICU admission. Only 2.2% of hourly records for hospital A and 1.4% for hospital B are labeled as corresponding to sepsis. For analysis of the extent of missingness in the various datasets, please see Figures S1-S5 in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>.</p>
      </sec>
      <sec>
        <title>Preprocessing</title>
        <p>Data preprocessing was done using a pipeline similar to that described in multiple previous studies [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref37">37</xref>]. Data from P12 were resampled on an hourly basis, while P19 data were already resampled. While resampling, some patient records were found to have static descriptors only and others had missing outcome labels in both sets of P12. These were removed, leaving 3997 patient records in set A and 3993 in set B. Invasive and noninvasive measurements of the same variable present in P12 were averaged to form aggregate measurements. In P19, end tidal carbon dioxide was a variable observed only in hospital B, so it was removed from consideration. Static patient features describing age, gender, or ICU type identifiers were not used as inputs. This left us with 33 features in P12 and 34 in P19, which were used for model training. To deal with missing data, zero imputation was performed in both datasets, since Lipton et al [<xref ref-type="bibr" rid="ref13">13</xref>] showed that this simple strategy proved quite effective when used to train deep learning models.</p>
        <p>For model training and evaluation, training and testing sets were identified. Set A from both datasets was used for training while set B was shown to the model only for final evaluation. It is worth noting again that set B in P19 belonged to a distinct hospital system. Data were standardized before inputting to the model. Mean and variance from training data were used to standardize corresponding test data.</p>
        <p>Finally, we describe the derivation of features to represent missingness. We selected the simplest representation using binary indicator variables, with a 1 used to denote variable observation and a 0 otherwise. Every feature described earlier had a corresponding missingness indicator that was appended to the feature vector as in Lipton et al [<xref ref-type="bibr" rid="ref13">13</xref>]. This resulted in 66 features for P12 and 68 for P19.</p>
      </sec>
      <sec>
        <title>Modeling Methodology</title>
        <p>Since patient pathophysiology evolves nonlinearly over time, sequential models like recurrent neural networks (RNN) are considered suitable and have often been used in previous works [<xref ref-type="bibr" rid="ref38">38</xref>]. We used a gated RNN variant, specifically a gated recurrent unit (GRU), to model long EHR sequences [<xref ref-type="bibr" rid="ref39">39</xref>]. A multilayer perceptron followed by a sigmoid layer was used after the GRU to output binary label probabilities.</p>
        <p>The model was implemented in PyTorch [<xref ref-type="bibr" rid="ref40">40</xref>] and trained using minibatch gradient descent to minimize binary cross entropy loss with Adam [<xref ref-type="bibr" rid="ref41">41</xref>] as the optimizer. Models trained with IM augmented features are denoted by masking while those trained with patient physiological features only are denoted by no masking.</p>
        <p>We performed 5-fold stratified cross validation for hyperparameter tuning and to prevent model overfitting. To tune hyperparameters, we performed an iterative ranging investigation to determine a suitable grid followed by a grid search [<xref ref-type="bibr" rid="ref42">42</xref>]. Maximum averaged AUROC and utility score across all folds were chosen as the criteria for hyperparameter set selection for the retrospective and simulated prospective tasks, respectively [<xref ref-type="bibr" rid="ref29">29</xref>]. No attempt was made to tune model architecture as our focus was not to propose a new model but to evaluate IM feature effectiveness.</p>
      </sec>
      <sec>
        <title>Task Settings</title>
        <p>We analyzed the effectiveness of including IM features by defining 2 tasks, (1) retrospective classification where we verify IM usefulness on model performance, calibration, and generalizability and (2) simulated prospective classification to study IM effect on model prediction trends in a temporal manner.</p>
        <sec>
          <title>Retrospective Classification</title>
          <p>In this setting, the model is trained to predict the appropriate label at the end of a patient’s hospital stay. For this purpose, mortality and LOS labels were used directly from the outcomes provided in P12. For P19, a sepsis-overall label was derived from the hourly labels provided. If a patient developed sepsis at any time, their entire record was marked as positive for sepsis. The task for all 3 labels was binary classification after using the entire patient record as input. We studied the effect of IM in 2 steps, overall classification and subgroup analysis:</p>
          <list list-type="bullet">
            <list-item>
              <p>To verify changes in performance on IM inclusion, the models were evaluated on all of the testing data for all datasets and labels. Multiple evaluation metrics were used to understand how IM features change performance and calibration while data from a distinct hospital were used to evaluate changes in model generalizability.</p>
            </list-item>
            <list-item>
              <p>To study extent of improvement on different patient subgroups, models were trained on all of the training data (representative of a general ICU population) and evaluated on identified subgroups made from the test set. Both datasets provided 3 general patient descriptors: age, gender, and ICU type. Visual comparison of variable observation differences between these strata was performed. Gender showed no substantial difference in variable observation. Different ICU types displayed clear differences as did age after binning into suitable intervals (Figures S6-S11 in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>). These strata were chosen for subgroup analysis.</p>
            </list-item>
          </list>
        </sec>
        <sec>
          <title>Simulated Prospective Classification</title>
          <p>Only P19 was used for this task since P12 did not have hourly labels. The model was trained to predict patient probability of sepsis at every hour using the shifted labels provided in the dataset. At time <italic>t</italic>, information from the beginning of the patient record to <italic>t</italic> was used to make a prediction. This ensured prospective usefulness of the model. Since the model was trained on labels shifted by 6 hours (for septic patients), we expected the model to learn early signs of sepsis onset. The sepsis-overall label described earlier was used for cross-validation and hyperparameter tuning.</p>
        </sec>
      </sec>
      <sec>
        <title>Performance Evaluation</title>
        <p>Model discriminative ability was judged by the concordance index or AUROC. Since this is known to be an overoptimistic measure for imbalanced datasets [<xref ref-type="bibr" rid="ref43">43</xref>], we also used the precision-recall curve and average precision to evaluate predictive value [<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref45">45</xref>]. Finally, 2 measures were used to assess model calibration: reliability plots and Brier score. The former was useful to visualize calibration changes against different levels of model uncertainty. The latter was used to quantify an averaged deviation from true probabilities and as a convenient summary of uncertainty, resolution, and reliability [<xref ref-type="bibr" rid="ref46">46</xref>]. We also visualized the number of samples in each bin of the reliability plots by varying marker area proportional to the square root of the bin size scaled by a constant factor. Finally, AUROC and Brier score were reported with 95% confidence intervals computed with 10,000 bootstrap replications to obtain a good estimation of model performance up to the second significant digit [<xref ref-type="bibr" rid="ref47">47</xref>].</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Retrospective Classification</title>
        <sec>
          <title>Overall Classification</title>
          <p>The first 3 rows of <xref ref-type="table" rid="table1">Table 1</xref> summarize results for the overall classification tasks. Including IM resulted in considerable improvements over using patient physiological features only for both tasks on P12 and the sepsis-overall task on P19. The extent of improvement in average precision mimicked trends of improvements in AUROC. The no masking model had an average precision of 0.493 on the P12 mortality task, and including IM features improved this to 0.511. The performance gain was more marked for the P12 LOS task, as average precision was 0.173 without and 0.368 with masking. It is worth noting that the derived LOS label in P12 had higher class imbalance than the mortality label for the same dataset. The P19 sepsis-overall task also saw an improvement in average precision where the no masking model achieved 0.537 and this was 0.547 for the masking model. Panels A and B of <xref rid="figure1" ref-type="fig">Figures 1</xref>-<xref rid="figure3" ref-type="fig">3</xref> graphically show the receiver operating characteristic and PR curves for these tasks.</p>
          <p>Including IM features also improved model calibration scores in all 3 cases, as seen by the Brier score (lower is better). The improved Brier score (0.039 with IM features vs 0.045 without) for the P19 sepsis-overall task, where evaluation was on a distinct hospital, suggests that the model does not overfit to hospital-specific health care process variables. Panel C of <xref rid="figure1" ref-type="fig">Figures 1</xref>-<xref rid="figure3" ref-type="fig">3</xref> shows the calibration plots for each task setting. The 2 models had very similar plots for the P12 mortality task. The difference was again most pronounced for the P12 LOS task, where the masking model had better calibration at higher model certainties (predicted probabilities). The masking model also showed improved calibration for the P19 sepsis-overall task, as seen in <xref rid="figure3" ref-type="fig">Figure 3</xref>C.</p>
          <table-wrap position="float" id="table1">
            <label>Table 1</label>
            <caption>
              <p>Results of model discrimination and calibration for all task settings on the test data. These correspond to internal validation for PhysioNet 2012 Challenge and external for PhysioNet 2019 Challenge.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="160"/>
              <col width="210"/>
              <col width="210"/>
              <col width="210"/>
              <col width="210"/>
              <thead>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Masking (AUROC<sup>a</sup>), mean (95% CI)</td>
                  <td>Masking (Brier), mean (95% CI)</td>
                  <td>No masking (AUROC), mean (95% CI)</td>
                  <td>No masking (Brier), mean (95% CI)</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td>P12<sup>b</sup> mortality</td>
                  <td>0.842 (0.82-0.86)</td>
                  <td>0.093 (0.087-0.100)</td>
                  <td>0.830 (0.81-0.85)</td>
                  <td>0.095 (0.088-0.101)</td>
                </tr>
                <tr valign="top">
                  <td>P12 LOS<sup>c</sup></td>
                  <td>0.814 (0.79-0.84)</td>
                  <td>0.054 (0.049-0.060)</td>
                  <td>0.737 (0.71-0.77)</td>
                  <td>0.064 (0.058-0.070)</td>
                </tr>
                <tr valign="top">
                  <td>P19<sup>d</sup> sepsis-overall</td>
                  <td>0.907 (0.90-0.92)</td>
                  <td>0.039 (0.036-0.041)</td>
                  <td>0.889 (0.88-0.90)</td>
                  <td>0.045 (0.043-0.048)</td>
                </tr>
                <tr valign="top">
                  <td>P19 sepsis-frequent</td>
                  <td>0.757 (0.74-0.77)</td>
                  <td>0.014 (0.013-0.014)</td>
                  <td>0.766 (0.75-0.78)</td>
                  <td>0.014 (0.013-0.015)</td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table1fn1">
                <p><sup>a</sup>AUROC: area under the curve of the receiver operating characteristic.</p>
              </fn>
              <fn id="table1fn2">
                <p><sup>b</sup>P12: PhysioNet 2012 Challenge.</p>
              </fn>
              <fn id="table1fn3">
                <p><sup>c</sup>LOS: length of stay.</p>
              </fn>
              <fn id="table1fn4">
                <p><sup>d</sup>P19: PhysioNet 2019 Challenge.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
          <fig id="figure1" position="float">
            <label>Figure 1</label>
            <caption>
              <p>Receiver operating characteristic (ROC) curve, precision-recall (PR) curve, and calibration plot for the PhysioNet 2012 Challenge mortality classification task.</p>
            </caption>
            <graphic xlink:href="medinform_v9i12e25022_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
          <fig id="figure2" position="float">
            <label>Figure 2</label>
            <caption>
              <p>Receiver operating characteristic (ROC) curve, precision-recall (PR) curve, and calibration plot for the PhysioNet 2012 Challenge length of stay classification task.</p>
            </caption>
            <graphic xlink:href="medinform_v9i12e25022_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
          <fig id="figure3" position="float">
            <label>Figure 3</label>
            <caption>
              <p>Receiver operating characteristic (ROC) curve, precision-recall (PR) curve, and calibration plot for the PhysioNet 2019 Challenge sepsis-overall classification task.</p>
            </caption>
            <graphic xlink:href="medinform_v9i12e25022_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Subgroup Analysis</title>
          <p><xref ref-type="table" rid="table2">Tables 2</xref>-<xref ref-type="table" rid="table4">4</xref> summarize model performances on the identified subgroups for the 3 overall classification task settings. For variance estimation in results, the subgroup data were bootstrapped keeping the sample size equal to subgroup size. These results have also been visualized as bar plots in Figures S12-S14 in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>.</p>
          <p>For the P12 mortality task in <xref ref-type="table" rid="table2">Table 2</xref>, the no masking model outperformed the masking model for the age bins 35 years and younger and 45 to 55 years, while the masking model had better performance for all other age groups. The best AUROC over all ages was achieved by the masking model on the 35- to 45-year group, which also saw the largest improvement on including IM features (2.6%). While younger and middle-aged groups saw inconsistent performance changes on IM inclusion, older patients (older than 55 years) showed consistent improvements from 0.8% to 1.5% in all-cause mortality classification. When considering performances in different ICUs, the masking model generally had better performance except for the coronary care unit (CCU), but the difference was not substantial. The cardiac surgery recovery unit saw the highest AUROC and also the greatest improvement of 1.7% on IM inclusion.</p>
          <p>Similar to the prominent improvements in the P12 LOS-overall classification task, the masking model considerably outperformed the no masking model for all age and ICU type subgroups. The youngest age group, 35 years and younger, saw an improvement of 15.5% in AUROC, becoming the subgroup with the best performance out of all age groups. Comparatively, the 55- to 65-year subgroup, which had the best model performance without IM, saw an improvement of only 0.7%. The cardiac surgery recovery unit again saw the largest performance gain on IM inclusion, of 13.1%, followed by the surgical ICU with 10.2% and the CCU, with a relatively small gain of 2.8%.</p>
          <p>Finally, for the P19 sepsis-overall task, the masking model again outperformed the no masking model in all subgroups except for the 35- to 45-year bin. Older groups (older than 55 years) generally saw a larger improvement, with the greatest increase in AUROC seen in the 65- to 75-year group, at 4%. While the surgical and medical ICUs had the same AUROC without IM, the masking model performed better on the surgical ICU.</p>
          <p>Brier score trends generally showed similar or improved calibration on including IM features for all outcomes and subgroups. Particularly for P19 sepsis-overall, calibration improved despite external validation.</p>
          <table-wrap position="float" id="table2">
            <label>Table 2</label>
            <caption>
              <p>Subgroup analysis results for the PhysioNet 2012 Challenge mortality classification task.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="30"/>
              <col width="160"/>
              <col width="0"/>
              <col width="90"/>
              <col width="0"/>
              <col width="180"/>
              <col width="0"/>
              <col width="180"/>
              <col width="0"/>
              <col width="180"/>
              <col width="0"/>
              <col width="180"/>
              <thead>
                <tr valign="top">
                  <td colspan="3">
                    <break/>
                  </td>
                  <td colspan="2">#Samples</td>
                  <td colspan="2">Masking (AUROC<sup>a</sup>), mean (95% CI)</td>
                  <td colspan="2">Masking (Brier), mean (95% CI)</td>
                  <td colspan="2">No masking (AUROC), mean (95% CI)</td>
                  <td>No masking (Brier), mean (95% CI)</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td colspan="12">
                    <bold>Age strata (years)</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>≤35</td>
                  <td colspan="2">268</td>
                  <td colspan="2">0.847 (0.74-0.93)</td>
                  <td colspan="2">0.057 (0.037-0.079)</td>
                  <td colspan="2">0.852 (0.75-0.94)</td>
                  <td colspan="2">0.059 (0.040-0.079)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>35-45</td>
                  <td colspan="2">309</td>
                  <td colspan="2">0.906 (0.84-0.96)</td>
                  <td colspan="2">0.048 (0.031-0.066)</td>
                  <td colspan="2">0.880 (0.80-0.95)</td>
                  <td colspan="2">0.054 (0.037-0.072)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>45-55</td>
                  <td colspan="2">569</td>
                  <td colspan="2">0.878 (0.82-0.93)</td>
                  <td colspan="2">0.064 (0.050-0.078)</td>
                  <td colspan="2">0.885 (0.83-0.93)</td>
                  <td colspan="2">0.064 (0.052-0.077)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>55-65</td>
                  <td colspan="2">708</td>
                  <td colspan="2">0.859 (0.82-0.90)</td>
                  <td colspan="2">0.074 (0.060-0.090)</td>
                  <td colspan="2">0.848 (0.80-0.89)</td>
                  <td colspan="2">0.076 (0.063-0.090)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>65-75</td>
                  <td colspan="2">845</td>
                  <td colspan="2">0.830 (0.79-0.87)</td>
                  <td colspan="2">0.094 (0.079-0.109)</td>
                  <td colspan="2">0.822 (0.78-0.86)</td>
                  <td colspan="2">0.094 (0.080-0.108)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>&#62;75</td>
                  <td colspan="2">1294</td>
                  <td colspan="2">0.801 (0.77-0.83)</td>
                  <td colspan="2">0.135 (0.121-0.149)</td>
                  <td colspan="2">0.786 (0.75-0.82)</td>
                  <td colspan="2">0.135 (0.123-0.149)</td>
                </tr>
                <tr valign="top">
                  <td colspan="12">
                    <bold>ICU<sup>b</sup> types</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Coronary care unit</td>
                  <td colspan="2">587</td>
                  <td colspan="2">0.806 (0.75-0.86)</td>
                  <td colspan="2">0.087 (0.069-0.106)</td>
                  <td colspan="2">0.807 (0.74-0.86)</td>
                  <td colspan="2">0.086 (0.070-0.104)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Cardiac surgery unit</td>
                  <td colspan="2">780</td>
                  <td colspan="2">0.862 (0.79-0.92)</td>
                  <td colspan="2">0.035 (0.025-0.046)</td>
                  <td colspan="2">0.845 (0.76-0.92)</td>
                  <td colspan="2">0.037 (0.028-0.048)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Surgical ICU</td>
                  <td colspan="2">1192</td>
                  <td colspan="2">0.852 (0.82-0.88)</td>
                  <td colspan="2">0.094 (0.082-0.107)</td>
                  <td colspan="2">0.843 (0.81-0.87)</td>
                  <td colspan="2">0.095 (0.083-0.106)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Medical ICU</td>
                  <td colspan="2">1434</td>
                  <td colspan="2">0.801 (0.77-0.83)</td>
                  <td colspan="2">0.128 (0.115-0.140)</td>
                  <td colspan="2">0.787 (0.76-0.82)</td>
                  <td colspan="2">0.129 (0.117-0.141)</td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table2fn1">
                <p><sup>a</sup>AUROC: area under the curve of the receiver operating characteristic.</p>
              </fn>
              <fn id="table2fn2">
                <p><sup>b</sup>ICU: intensive care unit.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
          <table-wrap position="float" id="table3">
            <label>Table 3</label>
            <caption>
              <p>Subgroup analysis results for the PhysioNet 2012 Challenge length of stay classification task.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="30"/>
              <col width="160"/>
              <col width="0"/>
              <col width="90"/>
              <col width="0"/>
              <col width="180"/>
              <col width="180"/>
              <col width="0"/>
              <col width="180"/>
              <col width="0"/>
              <col width="180"/>
              <thead>
                <tr valign="top">
                  <td colspan="3">
                    <break/>
                  </td>
                  <td colspan="2">#Samples</td>
                  <td>Masking (AUROC<sup>a</sup>), mean (95% CI)</td>
                  <td colspan="2">Masking (Brier), mean (95% CI)</td>
                  <td colspan="2">No masking (AUROC), mean (95% CI)</td>
                  <td>No masking (Brier), mean (95% CI)</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td colspan="11">
                    <bold>Age strata (years)</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>≤35</td>
                  <td colspan="2">268</td>
                  <td colspan="2">0.862 (0.80-0.92)</td>
                  <td>0.081 (0.055-0.109)</td>
                  <td colspan="2">0.707 (0.61-0.80)</td>
                  <td colspan="2">0.108 (0.079-0.138)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>35-45</td>
                  <td colspan="2">309</td>
                  <td colspan="2">0.820 (0.71-0.91)</td>
                  <td>0.060 (0.040-0.081)</td>
                  <td colspan="2">0.721 (0.62-0.82)</td>
                  <td colspan="2">0.079 (0.057-0.104)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>45-55</td>
                  <td colspan="2">569</td>
                  <td colspan="2">0.800 (0.72-0.88)</td>
                  <td>0.057 (0.042-0.073)</td>
                  <td colspan="2">0.712 (0.63-0.79)</td>
                  <td colspan="2">0.064 (0.048-0.081)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>55-65</td>
                  <td colspan="2">708</td>
                  <td colspan="2">0.797 (0.71-0.87)</td>
                  <td>0.045 (0.033-0.059)</td>
                  <td colspan="2">0.790 (0.72-0.86)</td>
                  <td colspan="2">0.054 (0.042-0.068)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>65-75</td>
                  <td colspan="2">845</td>
                  <td colspan="2">0.803 (0.72-0.87)</td>
                  <td>0.047 (0.035-0.060)</td>
                  <td colspan="2">0.712 (0.64-0.78)</td>
                  <td colspan="2">0.053 (0.042-0.065)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>&#62;75</td>
                  <td colspan="2">1294</td>
                  <td colspan="2">0.814 (0.77-0.86)</td>
                  <td>0.056 (0.046-0.067)</td>
                  <td colspan="2">0.747 (0.69-0.80)</td>
                  <td colspan="2">0.062 (0.052-0.073)</td>
                </tr>
                <tr valign="top">
                  <td colspan="11">
                    <bold>ICU<sup>b</sup> types</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Coronary care unit</td>
                  <td colspan="2">587</td>
                  <td colspan="2">0.791 (0.73-0.85)</td>
                  <td>0.086 (0.068-0.105)</td>
                  <td colspan="2">0.763 (0.71-0.82)</td>
                  <td colspan="2">0.095 (0.078-0.112)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Cardiac surgery unit</td>
                  <td colspan="2">780</td>
                  <td colspan="2">0.890 (0.77-0.98)</td>
                  <td>0.013 (0.006-0.020)</td>
                  <td colspan="2">0.759 (0.60-0.90)</td>
                  <td colspan="2">0.018 (0.011-0.025)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Surgical ICU</td>
                  <td colspan="2">1192</td>
                  <td colspan="2">0.812 (0.75-0.87)</td>
                  <td>0.046 (0.036-0.056)</td>
                  <td colspan="2">0.710 (0.64-0.77)</td>
                  <td colspan="2">0.056 (0.036-0.056)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Medical ICU</td>
                  <td colspan="2">1434</td>
                  <td colspan="2">0.776 (0.73-0.82)</td>
                  <td>0.071 (0.060-0.083)</td>
                  <td colspan="2">0.682 (0.63-0.73)</td>
                  <td colspan="2">0.082 (0.071-0.094)</td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table3fn1">
                <p><sup>a</sup>AUROC: area under the curve of the receiver operating characteristic.</p>
              </fn>
              <fn id="table3fn2">
                <p><sup>b</sup>ICU: intensive care unit.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
          <table-wrap position="float" id="table4">
            <label>Table 4</label>
            <caption>
              <p>Subgroup analysis results for the PhysioNet 2019 Challenge sepsis-overall classification task. A total of 6095 patients did not have intensive care unit type specified, and thus, they were not considered for the corresponding analysis.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="30"/>
              <col width="160"/>
              <col width="0"/>
              <col width="90"/>
              <col width="0"/>
              <col width="180"/>
              <col width="0"/>
              <col width="180"/>
              <col width="0"/>
              <col width="180"/>
              <col width="0"/>
              <col width="180"/>
              <thead>
                <tr valign="top">
                  <td colspan="3">
                    <break/>
                  </td>
                  <td colspan="2">#Samples</td>
                  <td colspan="2">Masking (AUROC<sup>a</sup>), mean (95% CI)</td>
                  <td colspan="2">Masking (Brier), mean (95% CI)</td>
                  <td colspan="2">No masking (AUROC), mean (95% CI)</td>
                  <td>No masking (Brier), mean (95% CI)</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td colspan="12">
                    <bold>Age strata (years)</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>≤35</td>
                  <td colspan="2">1742</td>
                  <td colspan="2">0.904 (0.86-0.94)</td>
                  <td colspan="2">0.037 (0.029-0.045)</td>
                  <td colspan="2">0.893 (0.85-0.93)</td>
                  <td colspan="2">0.044 (0.035-0.052)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>35-45</td>
                  <td colspan="2">1949</td>
                  <td colspan="2">0.911 (0.88-0.94)</td>
                  <td colspan="2">0.041 (0.033-0.049)</td>
                  <td colspan="2">0.910 (0.88-0.94)</td>
                  <td colspan="2">0.046 (0.038-0.055)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>45-55</td>
                  <td colspan="2">3334</td>
                  <td colspan="2">0.920 (0.90-0.94)</td>
                  <td colspan="2">0.032 (0.026-0.037)</td>
                  <td colspan="2">0.900 (0.87-0.93)</td>
                  <td colspan="2">0.037 (0.032-0.043)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>55-65</td>
                  <td colspan="2">4581</td>
                  <td colspan="2">0.897 (0.87-0.92)</td>
                  <td colspan="2">0.042 (0.037-0.048)</td>
                  <td colspan="2">0.886 (0.86-0.91)</td>
                  <td colspan="2">0.048 (0.042-0.053)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>65-75</td>
                  <td colspan="2">4768</td>
                  <td colspan="2">0.917 (0.90-0.94)</td>
                  <td colspan="2">0.039 (0.034-0.043)</td>
                  <td colspan="2">0.877 (0.85-0.90)</td>
                  <td colspan="2">0.049 (0.043-0.054)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>&#62;75</td>
                  <td colspan="2">3626</td>
                  <td colspan="2">0.896 (0.87-0.92)</td>
                  <td colspan="2">0.040 (0.034-0.046)</td>
                  <td colspan="2">0.888 (0.86-0.91)</td>
                  <td colspan="2">0.045 (0.039-0.051)</td>
                </tr>
                <tr valign="top">
                  <td colspan="12">
                    <bold>ICU<sup>b</sup> types</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Medical ICU</td>
                  <td colspan="2">6923</td>
                  <td colspan="2">0.895 (0.88-0.91)</td>
                  <td colspan="2">0.044 (0.040-0.048)</td>
                  <td colspan="2">0.882 (0.86-0.90)</td>
                  <td colspan="2">0.049 (0.045-0.053)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Surgical ICU</td>
                  <td colspan="2">6982</td>
                  <td colspan="2">0.903 (0.89-0.92)</td>
                  <td colspan="2">0.041 (0.037-0.045)</td>
                  <td colspan="2">0.882 (0.86-0.90)</td>
                  <td colspan="2">0.050 (0.046-0.055)</td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table4fn1">
                <p><sup>a</sup>AUROC: area under the curve of the receiver operating characteristic.</p>
              </fn>
              <fn id="table4fn2">
                <p><sup>b</sup>ICU: intensive care unit.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
        </sec>
      </sec>
      <sec>
        <title>Simulated Prospective Classification</title>
        <p>The last row of <xref ref-type="table" rid="table1">Table 1</xref> summarizes the nontemporal evaluation for this task setting. Unlike overall classification, the no masking model outperformed the masking model while keeping almost the same calibration.</p>
        <p>Before discussing temporal performances, it is necessary to understand the LOS distribution for each patient category. LOS averaged over the entire cohort was very similar for both P19 hospitals, at 39.77 (SD 22.55) hours and 38.23 (SD 23.27) hours for A and B, respectively. Separating the cohort into patients who eventually develop sepsis and those who don’t shows that patients who develop sepsis spend a longer time in the ICU. For hospital A, septic patients spent 59.54 (SD 57.81) hours on average while nonseptic patients spent 37.87 (SD 13.92) hours. Similarly, for hospital B this was 59.22 (SD 61.90) hours for septic patients and 36.96 (SD 17.72) hours for nonseptic patients. The cohort for both hospitals consisted almost entirely of patients with sepsis after 3 days.</p>
        <p>Temporal evaluation shown in <xref rid="figure4" ref-type="fig">Figure 4</xref>B displays almost equal predictive value at each hour over the first 100 hours of ICU admission, with peak predictive value achieved at a little over 90 hours. This is likely due to the LOS characteristics of the datasets. <xref rid="figure4" ref-type="fig">Figure 4</xref>A shows how model predictions change over time for patients who eventually develop sepsis and those who don’t. We observed a considerable divergence between the curves of masking and no masking models (regardless of sepsis category) a little after 2 days of ICU admission. The same plot also shows trends in the proportion of septic patients at each hour, giving an insight into the expected amount of false alarms or missed diagnoses by each model.</p>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>Temporal evaluation for the PhysioNet 2019 Challenge sepsis-frequent task; records corresponding to sepsis are labeled as S=1 while the remainder are S=0: (A) drop in probability of false-positive prediction (S=0) is because after 90 hours, only patients with sepsis remain in the data; (B) this cohort characteristic is learned by the model resulting in perfect predictive value after 90 hours. ICU: intensive care unit.</p>
          </caption>
          <graphic xlink:href="medinform_v9i12e25022_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>Results from the retrospective-overall classification shown in <xref ref-type="table" rid="table1">Table 1</xref> were consistent with previous studies [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref14">14</xref>], confirming that including even simple representations of health care processes like binary IM features improves performance. This was further reinforced by evaluating the models on a variety of metrics summarizing predictive value and calibration. Model discrimination and predictive value were improved in all cases while keeping the same or better calibration. Results of the P19 sepsis-overall task also confirmed that model generalization in such retrospective tasks is not affected by including IM features, despite interhospital variations. Calibration plots in panel C of <xref rid="figure1" ref-type="fig">Figures 1</xref>-<xref rid="figure3" ref-type="fig">3</xref> showed that model reliability was improved for nearly all levels of model certainty, especially for higher predicted probabilities, making the masking model more trustworthy.</p>
        <p>Subgroup analysis helped us verify the IM inclusion effect on population subgroups and whether health care process variables encoded information about pathophysiology despite intra- and interhospital variations, justifying their use as proxy biomarkers of patient health. In the P12 mortality subgroup task (<xref ref-type="table" rid="table2">Table 2</xref>), while the masking model performed better on average in the entire test set, it failed to improve upon the no masking model for certain age groups suggesting that for younger patients, trends in physiological features alone are better predictors of in-hospital death. The masking model was also slightly outperformed by the no masking model in the CCU subgroup, which may be because CCU patients have a very specific set of complications, rendering several laboratory tests unnecessary [<xref ref-type="bibr" rid="ref48">48</xref>]. For subgroups in P12 LOS (<xref ref-type="table" rid="table3">Table 3</xref>), however, considerable improvements in AUROC for younger age groups were observed, suggesting laboratory tests conducted were important indicators to estimate whether a patient will spend more or less than 3 days in the ICU. The CCU again saw only a slight improvement, probably due to a generally earlier diagnosis relative to other ICUs. Overall, for both P12 outcomes, younger age groups and the cardiac surgery recovery unit had the highest AUROCs achieved by masking models.</p>
        <p>For subgroups in the P19 sepsis-overall task (<xref ref-type="table" rid="table4">Table 4</xref>), older age groups generally saw greater benefit from IM inclusion. Sepsis is known to be associated with age, which may in turn prompt physicians to order relevant tests earlier in the patient’s ICU stay [<xref ref-type="bibr" rid="ref49">49</xref>]. The surgical ICU again saw a greater improvement in AUROC over the medical ICU, while the model had almost equal performance for both ICUs using only physiological features. This task also evaluated model performance and effect of IM features on model generalization, since the subgroups were made using data from a distinct hospital. These results suggest that, at least in retrospective task settings, health care process variables do not hinder model generalization and models trained using these variables can adequately learn the relation of IM features to the underlying condition without being affected by interhospital variations.</p>
        <p>Calibration indicated by the Brier score showed that the model actually learns to output better probabilities when health care process variables are included.</p>
      </sec>
      <sec>
        <title>Relationship With Prior Work</title>
        <p>Perhaps the study most similar to this work was by Sharafoddini et al [<xref ref-type="bibr" rid="ref50">50</xref>], which examined whether missing indicator features are informative. The study performed extensive data analysis and evaluated logistic regression and tree-based models trained with and without missing indicators to assess any difference in discriminative ability. Their results demonstrated improved model performance upon IM inclusion, and feature selection methods reinforced the importance of IM variables. While this work is similarly motivated in its goal to objectively assess IM features, there are some essential differences. We focused on several outcomes of interest as opposed to mortality only, as discussed earlier. We also provided comprehensive evaluation through multiple metrics, assessing not only overall discrimination but also hourly discrimination and model calibration. Subgroup analysis and evaluation of model generalization on a distinct patient population further contribute to the novelty of this work. Previous studies did not evaluate their model’s performance on ICU population subgroups, instead assuming similar performances across patients [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref14">14</xref>]. We showed that discrimination varies between strata as does the extent of improvement brought by including IM features. Finally, we used a sequential deep learning model (GRU) as opposed to the models used in Sharafoddini et al [<xref ref-type="bibr" rid="ref50">50</xref>], since RNN variants have been popular choices to model EHR data and often use IM features to improve performances [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref14">14</xref>].</p>
        <p>Temporal trends in probability of predicting sepsis shown in <xref rid="figure4" ref-type="fig">Figure 4</xref>A confirm previous findings by Sharafoddini et al [<xref ref-type="bibr" rid="ref50">50</xref>] that indicators become increasingly important from the second day onward in the ICU. But this is arguably too late, since patients who eventually developed sepsis had a higher variance in LOS, many becoming septic early on in their ICU stay. While including IM features results in better model performance overall, it also falsely identifies nonsepsis patients as susceptible (false positives) in the near future, leading to several false alarms. In the PhysioNet 2019 Challenge, the utility score metric applied a minimal penalty for false positive predictions, while also leading to earlier and greater true positives, perhaps explaining the extensive use of IM features in proposed models. But alarm fatigue is a known issue in ICU early warning scores, and false positives cannot be ignored [<xref ref-type="bibr" rid="ref51">51</xref>]. When performance on predicting the absence of sepsis (true negatives) is not considered, the net predictive value gets balanced out, as shown in <xref rid="figure4" ref-type="fig">Figure 4</xref>B. Also, unlike previous studies, which relied on end-of-day outcome prediction or thresholded decision outputs for evaluation, we relied exclusively on hourly probabilities and visualized their trends over time, which may be used to understand a model’s clinical utility more comprehensively [<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref42">42</xref>].</p>
        <p>It is important to understand that IM feature effectiveness varies based on the outcome of interest, whether they are applied for retrospective or prospective tasks and even on population subgroups. With IM features now being used for a variety of tasks including classification, prediction, and even imputation, models relying on these may further propagate preexisting biases in health care processes.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>A limitation of this study was using data from a single country, in this case the United States. Practices and case-mix vary by country. Physician attitudes to uncertainty (which may influence test ordering and drug prescription) may also be affected by resource limitations and even by cultural factors [<xref ref-type="bibr" rid="ref24">24</xref>]. This requires verifying masking model generalizability on data from different parts of the world. Efforts have been made to standardize test ordering behavior, but guidelines are followed to varying extents depending on patient histories, comorbidities, and the physician in charge [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref52">52</xref>].</p>
        <p>The datasets we used were observational, with no information regarding the context in which laboratory tests were ordered or which patients were transfers from other ICUs. The latter leads to the problem of lead-time bias, which may be reflected in the data as unexpected adverse outcomes for certain patients [<xref ref-type="bibr" rid="ref53">53</xref>]. We also evaluated IM feature effectiveness on only one model type, GRU (an RNN variant). While we selected this because of its common use in prior work, different models may learn IM representations differently [<xref ref-type="bibr" rid="ref38">38</xref>].</p>
        <p>Critical care EHRs are also a specific subtype of general EHRs, since they consist only of inpatients with serious conditions. A more general EHR dataset that includes outpatients may result in different health care process observation patterns and reveal interesting effects on predictive models [<xref ref-type="bibr" rid="ref23">23</xref>]. Finally, clinical best practices change over time, in turn affecting which tests are performed and how often. This is part of the larger problem of dataset shift in machine learning, and it remains to be seen how this would affect clinical models relying on health care process features.</p>
      </sec>
      <sec>
        <title>Conclusion and Future Work</title>
        <p>With increasing use of observational EHR data for machine learning model development, there has been an increase in the number of studies claiming clinical utility of proposed models, many relying on variables representative of health care processes. In this study, we addressed questions regarding the effect of using health care process features on machine learning model performance and generalizability. By separating commonly used task settings into 2 subtypes, retrospective and (simulated) prospective, we made an important distinction concerning possible clinical utility of models. We framed all our results using multiple evaluation metrics while also analyzing external validation performances for all tasks by using data from a geographically distinct hospital.</p>
        <p>This study demonstrated the usefulness of IM features in retrospective task settings on various outcome labels. Notably, we found that machine learning model generalization and calibration are not adversely affected by using health care process variables even when externally evaluated. However, the extent of improvement may depend on different patient and in-hospital factors such as age or ICU type. Our research indicated that these features provide better information for certain subgroups than others, and IM variables are better predictors of administrative outcomes like length of stay than mortality or sepsis. Results also showed that, at least for a sequential deep learning model, using simple binary missingness indicators for simulated prospective sepsis classification did not add any benefit over a model relying on patient pathological features only.</p>
        <p>Our findings suggest that the suitability of using IM features in machine learning models may vary based on the outcome of interest, subgroup of application, task setting (retrospective or prospective), and differences in clinical practice between training data and test data. Class imbalances and nature of outcome have a strong impact on expected performance improvements from IM feature inclusion. In application, the subgroup of a patient and deviation in model performance from its expectation also need to be considered while estimating the uncertainty of a prediction. Also, while ultimately machine learning models aim to lend themselves to use as continuous monitoring bedside tools, using IM features does not seem to add any prominent improvement over not using them in that setting. Finally, using IM means using clinical practice variables in a model, so different missingness rates and missingness patterns need to be properly contextualized to understand model performance differences between train and test environments. Biased observations in one dataset (due to practice or even hospital resource variations) may have a substantial effect on model discrimination and calibration in another dataset.</p>
        <p>There are several ways to extend this study. Future work may (1) focus on verifying model performance and generalization changes by using data from multiple countries, (2) focus on using different types of models and analyze how differently learned representations of missingness affect performance, or (3) study how health care process features may be used for multilabel classification.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Description of the sepsis label in PhysioNet 2019 Challenge.</p>
        <media xlink:href="medinform_v9i12e25022_app1.pdf" xlink:title="PDF File  (Adobe PDF File), 46 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>Further data and result analysis.</p>
        <media xlink:href="medinform_v9i12e25022_app2.pdf" xlink:title="PDF File  (Adobe PDF File), 3113 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AUROC</term>
          <def>
            <p>area under the curve of the receiver operating characteristic</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">CCU</term>
          <def>
            <p>coronary care unit</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">EHR</term>
          <def>
            <p>electronic health record</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">GRU</term>
          <def>
            <p>gated recurrent unit</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">ICU</term>
          <def>
            <p>intensive care unit</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">IM</term>
          <def>
            <p>informative missingness</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">LOS</term>
          <def>
            <p>length of stay</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">MIMIC II</term>
          <def>
            <p>Multiparameter Intelligent Monitoring in Intensive Care</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">P12</term>
          <def>
            <p>PhysioNet 2012 Challenge dataset</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">P19</term>
          <def>
            <p>PhysioNet 2019 Challenge dataset</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">RNN</term>
          <def>
            <p>recurrent neural network</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb12">Sepsis-3</term>
          <def>
            <p>Third International Consensus Definitions for Sepsis and Septic Shock</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <fn-group>
      <fn fn-type="conflict">
        <p>The authors have applied for a related patent (Japanese patent application number 2019-164443).</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ghassemi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Pimentel</surname>
              <given-names>MAF</given-names>
            </name>
            <name name-style="western">
              <surname>Naumann</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Brennan</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Clifton</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Szolovits</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Feng</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>A multivariate timeseries modeling approach to severity of illness assessment and forecasting in ICU with sparse, heterogeneous clinical data</article-title>
          <source>Proc Conf AAAI Artif Intell</source>
          <year>2015</year>
          <month>01</month>
          <volume>2015</volume>
          <fpage>446</fpage>
          <lpage>453</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/27182460"/>
          </comment>
          <pub-id pub-id-type="medline">27182460</pub-id>
          <pub-id pub-id-type="pmcid">PMC4864016</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Che</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Kale</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Bahadori</surname>
              <given-names>MT</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Deep computational phenotyping</article-title>
          <source>Proceedings of the 21th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining</source>
          <year>2015</year>
          <fpage>507</fpage>
          <lpage>516</lpage>
          <pub-id pub-id-type="doi">10.1145/2783258.2783365</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Caruana</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Lou</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Gehrke</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Koch</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Sturm</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Elhadad</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Intelligible models for healthcare: predicting pneumonia risk and hospital 30-day readmission</article-title>
          <source>Proceedings of the 21th ACM SIGKDD international conference on knowledge discovery and data mining</source>
          <year>2015</year>
          <fpage>1721</fpage>
          <lpage>1730</lpage>
          <pub-id pub-id-type="doi">10.1145/2783258.2788613</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hug</surname>
              <given-names>CW</given-names>
            </name>
            <name name-style="western">
              <surname>Szolovits</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>ICU acuity: real-time models versus daily models</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2009</year>
          <month>11</month>
          <day>14</day>
          <volume>2009</volume>
          <fpage>260</fpage>
          <lpage>264</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/20351861"/>
          </comment>
          <pub-id pub-id-type="medline">20351861</pub-id>
          <pub-id pub-id-type="pmcid">PMC2815497</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shickel</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Tighe</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Bihorac</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Rashidi</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Deep EHR: a survey of recent advances in deep learning techniques for electronic health record (EHR) analysis</article-title>
          <source>IEEE J Biomed Health Inform</source>
          <year>2018</year>
          <month>12</month>
          <volume>22</volume>
          <issue>5</issue>
          <fpage>1589</fpage>
          <lpage>1604</lpage>
          <pub-id pub-id-type="doi">10.1109/JBHI.2017.2767063</pub-id>
          <pub-id pub-id-type="medline">29989977</pub-id>
          <pub-id pub-id-type="pmcid">PMC6043423</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shickel</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Loftus</surname>
              <given-names>TJ</given-names>
            </name>
            <name name-style="western">
              <surname>Adhikari</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Ozrazgat-Baslanti</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Bihorac</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Rashidi</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>DeepSOFA: a continuous acuity score for critically ill patients using clinically interpretable deep learning</article-title>
          <source>Sci Rep</source>
          <year>2019</year>
          <month>02</month>
          <day>12</day>
          <volume>9</volume>
          <issue>1</issue>
          <fpage>1879</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41598-019-38491-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-019-38491-0</pub-id>
          <pub-id pub-id-type="medline">30755689</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-019-38491-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC6372608</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lasko</surname>
              <given-names>TA</given-names>
            </name>
            <name name-style="western">
              <surname>Denny</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Levy</surname>
              <given-names>MA</given-names>
            </name>
          </person-group>
          <article-title>Computational phenotype discovery using unsupervised feature learning over noisy, sparse, and irregular clinical data</article-title>
          <source>PLoS One</source>
          <year>2013</year>
          <volume>8</volume>
          <issue>6</issue>
          <fpage>e66341</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0066341"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0066341</pub-id>
          <pub-id pub-id-type="medline">23826094</pub-id>
          <pub-id pub-id-type="pii">PONE-D-12-40629</pub-id>
          <pub-id pub-id-type="pmcid">PMC3691199</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Azur</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Stuart</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Frangakis</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Leaf</surname>
              <given-names>PJ</given-names>
            </name>
          </person-group>
          <article-title>Multiple imputation by chained equations: what is it and how does it work?</article-title>
          <source>Int J Methods Psychiatr Res</source>
          <year>2011</year>
          <month>03</month>
          <volume>20</volume>
          <issue>1</issue>
          <fpage>40</fpage>
          <lpage>49</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/21499542"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/mpr.329</pub-id>
          <pub-id pub-id-type="medline">21499542</pub-id>
          <pub-id pub-id-type="pmcid">PMC3074241</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Dong</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Jian</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Hao</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Lei</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Yitan</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>BRITS: Bidirectional recurrent imputation for time series</article-title>
          <source>Adv Neural Inf Proc Syst</source>
          <year>2018</year>
          <fpage>6775</fpage>
          <lpage>6785</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://papers.neurips.cc/paper/7911-brits-bidirectional-recurrent-imputation-for-time-series.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rubin</surname>
              <given-names>DB</given-names>
            </name>
          </person-group>
          <article-title>Inference and missing data</article-title>
          <source>Biometrika</source>
          <year>1976</year>
          <volume>63</volume>
          <issue>3</issue>
          <fpage>581</fpage>
          <lpage>592</lpage>
          <pub-id pub-id-type="doi">10.1093/biomet/63.3.581</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Haug</surname>
              <given-names>PJ</given-names>
            </name>
          </person-group>
          <article-title>Exploiting missing clinical data in Bayesian network modeling for predicting medical problems</article-title>
          <source>J Biomed Inform</source>
          <year>2008</year>
          <month>02</month>
          <volume>41</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>14</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(07)00052-4"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2007.06.001</pub-id>
          <pub-id pub-id-type="medline">17625974</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(07)00052-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>De Brouwer</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Simm</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Arany</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Moreau</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Gru-ode-bayes: continuous modeling of sporadically-observed time series</article-title>
          <source>Adv Neural Inf Proc Syst</source>
          <year>2019</year>
          <fpage>7379</fpage>
          <lpage>7390</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lipton</surname>
              <given-names>ZC</given-names>
            </name>
            <name name-style="western">
              <surname>Kale</surname>
              <given-names>DC</given-names>
            </name>
            <name name-style="western">
              <surname>Wetzel</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Modeling missing data in clinical time series with RNNs</article-title>
          <source>ArXiv.</source>
          <comment>Preprint posted online June 13, 2016.
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/pdf/1606.04130.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Che</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Purushotham</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Cho</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Sontag</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Recurrent neural networks for multivariate time series with missing values</article-title>
          <source>Sci Rep</source>
          <year>2018</year>
          <month>04</month>
          <day>17</day>
          <volume>8</volume>
          <issue>1</issue>
          <fpage>6085</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.doi.org/10.1038/s41598-018-24271-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-018-24271-9</pub-id>
          <pub-id pub-id-type="medline">29666385</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-018-24271-9</pub-id>
          <pub-id pub-id-type="pmcid">PMC5904216</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mikalsen</surname>
              <given-names>KØ</given-names>
            </name>
            <name name-style="western">
              <surname>Soguero-Ruiz</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Bianchi</surname>
              <given-names>FM</given-names>
            </name>
            <name name-style="western">
              <surname>Revhaug</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Jenssen</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Time series cluster kernels to exploit informative missingness and incomplete label information</article-title>
          <source>ArXiv.</source>
          <comment>Preprint posted online on July 10, 2019.</comment>
          <pub-id pub-id-type="doi">10.1016/j.patcog.2021.107896</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Singh</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Oshiro</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Krishnan</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Sato</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ohkuma</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Kato</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Utilizing informative missingness for early prediction of sepsis</article-title>
          <source>Comput Cardiol</source>
          <year>2019</year>
          <fpage>1</fpage>
          <lpage>4</lpage>
          <pub-id pub-id-type="doi">10.22489/cinc.2019.280</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Morrill</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kormilitzin</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Nevado-Holgado</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Swaminathan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Howison</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lyons</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>The signature-based model for early detection of sepsis from electronic health records in the intensive care unit</article-title>
          <source>Comput Cardiol</source>
          <year>2019</year>
          <fpage>1</fpage>
          <pub-id pub-id-type="doi">10.22489/cinc.2019.014</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zabihi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kiranyaz</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Gabbouj</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Sepsis prediction in intensive care unit using ensemble of XGBoost models</article-title>
          <source>Comput Cardiol</source>
          <year>2019</year>
          <fpage>1</fpage>
          <pub-id pub-id-type="doi">10.22489/cinc.2019.238</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kristiansen</surname>
              <given-names>IS</given-names>
            </name>
            <name name-style="western">
              <surname>Hjortdahl</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>The general practitioner and laboratory utilization: why does it vary?</article-title>
          <source>Fam Pract</source>
          <year>1992</year>
          <month>03</month>
          <volume>9</volume>
          <issue>1</issue>
          <fpage>22</fpage>
          <lpage>27</lpage>
          <pub-id pub-id-type="doi">10.1093/fampra/9.1.22</pub-id>
          <pub-id pub-id-type="medline">1634022</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Weiskopf</surname>
              <given-names>NG</given-names>
            </name>
            <name name-style="western">
              <surname>Rusanov</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Sick patients have more data: the non-random completeness of electronic health records</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2013</year>
          <volume>2013</volume>
          <fpage>1472</fpage>
          <lpage>1477</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/24551421"/>
          </comment>
          <pub-id pub-id-type="medline">24551421</pub-id>
          <pub-id pub-id-type="pmcid">PMC3900159</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rusanov</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Weiskopf</surname>
              <given-names>NG</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Hidden in plain sight: bias towards sick patients when sampling patients with sufficient electronic health record data for research</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2014</year>
          <month>06</month>
          <day>11</day>
          <volume>14</volume>
          <fpage>51</fpage>
          <pub-id pub-id-type="doi">10.1186/1472-6947-14-51</pub-id>
          <pub-id pub-id-type="medline">24916006</pub-id>
          <pub-id pub-id-type="pii">1472-6947-14-51</pub-id>
          <pub-id pub-id-type="pmcid">PMC4062889</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Agniel</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Kohane</surname>
              <given-names>IS</given-names>
            </name>
            <name name-style="western">
              <surname>Weber</surname>
              <given-names>GM</given-names>
            </name>
          </person-group>
          <article-title>Biases in electronic health record data due to processes within the healthcare system: retrospective observational study</article-title>
          <source>BMJ</source>
          <year>2018</year>
          <month>04</month>
          <day>30</day>
          <volume>361</volume>
          <fpage>k1479</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.bmj.com/lookup/pmidlookup?view=long&amp;pmid=29712648"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmj.k1479</pub-id>
          <pub-id pub-id-type="medline">29712648</pub-id>
          <pub-id pub-id-type="pmcid">PMC5925441</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pivovarov</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Albers</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Sepulveda</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Elhadad</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Identifying and mitigating biases in EHR laboratory tests</article-title>
          <source>J Biomed Inform</source>
          <year>2014</year>
          <month>10</month>
          <volume>51</volume>
          <fpage>24</fpage>
          <lpage>34</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(14)00084-7"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2014.03.016</pub-id>
          <pub-id pub-id-type="medline">24727481</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(14)00084-7</pub-id>
          <pub-id pub-id-type="pmcid">PMC4194228</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zaat</surname>
              <given-names>JO</given-names>
            </name>
            <name name-style="western">
              <surname>van Eijk</surname>
              <given-names>JT</given-names>
            </name>
          </person-group>
          <article-title>General practitioners' uncertainty, risk preference, and use of laboratory tests</article-title>
          <source>Med Care</source>
          <year>1992</year>
          <month>09</month>
          <volume>30</volume>
          <issue>9</issue>
          <fpage>846</fpage>
          <lpage>854</lpage>
          <pub-id pub-id-type="doi">10.1097/00005650-199209000-00008</pub-id>
          <pub-id pub-id-type="medline">1518316</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Leurquin</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Van Casteren</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>De Maeseneer</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Use of blood tests in general practice: a collaborative study in eight European countries. Eurosentinel Study Group</article-title>
          <source>Br J Gen Pract</source>
          <year>1995</year>
          <month>01</month>
          <volume>45</volume>
          <issue>390</issue>
          <fpage>21</fpage>
          <lpage>25</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bjgp.org/cgi/pmidlookup?view=long&amp;pmid=7779470"/>
          </comment>
          <pub-id pub-id-type="medline">7779470</pub-id>
          <pub-id pub-id-type="pmcid">PMC1239108</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Freedman</surname>
              <given-names>DB</given-names>
            </name>
          </person-group>
          <article-title>Towards better test utilization: strategies to improve physician ordering and their impact on patient outcomes</article-title>
          <source>Electr J Int Fed Clin Chem</source>
          <year>2015</year>
          <month>01</month>
          <volume>26</volume>
          <issue>1</issue>
          <fpage>15</fpage>
          <lpage>30</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/27683478"/>
          </comment>
          <pub-id pub-id-type="medline">27683478</pub-id>
          <pub-id pub-id-type="pmcid">PMC4975220</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Henry</surname>
              <given-names>KE</given-names>
            </name>
            <name name-style="western">
              <surname>Hager</surname>
              <given-names>DN</given-names>
            </name>
            <name name-style="western">
              <surname>Pronovost</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Saria</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>A targeted real-time early warning score (TREWScore) for septic shock</article-title>
          <source>Sci Transl Med</source>
          <year>2015</year>
          <month>08</month>
          <day>05</day>
          <volume>7</volume>
          <issue>299</issue>
          <fpage>299ra122</fpage>
          <pub-id pub-id-type="doi">10.1126/scitranslmed.aab3719</pub-id>
          <pub-id pub-id-type="medline">26246167</pub-id>
          <pub-id pub-id-type="pii">7/299/299ra122</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Futoma</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hariharan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sendak</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Brajer</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Clement</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bedoya</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>O'Brien</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Heller</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>An improved multi-output Gaussian process RNN with real-time validation for early sepsis detection</article-title>
          <source>ArXiv.</source>
          <comment>Preprint posted online on August 19, 2017.
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/pdf/1708.05894.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Reyna</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Josef</surname>
              <given-names>CS</given-names>
            </name>
            <name name-style="western">
              <surname>Jeter</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Shashikumar</surname>
              <given-names>SP</given-names>
            </name>
            <name name-style="western">
              <surname>Westover</surname>
              <given-names>MB</given-names>
            </name>
            <name name-style="western">
              <surname>Nemati</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Clifford</surname>
              <given-names>GD</given-names>
            </name>
            <name name-style="western">
              <surname>Sharma</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Early prediction of sepsis from clinical data: the PhysioNet/Computing in Cardiology Challenge 2019</article-title>
          <source>Crit Care Med</source>
          <year>2020</year>
          <month>02</month>
          <volume>48</volume>
          <issue>2</issue>
          <fpage>210</fpage>
          <lpage>217</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/31939789"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/CCM.0000000000004145</pub-id>
          <pub-id pub-id-type="medline">31939789</pub-id>
          <pub-id pub-id-type="pii">00003246-202002000-00010</pub-id>
          <pub-id pub-id-type="pmcid">PMC6964870</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vollmer</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Luz</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Sodmann</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Sinha</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Kuhn</surname>
              <given-names>SO</given-names>
            </name>
          </person-group>
          <article-title>Time-specific metalearners for the early prediction of sepsis</article-title>
          <source>Comput Cardiol</source>
          <year>2019</year>
          <fpage>1</fpage>
          <lpage>4</lpage>
          <pub-id pub-id-type="doi">10.22489/cinc.2019.029</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Rubin</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Boverman</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>A multi-task imputation and classification neural architecture for early prediction of sepsis from multivariate clinical time series</article-title>
          <source>Comput Cardiol</source>
          <year>2019</year>
          <fpage>1</fpage>
          <pub-id pub-id-type="doi">10.22489/cinc.2019.110</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Taylor</surname>
              <given-names>JB</given-names>
            </name>
          </person-group>
          <article-title>Relationships among patient age, diagnosis, hospital type, and clinical laboratory utilization</article-title>
          <source>Clin Lab Sci</source>
          <year>2005</year>
          <volume>18</volume>
          <issue>1</issue>
          <fpage>8</fpage>
          <lpage>15</lpage>
          <pub-id pub-id-type="medline">15747782</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gershengorn</surname>
              <given-names>HB</given-names>
            </name>
            <name name-style="western">
              <surname>Garland</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gong</surname>
              <given-names>MN</given-names>
            </name>
          </person-group>
          <article-title>Patterns of daily costs differ for medical and surgical intensive care unit patients</article-title>
          <source>Ann Am Thorac Soc</source>
          <year>2015</year>
          <month>12</month>
          <volume>12</volume>
          <issue>12</issue>
          <fpage>1831</fpage>
          <lpage>1836</lpage>
          <pub-id pub-id-type="doi">10.1513/AnnalsATS.201506-366BC</pub-id>
          <pub-id pub-id-type="medline">26393984</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Silva</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Moody</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Scott</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Celi</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Mark</surname>
              <given-names>RG</given-names>
            </name>
          </person-group>
          <article-title>Predicting in-hospital mortality of ICU patients: the PhysioNet/Computing in Cardiology Challenge 2012</article-title>
          <source>Comput Cardiol</source>
          <year>2012</year>
          <volume>39</volume>
          <fpage>245</fpage>
          <lpage>248</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/24678516"/>
          </comment>
          <pub-id pub-id-type="medline">24678516</pub-id>
          <pub-id pub-id-type="pmcid">PMC3965265</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Saeed</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Villarroel</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Reisner</surname>
              <given-names>AT</given-names>
            </name>
            <name name-style="western">
              <surname>Clifford</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Lehman</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Moody</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Heldt</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Kyaw</surname>
              <given-names>TH</given-names>
            </name>
            <name name-style="western">
              <surname>Moody</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Mark</surname>
              <given-names>RG</given-names>
            </name>
          </person-group>
          <article-title>Multiparameter Intelligent Monitoring in Intensive Care II: a public-access intensive care unit database</article-title>
          <source>Crit Care Med</source>
          <year>2011</year>
          <month>05</month>
          <volume>39</volume>
          <issue>5</issue>
          <fpage>952</fpage>
          <lpage>960</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/21283005"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/CCM.0b013e31820a92c6</pub-id>
          <pub-id pub-id-type="medline">21283005</pub-id>
          <pub-id pub-id-type="pmcid">PMC3124312</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Singer</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Deutschman</surname>
              <given-names>CS</given-names>
            </name>
            <name name-style="western">
              <surname>Seymour</surname>
              <given-names>CW</given-names>
            </name>
            <name name-style="western">
              <surname>Shankar-Hari</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Annane</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Bauer</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bellomo</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Bernard</surname>
              <given-names>GR</given-names>
            </name>
            <name name-style="western">
              <surname>Chiche</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Coopersmith</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Hotchkiss</surname>
              <given-names>RS</given-names>
            </name>
            <name name-style="western">
              <surname>Levy</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Marshall</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Martin</surname>
              <given-names>GS</given-names>
            </name>
            <name name-style="western">
              <surname>Opal</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Rubenfeld</surname>
              <given-names>GD</given-names>
            </name>
            <name name-style="western">
              <surname>van der Poll</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Vincent</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Angus</surname>
              <given-names>DC</given-names>
            </name>
          </person-group>
          <article-title>The Third International Consensus Definitions for Sepsis and Septic Shock (Sepsis-3)</article-title>
          <source>JAMA</source>
          <year>2016</year>
          <month>02</month>
          <day>23</day>
          <volume>315</volume>
          <issue>8</issue>
          <fpage>801</fpage>
          <lpage>810</lpage>
          <pub-id pub-id-type="doi">10.1001/jama.2016.0287</pub-id>
          <pub-id pub-id-type="medline">26903338</pub-id>
          <pub-id pub-id-type="pii">2492881</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lipton</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Kale</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Elkan</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wetzel</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Learning to diagnose with LSTM recurrent neural networks</article-title>
          <source>ArXiv.</source>
          <comment>Preprint posted online on November 11, 2015.
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/pdf/1511.03677.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xiao</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Choi</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Opportunities and challenges in developing deep learning models using electronic health records data: a systematic review</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2018</year>
          <month>10</month>
          <day>01</day>
          <volume>25</volume>
          <issue>10</issue>
          <fpage>1419</fpage>
          <lpage>1428</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29893864"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocy068</pub-id>
          <pub-id pub-id-type="medline">29893864</pub-id>
          <pub-id pub-id-type="pii">5035024</pub-id>
          <pub-id pub-id-type="pmcid">PMC6188527</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cho</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>van Merrienboer</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Gulcehre</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Bahdanau</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Learning phrase representations using RNN encoder-decoder for statistical machine translation</article-title>
          <source>ArXiv.</source>
          <comment>Preprint posted online on June 3, 2014.</comment>
          <pub-id pub-id-type="doi">10.3115/v1/d14-1179</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Paszke</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gross</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Massa</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Lerer</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Wallach</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Larochelle</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Beygelzimer</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>d'Alché-Buc</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>PyTorch: an imperative style, high-performance deep learning library</article-title>
          <source>Adv Neural Inf Proc Syst</source>
          <year>2019</year>
          <publisher-loc>Red Hook</publisher-loc>
          <publisher-name>Curran Associates, Inc</publisher-name>
          <fpage>8024</fpage>
          <lpage>8034</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kingma</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Ba</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Adam: a method for stochastic optimization</article-title>
          <source>ArXiv.</source>
          <comment>Preprint posted online on December 22, 2014.
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/pdf/1412.6980.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Meiring</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Dixit</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Harris</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>MacCallum</surname>
              <given-names>NS</given-names>
            </name>
            <name name-style="western">
              <surname>Brealey</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Watkinson</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ashworth</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Beale</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Brett</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Singer</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ercole</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Optimal intensive care outcome prediction over time using machine learning</article-title>
          <source>PLoS One</source>
          <year>2018</year>
          <volume>13</volume>
          <issue>11</issue>
          <fpage>e0206862</fpage>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0206862</pub-id>
          <pub-id pub-id-type="medline">30427913</pub-id>
          <pub-id pub-id-type="pii">PONE-D-18-23147</pub-id>
          <pub-id pub-id-type="pmcid">PMC6241126</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Maslove</surname>
              <given-names>DM</given-names>
            </name>
          </person-group>
          <article-title>With severity scores updated on the hour, data science inches closer to the bedside</article-title>
          <source>Crit Care Med</source>
          <year>2018</year>
          <month>03</month>
          <volume>46</volume>
          <issue>3</issue>
          <fpage>480</fpage>
          <lpage>481</lpage>
          <pub-id pub-id-type="doi">10.1097/CCM.0000000000002945</pub-id>
          <pub-id pub-id-type="medline">29474330</pub-id>
          <pub-id pub-id-type="pii">00003246-201803000-00020</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Leisman</surname>
              <given-names>DE</given-names>
            </name>
          </person-group>
          <article-title>Rare events in the ICU: an emerging challenge in classification and prediction</article-title>
          <source>Crit Care Med</source>
          <year>2018</year>
          <month>03</month>
          <volume>46</volume>
          <issue>3</issue>
          <fpage>418</fpage>
          <lpage>424</lpage>
          <pub-id pub-id-type="doi">10.1097/CCM.0000000000002943</pub-id>
          <pub-id pub-id-type="medline">29474323</pub-id>
          <pub-id pub-id-type="pii">00003246-201803000-00010</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ozenne</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Subtil</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Maucort-Boulch</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>The precision-recall curve overcame the optimism of the receiver operating characteristic curve in rare diseases</article-title>
          <source>J Clin Epidemiol</source>
          <year>2015</year>
          <month>08</month>
          <volume>68</volume>
          <issue>8</issue>
          <fpage>855</fpage>
          <lpage>859</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jclinepi.2015.02.010</pub-id>
          <pub-id pub-id-type="medline">25881487</pub-id>
          <pub-id pub-id-type="pii">S0895-4356(15)00106-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ovadia</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Fertig</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Ren</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Can you trust your model's uncertainty? Evaluating predictive uncertainty under dataset shift</article-title>
          <source>ArXiv.</source>
          <comment>Preprint posted online on June 6, 2019.
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/pdf/1906.02530.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Robin</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Turck</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Hainard</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Tiberti</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Lisacek</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Sanchez</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Müller</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>pROC: an open-source package for R and S+ to analyze and compare ROC curves</article-title>
          <source>BMC Bioinformatics</source>
          <year>2011</year>
          <volume>12</volume>
          <fpage>77</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://bmcbioinformatics.biomedcentral.com/articles/10.1186/1471-2105-12-77"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1471-2105-12-77</pub-id>
          <pub-id pub-id-type="medline">21414208</pub-id>
          <pub-id pub-id-type="pii">1471-2105-12-77</pub-id>
          <pub-id pub-id-type="pmcid">PMC3068975</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mehta</surname>
              <given-names>NJ</given-names>
            </name>
            <name name-style="western">
              <surname>Khan</surname>
              <given-names>IA</given-names>
            </name>
          </person-group>
          <article-title>Cardiology's 10 greatest discoveries of the 20th century</article-title>
          <source>Tex Heart Inst J</source>
          <year>2002</year>
          <volume>29</volume>
          <issue>3</issue>
          <fpage>164</fpage>
          <lpage>171</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/12224718"/>
          </comment>
          <pub-id pub-id-type="medline">12224718</pub-id>
          <pub-id pub-id-type="pmcid">PMC124754</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Angus</surname>
              <given-names>DC</given-names>
            </name>
            <name name-style="western">
              <surname>Linde-Zwirble</surname>
              <given-names>WT</given-names>
            </name>
            <name name-style="western">
              <surname>Lidicker</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Clermont</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Carcillo</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Pinsky</surname>
              <given-names>MR</given-names>
            </name>
          </person-group>
          <article-title>Epidemiology of severe sepsis in the United States: analysis of incidence, outcome, and associated costs of care</article-title>
          <source>Crit Care Med</source>
          <year>2001</year>
          <month>07</month>
          <volume>29</volume>
          <issue>7</issue>
          <fpage>1303</fpage>
          <lpage>1310</lpage>
          <pub-id pub-id-type="doi">10.1097/00003246-200107000-00002</pub-id>
          <pub-id pub-id-type="medline">11445675</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sharafoddini</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Dubin</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Maslove</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>A new insight into missing data in intensive care unit patient profiles: observational study</article-title>
          <source>JMIR Med Inform</source>
          <year>2019</year>
          <month>01</month>
          <day>08</day>
          <volume>7</volume>
          <issue>1</issue>
          <fpage>e11605</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2019/1/e11605/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/11605</pub-id>
          <pub-id pub-id-type="medline">30622091</pub-id>
          <pub-id pub-id-type="pii">v7i1e11605</pub-id>
          <pub-id pub-id-type="pmcid">PMC6329436</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>AEW</given-names>
            </name>
            <name name-style="western">
              <surname>Ghassemi</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Nemati</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Niehaus</surname>
              <given-names>KE</given-names>
            </name>
            <name name-style="western">
              <surname>Clifton</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Clifford</surname>
              <given-names>GD</given-names>
            </name>
          </person-group>
          <article-title>Machine learning and decision support in critical care</article-title>
          <source>Proc IEEE Inst Electr Electron Eng</source>
          <year>2016</year>
          <month>02</month>
          <volume>104</volume>
          <issue>2</issue>
          <fpage>444</fpage>
          <lpage>466</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/27765959"/>
          </comment>
          <pub-id pub-id-type="doi">10.1109/JPROC.2015.2501978</pub-id>
          <pub-id pub-id-type="medline">27765959</pub-id>
          <pub-id pub-id-type="pmcid">PMC5066876</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Solomon</surname>
              <given-names>DH</given-names>
            </name>
            <name name-style="western">
              <surname>Hashimoto</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Daltroy</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Liang</surname>
              <given-names>MH</given-names>
            </name>
          </person-group>
          <article-title>Techniques to improve physicians' use of diagnostic tests: a new conceptual framework</article-title>
          <source>JAMA</source>
          <year>1998</year>
          <month>12</month>
          <day>16</day>
          <volume>280</volume>
          <issue>23</issue>
          <fpage>2020</fpage>
          <lpage>2027</lpage>
          <pub-id pub-id-type="doi">10.1001/jama.280.23.2020</pub-id>
          <pub-id pub-id-type="medline">9863854</pub-id>
          <pub-id pub-id-type="pii">jrv80056</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dragsted</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Jörgensen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Jensen</surname>
              <given-names>NH</given-names>
            </name>
            <name name-style="western">
              <surname>Bönsing</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Jacobsen</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Knaus</surname>
              <given-names>WA</given-names>
            </name>
            <name name-style="western">
              <surname>Qvist</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Interhospital comparisons of patient outcome from intensive care: importance of lead-time bias</article-title>
          <source>Crit Care Med</source>
          <year>1989</year>
          <month>05</month>
          <volume>17</volume>
          <issue>5</issue>
          <fpage>418</fpage>
          <lpage>422</lpage>
          <pub-id pub-id-type="doi">10.1097/00003246-198905000-00008</pub-id>
          <pub-id pub-id-type="medline">2707011</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
