<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.0" xmlns:xlink="http://www.w3.org/1999/xlink">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id>
      <journal-title>JMIR Medical Informatics</journal-title>
      <issn pub-type="epub">2291-9694</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v7i1e11605</article-id>
      <article-id pub-id-type="pmid">30622091</article-id>
      <article-id pub-id-type="doi">10.2196/11605</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>A New Insight Into Missing Data in Intensive Care Unit Patient Profiles: Observational Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Eysenbach</surname>
            <given-names>Gunther</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Zhang</surname>
            <given-names>Zhou</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Tingay</surname>
            <given-names>Karen</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="author" id="contrib1">
          <name name-style="western">
            <surname>Sharafoddini</surname>
            <given-names>Anis</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-4231-8116</ext-link>
        </contrib>
        <contrib contrib-type="author" id="contrib2">
          <name name-style="western">
            <surname>Dubin</surname>
            <given-names>Joel A</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-9863-7752</ext-link>
        </contrib>
        <contrib contrib-type="author" id="contrib3">
          <name name-style="western">
            <surname>Maslove</surname>
            <given-names>David M</given-names>
          </name>
          <degrees>MD, MS, FRCPC</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-0765-7158</ext-link>
        </contrib>
        <contrib contrib-type="author" id="contrib4" corresp="yes">
          <name name-style="western">
            <surname>Lee</surname>
            <given-names>Joon</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff4" ref-type="aff">4</xref>
          <address>
            <institution>Department of Community Health Sciences</institution>
            <institution>Cumming School of Medicine</institution>
            <institution>University of Calgary</institution>
            <addr-line>3280 Hospital Drive Northwest</addr-line>
            <addr-line>Calgary, AB, T2N 4Z6</addr-line>
            <country>Canada</country>
            <phone>1 403 220 2968</phone>
            <email>joonwu.lee@ucalgary.ca</email>
          </address>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-8593-9321</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Health Data Science Lab</institution>
        <institution>School of Public Health and Health Systems</institution>
        <institution>University of Waterloo</institution>
        <addr-line>Waterloo, ON</addr-line>
        <country>Canada</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Department of Statistics and Actuarial Science</institution>
        <institution>University of Waterloo</institution>
        <addr-line>Waterloo, ON</addr-line>
        <country>Canada</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Department of Critical Care Medicine</institution>
        <institution>Queen's University</institution>
        <addr-line>Kingston, ON</addr-line>
        <country>Canada</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Department of Community Health Sciences</institution>
        <institution>Cumming School of Medicine</institution>
        <institution>University of Calgary</institution>
        <addr-line>Calgary, AB</addr-line>
        <country>Canada</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>Department of Cardiac Sciences</institution>
        <institution>Cumming School of Medicine</institution>
        <institution>University of Calgary</institution>
        <addr-line>Calgary, AB</addr-line>
        <country>Canada</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Joon Lee <email>joonwu.lee@ucalgary.ca</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <season>Jan-Mar</season>
        <year>2019</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>08</day>
        <month>01</month>
        <year>2019</year>
      </pub-date>
      <volume>7</volume>
      <issue>1</issue>
      <elocation-id>e11605</elocation-id>
      <!--history from ojs - api-xml-->
      <history>
        <date date-type="received">
          <day>17</day>
          <month>7</month>
          <year>2018</year>
        </date>
        <date date-type="rev-request">
          <day>8</day>
          <month>10</month>
          <year>2018</year>
        </date>
        <date date-type="rev-recd">
          <day>30</day>
          <month>10</month>
          <year>2018</year>
        </date>
        <date date-type="accepted">
          <day>30</day>
          <month>10</month>
          <year>2018</year>
        </date>
      </history>
      <!--(c) the authors - correct author names and publication date here if necessary. Date in form ', dd.mm.yyyy' after jmir.org-->
      <copyright-statement>©Anis Sharafoddini, Joel A Dubin, David M Maslove, Joon Lee. Originally published in JMIR Medical Informatics (http://medinform.jmir.org), 08.01.2019.</copyright-statement>
      <copyright-year>2019</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on http://medinform.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="http://medinform.jmir.org/2019/1/e11605/" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>The data missing from patient profiles in intensive care units (ICUs) are substantial and unavoidable. However, this incompleteness is not always random or because of imperfections in the data collection process.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study aimed to investigate the potential hidden information in data missing from electronic health records (EHRs) in an ICU and examine whether the presence or missingness of a variable itself can convey information about the patient health status.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>Daily retrieval of laboratory test (LT) measurements from the Medical Information Mart for Intensive Care III database was set as our reference for defining complete patient profiles. <italic>Missingness indicators</italic> were introduced as a way of representing presence or absence of the LTs in a patient profile. Thereafter, various feature selection methods (filter and embedded feature selection methods) were used to examine the predictive power of missingness indicators. Finally, a set of well-known prediction models (logistic regression [LR], decision tree, and random forest) were used to evaluate whether the absence status itself of a variable recording can provide predictive power. We also examined the utility of missingness indicators in improving predictive performance when used with observed laboratory measurements as model input. The outcome of interest was in-hospital mortality and mortality at 30 days after ICU discharge.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Regardless of mortality type or ICU day, more than 40% of the predictors selected by feature selection methods were missingness indicators. Notably, employing missingness indicators as the only predictors achieved reasonable mortality prediction on all days and for all mortality types (for instance, in 30-day mortality prediction with LR, we achieved area under the curve of the receiver operating characteristic [AUROC] of 0.6836±0.012). Including indicators with observed measurements in the prediction models also improved the AUROC; the maximum improvement was 0.0426. Indicators also improved the AUROC for Simplified Acute Physiology Score II model—a well-known ICU severity of illness score—confirming the additive information of the indicators (AUROC of 0.8045±0.0109 for 30-day mortality prediction for LR).</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Our study demonstrated that the presence or absence of LT measurements is informative and can be considered a potential predictor of in-hospital and 30-day mortality. The comparative analysis of prediction models also showed statistically significant prediction improvement when indicators were included. Moreover, missing data might reflect the opinions of examining clinicians. Therefore, the absence of measurements can be informative in ICUs and has predictive power beyond the measured data themselves. This initial case study shows promise for more in-depth analysis of missing data and its informativeness in ICUs. Future studies are needed to generalize these results.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>electronic health records</kwd>
        <kwd>clinical laboratory tests</kwd>
        <kwd>machine learning</kwd>
        <kwd>hospital mortality</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>The increased adoption of electronic health record (EHR) systems has boosted interest in the secondary use of EHR data [<xref ref-type="bibr" rid="ref1">1</xref>]. Although the literature has introduced various dimensions for EHR data quality, completeness and correctness have been reported as the fundamental dimensions [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>]. Although these issues can also be observed in paper-based records, EHR brought us the opportunity to identify them faster and helped us with addressing them. The data missing from clinical contexts are substantial [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref4">4</xref>] and unavoidable [<xref ref-type="bibr" rid="ref5">5</xref>]; many studies have focused on resolving this issue [<xref ref-type="bibr" rid="ref6">6</xref>-<xref ref-type="bibr" rid="ref8">8</xref>]. Although many researchers treat missing data as a challenge [<xref ref-type="bibr" rid="ref9">9</xref>-<xref ref-type="bibr" rid="ref18">18</xref>], others continue to debate whether lack of completeness also provides useful information [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref19">19</xref>-<xref ref-type="bibr" rid="ref21">21</xref>]. Researchers do agree that a part of this incompleteness is neither random nor the result of imperfections in the data collection process [<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref22">22</xref>]. Recently, Agniel et al [<xref ref-type="bibr" rid="ref21">21</xref>] demonstrated that the laboratory ordering time (ie, the interval between 2 orders of a laboratory test; LT) for some LTs is more informative than the actual values in predicting 3-year survival. Our study focuses on systematically investigating the implications or possible value of lack of data, particularly in intensive care units (ICUs), and proposes a representation method for missing data to capture hidden information. In general, 2 reasons are given for missing data in EHRs:</p>
        <list list-type="bullet">
          <list-item>
            <p>No intention to collect: the clinical variable was never measured because there was no clinical indication to do so—the patient was not suffering from a relevant symptom or comorbidity [<xref ref-type="bibr" rid="ref4">4</xref>] or it could not be measured [<xref ref-type="bibr" rid="ref19">19</xref>].</p>
          </list-item>
          <list-item>
            <p>Intention to collect: records are missing although the variables were measured [<xref ref-type="bibr" rid="ref4">4</xref>].</p>
          </list-item>
        </list>
        <p>Therefore, the health care process (eg, clinicians’ decision to order a test and nurse data entry) affects the recorded EHR and can cause incompleteness in data.</p>
        <p>Incomplete EHR data can complicate or prohibit the data analysis process, as many machine learning (ML) algorithms assume that there are no missing data in the dataset or require users to clean the data in the preprocessing stage and so provide a complete dataset. Therefore, from a research perspective, the ideal situation is to increase the amount and accuracy of EHR documentation by employing approaches that focus on intention to collect such as reducing the error in data entry or increasing data documentation in terms of resolution. Although the current amount of testing and bloodwork has been reported as actually redundant in ICUs [<xref ref-type="bibr" rid="ref23">23</xref>-<xref ref-type="bibr" rid="ref25">25</xref>] and requires extra time and work from clinicians [<xref ref-type="bibr" rid="ref4">4</xref>], these approaches suffer from their own shortcomings. Besides analytical methods that can handle missing data (that are missing at random) such as decision trees (DTs) or mixed-effects models for longitudinal data, other approaches usually assume missing data are missing completely at random. In general, the literature proposes 3 analytical approaches: complete case analysis (CCA) or deletion, available case analysis (ACA), and imputation.</p>
        <p>CCA starts with the list of variables included in the analysis and discards records with missing data on any of the variables. However, this subsample might not be a random sample of the population. Although researchers argue that sample selection based on the predefined eligibility criteria in randomized clinical trials can limit the external generalizability of these studies [<xref ref-type="bibr" rid="ref26">26</xref>], CCA in studies using EHR data can also potentially threaten the external validity of a study [<xref ref-type="bibr" rid="ref19">19</xref>] and cause bias as the literature shows a statistically significant relationship between severity of illness and data completeness [<xref ref-type="bibr" rid="ref20">20</xref>]. A study [<xref ref-type="bibr" rid="ref19">19</xref>] on 10,000 EHRs from patients receiving anesthetic services showed that patients with an American Society of Anesthesiologists (ASA) physical status [<xref ref-type="bibr" rid="ref27">27</xref>] class-4 fitness rating had 5.05 more days with laboratory results and 6.85 more days with medication orders than patients with ASA class 1, suggesting more data are recorded for sicker patients than for healthier patients. Thus, imposing complete case requirements when using EHR data for secondary use can cause bias toward selecting patients with more severe conditions (or several comorbidities). Despite this drawback, CCA has been identified as the leading approach in studies on ICU data [<xref ref-type="bibr" rid="ref28">28</xref>]. That said, CCA provides valid inference only when data are missing completely at random (MCAR), which is unlikely in practice [<xref ref-type="bibr" rid="ref29">29</xref>].</p>
        <p>The ACA (or pairwise deletion) uses all available data for a given analysis. In other words, it maximizes the availability of data on an analysis-by-analysis basis [<xref ref-type="bibr" rid="ref30">30</xref>]. The advantage of this method is that more data are included in each analysis than with CCA. It also allows for valid inference by likelihood-based models when missing data are ignorable—often the case when the data are missing at random (MAR) [<xref ref-type="bibr" rid="ref29">29</xref>]. Although ACA is an improvement over CCA [<xref ref-type="bibr" rid="ref30">30</xref>], it also has limitations. As different samples are being used in each analysis, not only is comparison of various analyses impossible [<xref ref-type="bibr" rid="ref31">31</xref>] but also using different samples for estimating the parameters of interest has occasionally led to biased or mathematically inconsistent results [<xref ref-type="bibr" rid="ref32">32</xref>-<xref ref-type="bibr" rid="ref34">34</xref>].</p>
        <p>Imputation methods, which try to draw inferences from incomplete data, rely on knowing the mechanism of missingness, which cannot be validated from the available data. Single imputation methods suffer from 2 problems. First, an inference based on imputed data can be biased if the underlying assumptions are not valid. Second, because imputed data are assumed to be true, the model’s statistical precision is overstated. Multiple imputation methods, in spite of their promising performance, rely on parametric assumptions that, if not valid, can lead to incorrect imputation. Due to these limitations, imputation methods should be used with caution and checking underlying assumptions with clinicians is highly recommended [<xref ref-type="bibr" rid="ref5">5</xref>]. However, Gorelick [<xref ref-type="bibr" rid="ref35">35</xref>], in a simulation study, demonstrated that either CCA or imputation could cause bias in predictive modeling, and that assuming missing values to be normal when missingness rates are high and substituting them with normal values would also cause substantial bias. In brief, if primary assumptions are not fully satisfied, neither considering complete or available cases nor imputing missing data is likely to yield reliable results. Furthermore, these statistical methods on their own are not sufficient to capture the hidden information about the patient health status and care process in the complex EHR data. Alternatively, we can try to learn from what is missing rather than only dealing with missingness as a deficiency.</p>
      </sec>
      <sec>
        <title>Objectives</title>
        <p>This case study provides evidence that missing data in the ICU might be missing because of the patient’s health status or health care process and introduces a new method for representing patient profiles. In this representation, auxiliary variables, called indicators, are used to represent the presence or absence of a measurement and might convey the possible hidden information in the missing data. Then, by employing various analytical methods, this study attempts to demonstrate the informativeness of missing data. In the rest of the study, the term <italic>missing data</italic> is used to describe not-at-random missing information in patient profiles. In other words, the potential informativeness of data that have not been recorded by choice is of interest.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Measurement Protocol and Data Collection</title>
        <p>As patient monitoring strongly relies on clinical needs, no universal standards for ICU data completeness have been established [<xref ref-type="bibr" rid="ref36">36</xref>-<xref ref-type="bibr" rid="ref38">38</xref>]. However, a study by Frassica in 2005 [<xref ref-type="bibr" rid="ref39">39</xref>] published a list of the top 80% of LTs common to all ICU patients within a university teaching hospital. We revised this list based on the presence of these tests in our database and updated it with input from an ICU clinician to reflect current practices (<xref ref-type="boxed-text" rid="box1">Textbox 1</xref>).</p>
        <p>The data for this study were collected from the Medical Information Mart for Intensive Care III (MIMIC-III) [<xref ref-type="bibr" rid="ref40">40</xref>] database which contains data from 38,597 distinct adult patients admitted to the Beth Israel Deaconess Medical Center in Boston, Massachusetts, between 2001 and 2012. For patient cohort selection, a tailored version of the generalized cohort selection heuristics for retrospective EHR studies introduced by Harrell et al [<xref ref-type="bibr" rid="ref41">41</xref>] was used. The data for first admission to 1 of the 5 ICUs—medical ICU, surgical ICU, cardiac care unit, cardiac surgery recovery unit, and trauma surgical ICU—were extracted for adult patients (aged 15 years or older). Included patients must have had at least one data point in any of the variable categories during the first, second, and third days of their ICU stay.</p>
      </sec>
      <sec>
        <title>Data Preprocessing and Missing Data Representation</title>
        <p>Each day’s extracted data were mapped into a matrix with columns for measurements and rows for patients. Therefore, we had a column for each daily measurement of LTs, resulting in 36 columns for LTs. An auxiliary matrix was generated to store binary values reflecting the presence (0) or absence (1) of measurements. As many well-performing ML algorithms are designed to work with a complete data matrix, 2 methods—predictive mean matching (PMM) [<xref ref-type="bibr" rid="ref42">42</xref>] and hot deck (HD)—were used to impute missing values. PMM is a commonly used and well-accepted imputation method in public health research [<xref ref-type="bibr" rid="ref43">43</xref>] and is also robust against model misspecification [<xref ref-type="bibr" rid="ref44">44</xref>]. HD imputation is used commonly in applied data analysis when missing data exist [<xref ref-type="bibr" rid="ref45">45</xref>].</p>
        <boxed-text id="box1" position="float">
          <title>A total of 36 laboratory tests used in investigating informativeness of missing data.</title>
          <p>Variable category and variables</p>
          <p>Top 80% laboratory tests and profiles common to all intensive care units [<xref ref-type="bibr" rid="ref39">39</xref>] reviewed and revised by domain expert</p>
          <list list-type="bullet">
            <list-item>
              <p>Alanine aminotransferase (ALT)</p>
            </list-item>
            <list-item>
              <p>Alkaline phosphatase (ALK)</p>
            </list-item>
            <list-item>
              <p>Aspartate aminotransferase (AST)</p>
            </list-item>
            <list-item>
              <p>Arterial blood gases: pH, partial pressure of carbon dioxide (PCO<sub>2</sub>), and partial pressure of oxygen (PO<sub>2</sub>)</p>
            </list-item>
            <list-item>
              <p>Base excess (BE)</p>
            </list-item>
            <list-item>
              <p>Basic metabolic panel: sodium (Na), potassium (K), chloride (Cl), bicarbonate (HCO<sub>3</sub>), anion gap (AG), blood glucose (BG), blood urea nitrogen (BUN), and creatinine (Cr)</p>
            </list-item>
            <list-item>
              <p>Complete blood count: white blood cells (WBCs), red blood cells (RBCs), hemoglobin (HGB), hematocrit (HCT), mean corpuscular volume (MCV), mean corpuscular hemoglobin (MCH), mean corpuscular hemoglobin concentration (MCHC), red cell distribution width (RDW), platelet count (PLT), absolute monocytes (MO), absolute eosinophils (EO), absolute basophils (BA), absolute lymphocytes (LY), and absolute neutrophils (NE)</p>
            </list-item>
            <list-item>
              <p>Lactate (Lac)</p>
            </list-item>
            <list-item>
              <p>Calcium (Ca)</p>
            </list-item>
            <list-item>
              <p>Magnesium (Mg)</p>
            </list-item>
            <list-item>
              <p>Phosphate (Phos)</p>
            </list-item>
            <list-item>
              <p>Partial thromboplastin time (PTT)</p>
            </list-item>
            <list-item>
              <p>Prothrombin time (PT)</p>
            </list-item>
            <list-item>
              <p>Total bilirubin (TBil)</p>
            </list-item>
          </list>
        </boxed-text>
        <p>Given that imputed values are indistinguishable to the ML algorithm from true values, we combined the original matrix and auxiliary matrix to form an augmented matrix that directly indicates where values were imputed. This was done to mitigate the risk of treating imputed values the same as actual values, in a setting where the underlying reason for missing data is not fully known (<xref rid="figure1" ref-type="fig">Figure 1</xref>). Missing data indicators in this augmented matrix might also provide extra information about the reliability of the values (actual and imputed values) and potentially preserve any meaningful missing data patterns. Missingness indicators have been used as a method of handling missing data in epidemiological and clinical studies. However, in the current use of indicators, missing values are set to a fixed value (0 or the normal value for the variable) and the indicators are used as dummy variables in analytical models to indicate that a value was missing [<xref ref-type="bibr" rid="ref46">46</xref>,<xref ref-type="bibr" rid="ref47">47</xref>]. Studies have shown that this method causes bias as the missing values are imputed with a single value [<xref ref-type="bibr" rid="ref48">48</xref>]. In our study, we are not using indicators as dummy variables; instead, we are introducing them as a source of information to be used besides imputation methods.</p>
      </sec>
      <sec>
        <title>Validation</title>
        <p>Several validation techniques are available in medical research. In this study, for all experiments where applicable, we used the cross-validation technique (10-fold cross-validation). We also repeated the cross-validation procedure several times (20 times) to acquire more stable results, as suggested in the literature [<xref ref-type="bibr" rid="ref49">49</xref>].</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>An example of the augmented data matrix, the imputed data matrix (imputed values are underlined and italicized), and the auxiliary matrix (containing the missingness indicators: 0-present, 1-absent).</p>
          </caption>
          <graphic xlink:href="medinform_v7i1e11605_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Assessments</title>
        <sec>
          <title>Exploratory Analysis</title>
          <p>First, the trends of missingness among LTs were visualized for comparison. Afterward, pairwise correlation among indicators, using Phi coefficient, was done to explore the general behavior of missingness. The Elixhauser [<xref ref-type="bibr" rid="ref50">50</xref>] and the Charlson [<xref ref-type="bibr" rid="ref51">51</xref>] comorbidity indices are the most common comorbidity scores in clinical applications. The literature has shown that the Elixhauser Comorbidity Index (ECI) in general has the best performance [<xref ref-type="bibr" rid="ref52">52</xref>-<xref ref-type="bibr" rid="ref55">55</xref>]. This better performance can be the result of (1) including new comorbidities in ECI, (2) the differences in the coding of variables common between both indices, or (3) a combination of the first and second factors [<xref ref-type="bibr" rid="ref53">53</xref>]. The Simplified Acute Physiology Score II (SAPS-II) [<xref ref-type="bibr" rid="ref56">56</xref>] scoring system that has been widely used by most ICUs for predicting illness severity was also chosen. Therefore, the association of missingness rates with ECI and SAPS-II was investigated using Spearman correlation. Besides the clinical information, SAPS-II also has the information about type of admission (scheduled surgical, medical, or unscheduled surgical) and presence of 3 chronic diseases (metastatic cancer, hematologic malignancy, and AIDS).</p>
        </sec>
        <sec>
          <title>Feature Selection</title>
          <p>After exploratory analyses, we assessed the importance of the indicators as potential predictors. First, we used feature selection methods, which are widely used to determine which predictors should be used in a model, particularly for high-dimensional data [<xref ref-type="bibr" rid="ref22">22</xref>]. Two copies of the augmented matrix (derived from HD and PMM imputation) were fed to various feature selection methods. Our study considered in-hospital and 30-day postdischarge mortality as outcomes. Overall, we used 2 categories of supervised feature selection methods described below.</p>
          <p>First, filter techniques evaluated the importance of a predictor by looking at data properties. Filter methods, in general, use a metric to identify irrelevant features and filter out the redundant predictors from the data matrix [<xref ref-type="bibr" rid="ref57">57</xref>]. We selected 3 different metrics: LR beta value, relief algorithm [<xref ref-type="bibr" rid="ref58">58</xref>], and information gain (InfGain) [<xref ref-type="bibr" rid="ref59">59</xref>]. The relief algorithm examines the relevance of predictors based on their power to distinguish between similar patients with the same and different outcomes. InfGain measures the reduction in entropy of the class variable achieved by partitioning the data based on the index predictor; relevant predictors receive a high InfGain value [<xref ref-type="bibr" rid="ref60">60</xref>]. This ensemble of the scoring methods was then used to determine the normalized informativeness of all predictors. Aggregating these methods in one score provides a tool for comparing predictors from different aspects.</p>
          <p>Second, we used embedded techniques to search for the optimal set of predictors. In these techniques, feature selection is embedded in the model’s construction and interacts with the classifier. Least absolute shrinkage and selection operator (LASSO), used in this study, is a penalizing method in this category. LASSO regression includes in its objective function a penalty equal to the sum of the absolute values of the coefficients. As the absolute value function (L<sub>1</sub> norm) is not differentiable, the estimated coefficients are close to 0, and some will be exactly 0, resulting in an automatic variable selection. For this and the next experiments, 10-fold cross-validation with 20 repeats was used (leading to 200 repetitions in total). This number of repetitions is recommended to achieve desired accuracy for prediction performance estimation [<xref ref-type="bibr" rid="ref49">49</xref>].</p>
        </sec>
        <sec>
          <title>Predictive Modeling</title>
          <p>In the last assessment, we first trained a group of classification models, including DT, logistic regression (LR), and random forest (RF), on the indicator and imputed data matrices and evaluated their performance for predicting desired outcomes using the area under the curve of the receiver operating characteristic (AUROC) validation metric. Thereafter, new models were trained using the augmented data matrix and their performance was compared with that of the original to determine whether the indicators have predictive power and can boost the models’ predictive accuracy. We also investigated the predictive performance of SAPS-II score, and then we added indicators to these scores to examine the impact of indicators beyond SAPS-II score. It is worth mentioning that in this assessment, our interest is not in the absolute accuracy of the models but in the relative improvement in performance when indicators are included as input. That is, achieving the best possible mortality prediction AUROC is not the objective of this study.</p>
        </sec>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Population</title>
        <p>The analyses of the first 24 hours of ICU stays included 32,618 patients but decreased to 20,381 for the second 24-hour interval, as many patients were discharged after 24 hours. The third 24-hour period included 13,670 patients. Of these groups, 10.99% (3586/32,618), 13.59% (2769/20,381), and 16.19% (2213/13,670) experienced death in-hospital and 15.12% (4933/32,618), 18.26% (3722/20,381), and 21.32% (2915/13,670) experienced death within 30 days of discharge, respectively. <xref rid="figure2" ref-type="fig">Figure 2</xref> demonstrates the retrospective study design.</p>
      </sec>
      <sec>
        <title>Exploratory Analysis</title>
        <p>Missingness rates for LTs ranged from 1.36% (445/32,618) to 88.27% (12,066/13,670) in the first 72 hours after admission. <xref rid="figure3" ref-type="fig">Figure 3</xref> shows the missingness rate for LTs over 3 days. Absolute basophils (BA), absolute eosinophils (EO), absolute monocytes (MO), absolute lymphocytes (LY), absolute neutrophils (NE), alanine aminotransferase (ALT), alkaline phosphatase (ALK), aspartate aminotransferase (AST), total bilirubin (TBil), and lactate (Lac) were among the less-common LTs and were missing in the profiles of more than 60% of patients.</p>
        <p>We calculated the association between each indicator and the mortality flag. Although association values were small, on day 1, ALT, ALK, AST, and TBil stand out as the top LTs associated with both types of mortality.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>The retrospective cohort study design. LOS: length of stay.</p>
          </caption>
          <graphic xlink:href="medinform_v7i1e11605_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>The average missingness rate among patients for laboratory tests in the first 72 hours of admission.</p>
          </caption>
          <graphic xlink:href="medinform_v7i1e11605_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p/>
        <p>On days 2 and 3, partial pressure of carbon dioxide (PCO<sub>2</sub>), partial pressure of oxygen (PO<sub>2</sub>), and base excess (BE) were the top LTs associated with both mortality types. Lac also joined the top tests on day 2 for 30-day mortality. Detailed association values are provided in <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref>.</p>
        <p><xref rid="figure4" ref-type="fig">Figure 4</xref> visualizes the pairwise correlations among indicators. In total, 7 major groups of highly correlated (ρ ≥.95) indicators were observed in the results using Phi coefficient: (1) BA, MO, NE, EO, and LY; (2) mean corpuscular hemoglobin concentration (MCHC), red cell distribution width (RDW), mean corpuscular volume (MCV), red blood cell (RBC), and mean corpuscular hemoglobin (MCH); (3) BE, PCO<sub>2</sub>, and PO<sub>2</sub>; (4) TBil, ALT, AST, and ALK; (5) blood urea nitrogen (BUN) and creatinine (Cr); (6) chloride (Cl) and bicarbonate (HCO<sub>3</sub>); (7) partial thromboplastin time (PTT) and prothrombin time (PT).</p>
        <p>The Spearman correlation between missingness rates and ECI was also calculated daily. Results show a statistically significant correlation between these variables (day 1: ρ=–.233; day 2: ρ=–.196; day 3: ρ=–.184; <italic>P</italic>&lt;.001). The same assessment was done using SAPS-II. The results were in line with the previous one and demonstrate higher correlation (day 1: ρ=–.315; day 2: ρ=–.277; day 3: ρ=–.234; <italic>P</italic>&lt;.001). These findings are interesting as they confirm that the missingness of data is associated with patient severity of illness.</p>
      </sec>
      <sec>
        <title>Feature Selection: Missing Data Indicators as Important Predictors</title>
        <p>Each of the imputation methods was applied to the original dataset, and the potential informativeness of missingness indicators in comparison with actual variables was investigated using an ensemble of the most representative filter selection methods [<xref ref-type="bibr" rid="ref61">61</xref>]: LR beta value, relief, and InfGain. <xref ref-type="table" rid="table1">Table 1</xref> shows the top 18 variables selected on each day based on the PMM-generated imputed matrix predicting 30-day mortality. BUN, RDW, and anion gap (AG) were among the top variables in all 3 days. Indicators for TBil, phosphate (Phos), calcium (Ca), and Lac were selected on the first day, whereas indicators for Lac, BE, PO<sub>2</sub>, and PCO<sub>2</sub> were among the top features on the second and third days. PTT and pH indicators were also among the important indicators on the third day.</p>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>Visualization of the correlation matrix for variable indicators in first 72 hours.</p>
          </caption>
          <graphic xlink:href="medinform_v7i1e11605_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>The top 18 variables selected on each day after employing predictive mean matching imputation with regard to 30-day mortality. <italic>I</italic> at the beginning of the variables’ names means <italic>indicator</italic>. Numbers represent the ranking after aggregating the ranking results from the 3 different feature selection methods.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="170"/>
            <col width="170"/>
            <col width="170"/>
            <col width="160"/>
            <col width="170"/>
            <col width="160"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Day 1</td>
                <td colspan="2">Day 2</td>
                <td colspan="2">Day 3</td>
              </tr>
              <tr valign="top">
                <td>Variable</td>
                <td>Score</td>
                <td>Variable</td>
                <td>Score</td>
                <td>Variable</td>
                <td>Score</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="bottom">
                <td>BUN<sup>a</sup></td>
                <td>.762397</td>
                <td>AG<sup>b</sup></td>
                <td>.795419</td>
                <td>RDW<sup>c</sup></td>
                <td>.748997</td>
              </tr>
              <tr valign="bottom">
                <td>RDW</td>
                <td>.680087</td>
                <td>HCO<sub>3</sub><sup>d</sup></td>
                <td>.783337</td>
                <td>BUN</td>
                <td>.666667</td>
              </tr>
              <tr valign="bottom">
                <td>MCHC<sup>e</sup></td>
                <td>.668965</td>
                <td>BUN</td>
                <td>.77677</td>
                <td>HCO<sub>3</sub></td>
                <td>.544964</td>
              </tr>
              <tr valign="bottom">
                <td>AG</td>
                <td>.540484</td>
                <td>BE<sup>f</sup></td>
                <td>.609532</td>
                <td>BE</td>
                <td>.540542</td>
              </tr>
              <tr valign="bottom">
                <td>I-Ca<sup>g</sup></td>
                <td>.436429</td>
                <td>RDW</td>
                <td>.608711</td>
                <td>pH</td>
                <td>.488433</td>
              </tr>
              <tr valign="bottom">
                <td>Cr<sup>h</sup></td>
                <td>.436071</td>
                <td>I-PO<sub>2</sub><sup>i</sup></td>
                <td>.587151</td>
                <td>AG</td>
                <td>.450426</td>
              </tr>
              <tr valign="bottom">
                <td>HCO<sub>3</sub></td>
                <td>.416741</td>
                <td>I-PCO<sub>2</sub></td>
                <td>.585947</td>
                <td>I-Lac<sup>j</sup></td>
                <td>.418716</td>
              </tr>
              <tr valign="top">
                <td>PO<sub>2</sub><sup>k</sup></td>
                <td>.404289</td>
                <td>I-BE</td>
                <td>.585592</td>
                <td>I-pH</td>
                <td>.40463</td>
              </tr>
              <tr valign="bottom">
                <td>MCV<sup>l</sup></td>
                <td>.386964</td>
                <td>Cl<sup>m</sup></td>
                <td>.53158</td>
                <td>Cr</td>
                <td>.400008</td>
              </tr>
              <tr valign="bottom">
                <td>I-Phos<sup>n</sup></td>
                <td>.374431</td>
                <td>PT<sup>o</sup></td>
                <td>.462085</td>
                <td>Phos</td>
                <td>.387661</td>
              </tr>
              <tr valign="bottom">
                <td>PTT<sup>p</sup></td>
                <td>.353913</td>
                <td>Lac</td>
                <td>.461869</td>
                <td>I-PCO<sub>2</sub></td>
                <td>.387019</td>
              </tr>
              <tr valign="bottom">
                <td>HGB<sup>q</sup></td>
                <td>.342786</td>
                <td>Cr</td>
                <td>.451999</td>
                <td>I-PO<sub>2</sub></td>
                <td>.386739</td>
              </tr>
              <tr valign="top">
                <td>pH</td>
                <td>.32767</td>
                <td>PTT</td>
                <td>.424956</td>
                <td>I-BE</td>
                <td>.385935</td>
              </tr>
              <tr valign="bottom">
                <td>Lac</td>
                <td>.320339</td>
                <td>Na<sup>r</sup></td>
                <td>.422474</td>
                <td>PCO<sub>2</sub></td>
                <td>.367257</td>
              </tr>
              <tr valign="bottom">
                <td>BE</td>
                <td>.320299</td>
                <td>Phos</td>
                <td>.419171</td>
                <td>NE<sup>s</sup></td>
                <td>.360791</td>
              </tr>
              <tr valign="top">
                <td>I-Lac</td>
                <td>.318216</td>
                <td>I-Lac</td>
                <td>.415475</td>
                <td>MCV</td>
                <td>.351266</td>
              </tr>
              <tr valign="top">
                <td>PCO<sub>2</sub></td>
                <td>.316668</td>
                <td>MCV</td>
                <td>.368343</td>
                <td>I-PTT</td>
                <td>.338352</td>
              </tr>
              <tr valign="bottom">
                <td>I-TBil<sup>t</sup></td>
                <td>.31277</td>
                <td>MCHC</td>
                <td>.363146</td>
                <td>Lac</td>
                <td>.331205</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>BUN: blood urea nitrogen.</p>
            </fn>
            <fn id="table1fn2">
              <p><sup>b</sup>AG: anion gap.</p>
            </fn>
            <fn id="table1fn3">
              <p><sup>c</sup>RDW: red cell distribution width.</p>
            </fn>
            <fn id="table1fn4">
              <p><sup>d</sup>HCO<sub>3</sub>: bicarbonate.</p>
            </fn>
            <fn id="table1fn5">
              <p><sup>e</sup>MCHC: mean corpuscular hemoglobin concentration.</p>
            </fn>
            <fn id="table1fn6">
              <p><sup>f</sup>BE: base excess.</p>
            </fn>
            <fn id="table1fn7">
              <p><sup>g</sup>Ca: calcium.</p>
            </fn>
            <fn id="table1fn8">
              <p><sup>h</sup>Cr: creatinine.</p>
            </fn>
            <fn id="table1fn9">
              <p><sup>i</sup>PO<sub>2</sub>: partial pressure of oxygen.</p>
            </fn>
            <fn id="table1fn10">
              <p><sup>j</sup>Lac: lactate.</p>
            </fn>
            <fn id="table1fn11">
              <p><sup>k</sup>PCO<sub>2</sub>: partial pressure of carbon dioxide.</p>
            </fn>
            <fn id="table1fn12">
              <p><sup>l</sup>MCV: mean corpuscular volume.</p>
            </fn>
            <fn id="table1fn13">
              <p><sup>m</sup>Cl: chloride.</p>
            </fn>
            <fn id="table1fn14">
              <p><sup>n</sup>Phos: phosphate.</p>
            </fn>
            <fn id="table1fn15">
              <p><sup>o</sup>PT: prothrombin time.</p>
            </fn>
            <fn id="table1fn16">
              <p><sup>p</sup>PTT: partial thromboplastin time.</p>
            </fn>
            <fn id="table1fn17">
              <p><sup>q</sup>HGB: hemoglobin.</p>
            </fn>
            <fn id="table1fn18">
              <p><sup>r</sup>Na: sodium.</p>
            </fn>
            <fn id="table1fn19">
              <p><sup>s</sup>NE: absolute neutrophils.</p>
            </fn>
            <fn id="table1fn20">
              <p><sup>t</sup>TBil: total bilirubin.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p/>
        <p>Similar results were observed when using the HD imputation method, except that ALT and Phos were also selected on the first and second day, respectively. Moreover, PTT and pH indicators were not among the important indicators on the third day. Detailed results of this assessment can be found in <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref>.</p>
        <p>Results for in-hospital mortality were slightly different (<xref ref-type="table" rid="table2">Table 2</xref>). Although the selected indicators were almost the same as for 30-day mortality, more indicators were selected on the first day for in-hospital mortality, implying that indicators are more associated with in-hospital mortality than 30-day mortality. Detailed results are available in <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref>.</p>
        <p>To validate our previous results, we assessed the predictive power of the indicators using embedded feature selection methods. Each day, a LASSO model was trained on the augmented data from HD and PMM imputation using 10-fold cross-validation with 20 repeats. In general, the AUROC of mortality prediction (in-hospital and 30-day postdischarge) and number of selected variables decreased from days 1 to 3 (<xref ref-type="table" rid="table3">Table 3</xref>).</p>
        <p>Moreover, prediction of in-hospital mortality resulted in higher AUROCs than 30-day mortality. Regardless of mortality type, on all days, more than 40% of the predictors selected by the best-performing model were indicators. Moreover, more than 61% of selected predictors were indicators on the third day. Sliding lambda to compromise the predictor number and model performance led to almost the same results. Generally, more than 40% of the selected predictors were indicators, and on the third day, this number increased to 61%.</p>
        <p>Results in this section once more confirm the informativeness of missing data as missingness indicators have been selected by various feature selection methods. The high percentage of selected indicators also implies that the actual value of an LT is not always required in outcome prediction; instead, knowledge about whether the test was performed would suffice.</p>
      </sec>
      <sec>
        <title>Predictive Modeling: Missing Data Indicators in Predictive Modeling</title>
        <p>In the second assessment, we compared the performance of a set of 3 classification models (DT, LR, and RF) using the indicators, imputed and augmented data matrices, and SAPS-II score with or without indicators with 10-fold cross-validation over 20 repeats. We investigated whether including indicators can improve prediction and whether indicators alone have predictive power. For our LR, the iteratively reweighted least square method was used to fit the model. The complexity parameter (CP) for DT was tuned based on the model performance. On the basis of some preliminary model fitting, we set the CP value to vary from 0 (including all variables and having a large tree) to .02 for each model and then we picked the best performance model. In all models, the best-tuned model had a CP greater than 0. <xref rid="figure5" ref-type="fig">Figure 5</xref> shows the AUROC with 95% CI for all 3 days with regard to 30-day mortality (<xref ref-type="app" rid="app1">Multimedia Appendix 1</xref> provides the AUROC values for 30-day mortality and in-hospital mortality).</p>
        <p>Including indicators improved the AUROC in all modeling techniques, on average by 0.0511; the maximum improvement was 0.1209 (<xref rid="figure5" ref-type="fig">Figure 5</xref>). AUROC has been demonstrated as an insensitive metric, for which an increase of 0.01 suggests meaningful improvement and is clinically of interest [<xref ref-type="bibr" rid="ref62">62</xref>-<xref ref-type="bibr" rid="ref64">64</xref>]. Although using only indicators demonstrated reasonable performance in all scenarios (AUROC=0.6019 [0.0862]&gt;0.5), conventional scores such as SAPS-II perform better (AUROC=0.6390 [0.0853]) on their own. Therefore, models trained only on indicators are not sufficient. However, including indicators with conventional scores can improve the performance (AUROC=0.7263 [0.0578]). The SAPS-II score has information for age, heart rate, systolic blood pressure, Glasgow coma scale, temperature, mechanical ventilation administration, partial pressure of oxygen in the arterial blood (PaO<sub>2</sub>), fraction of inspired oxygen (FiO<sub>2</sub>), urine output, BUN, sodium (Na), potassium (K), HCO<sub>3</sub>, TBil, white blood cells (WBCs), presence of chronic diseases, and type of admission. These results demonstrate that indicators have information beyond that included in SAPS-II.</p>
        <p><xref rid="figure6" ref-type="fig">Figure 6</xref> demonstrates the AUROC curves for LR 30-day mortality prediction on day 1.</p>
        <p>This combination of findings provides more support for the informativeness of missing data. Employing the missing indicators in mortality prediction modeling can improve the results in comparison to not including them.</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>The top 18 variables selected on each day after employing predictive mean matching imputation with regard to in-hospital mortality. <italic>I</italic> at the beginning of the variables’ names means <italic>indicator</italic>. Numbers represent the ranking after aggregating the ranking results from the 3 different feature selection methods.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="170"/>
            <col width="170"/>
            <col width="170"/>
            <col width="160"/>
            <col width="170"/>
            <col width="160"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Day 1</td>
                <td colspan="2">Day 2</td>
                <td colspan="2">Day 3</td>
              </tr>
              <tr valign="top">
                <td>Variable</td>
                <td>Score</td>
                <td>Variable</td>
                <td>Score</td>
                <td>Variable</td>
                <td>Score</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="bottom">
                <td>BUN<sup>a</sup></td>
                <td>.825715</td>
                <td>BUN</td>
                <td>1</td>
                <td>RDW<sup>b</sup></td>
                <td>.75246</td>
              </tr>
              <tr valign="bottom">
                <td>AG<sup>c</sup></td>
                <td>.668918</td>
                <td>RDW</td>
                <td>.711852</td>
                <td>BUN</td>
                <td>.635729</td>
              </tr>
              <tr valign="bottom">
                <td>RDW</td>
                <td>.573188</td>
                <td>HCO<sub>3</sub><sup>d</sup></td>
                <td>.684191</td>
                <td>BE<sup>e</sup></td>
                <td>.633926</td>
              </tr>
              <tr valign="top">
                <td>HCO<sub>3</sub></td>
                <td>.531746</td>
                <td>AG</td>
                <td>.664339</td>
                <td>HCO<sub>3</sub></td>
                <td>.62367</td>
              </tr>
              <tr valign="bottom">
                <td>MCHC<sup>f</sup></td>
                <td>.507343</td>
                <td>BE</td>
                <td>.528778</td>
                <td>I-BE</td>
                <td>.595553</td>
              </tr>
              <tr valign="bottom">
                <td>PCO<sub>2</sub><sup>g</sup></td>
                <td>.489483</td>
                <td>MCHC</td>
                <td>.503805</td>
                <td>I-PCO<sub>2</sub></td>
                <td>.595238</td>
              </tr>
              <tr valign="bottom">
                <td>Cr<sup>h</sup></td>
                <td>.480181</td>
                <td>PT<sup>i</sup></td>
                <td>.453111</td>
                <td>I-PO<sub>2</sub><sup>j</sup></td>
                <td>.594924</td>
              </tr>
              <tr valign="bottom">
                <td>BE</td>
                <td>.452599</td>
                <td>Cl<sup>k</sup></td>
                <td>.429405</td>
                <td>pH</td>
                <td>.556242</td>
              </tr>
              <tr valign="bottom">
                <td>I-Lac<sup>l</sup></td>
                <td>.436382</td>
                <td>I-Lac</td>
                <td>.425279</td>
                <td>Phos<sup>m</sup></td>
                <td>.494694</td>
              </tr>
              <tr valign="top">
                <td>Lac</td>
                <td>.415773</td>
                <td>Cr</td>
                <td>.395266</td>
                <td>AG</td>
                <td>.492864</td>
              </tr>
              <tr valign="bottom">
                <td>HGB<sup>n</sup></td>
                <td>.414263</td>
                <td>I-PO<sub>2</sub></td>
                <td>.382404</td>
                <td>I-pH</td>
                <td>.470007</td>
              </tr>
              <tr valign="top">
                <td>pH</td>
                <td>.402466</td>
                <td>I-PCO<sub>2</sub></td>
                <td>.381737</td>
                <td>I-Lac</td>
                <td>.469215</td>
              </tr>
              <tr valign="bottom">
                <td>I-TBil<sup>o</sup></td>
                <td>.399363</td>
                <td>I-BE</td>
                <td>.381448</td>
                <td>Cr</td>
                <td>.415249</td>
              </tr>
              <tr valign="bottom">
                <td>I-Ca</td>
                <td>.395278</td>
                <td>PTT<sup>p</sup></td>
                <td>.357339</td>
                <td>Lac</td>
                <td>.396136</td>
              </tr>
              <tr valign="bottom">
                <td>I-ALT<sup>q</sup></td>
                <td>.376004</td>
                <td>Phos</td>
                <td>.352738</td>
                <td>NE<sup>r</sup></td>
                <td>.338372</td>
              </tr>
              <tr valign="bottom">
                <td>I-AST<sup>s</sup></td>
                <td>.375944</td>
                <td>Na<sup>t</sup></td>
                <td>.345109</td>
                <td>PT</td>
                <td>.326491</td>
              </tr>
              <tr valign="bottom">
                <td>LY<sup>u</sup></td>
                <td>.375163</td>
                <td>I-PT</td>
                <td>.333936</td>
                <td>LY</td>
                <td>.319146</td>
              </tr>
              <tr valign="bottom">
                <td>I-ALK<sup>v</sup></td>
                <td>.366346</td>
                <td>BG<sup>w</sup></td>
                <td>.320947</td>
                <td>MCV<sup>x</sup></td>
                <td>.314868</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>BUN: blood urea nitrogen.</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>RDW: red cell distribution width.</p>
            </fn>
            <fn id="table2fn3">
              <p><sup>c</sup>AG: anion gap.</p>
            </fn>
            <fn id="table2fn4">
              <p><sup>d</sup>HCO<sub>3</sub>: bicarbonate.</p>
            </fn>
            <fn id="table2fn5">
              <p><sup>e</sup>BE: base excess.</p>
            </fn>
            <fn id="table2fn6">
              <p><sup>f</sup>MCHC: mean corpuscular hemoglobin concentration.</p>
            </fn>
            <fn id="table2fn7">
              <p><sup>g</sup>PCO<sub>2</sub>: partial pressure of carbon dioxide.</p>
            </fn>
            <fn id="table2fn8">
              <p><sup>h</sup>Cr: creatinine.</p>
            </fn>
            <fn id="table2fn9">
              <p><sup>i</sup>PT: prothrombin time.</p>
            </fn>
            <fn id="table2fn10">
              <p><sup>j</sup>PO<sub>2</sub>: partial pressure of oxygen.</p>
            </fn>
            <fn id="table2fn11">
              <p><sup>k</sup>Cl: chloride.</p>
            </fn>
            <fn id="table2fn12">
              <p><sup>l</sup>Lac: lactate.</p>
            </fn>
            <fn id="table2fn13">
              <p><sup>m</sup>Phos: phosphate.</p>
            </fn>
            <fn id="table2fn14">
              <p><sup>n</sup>HGB: hemoglobin.</p>
            </fn>
            <fn id="table2fn15">
              <p><sup>o</sup>TBil: total bilirubin.</p>
            </fn>
            <fn id="table2fn16">
              <p><sup>p</sup>PTT: partial thromboplastin time.</p>
            </fn>
            <fn id="table2fn17">
              <p><sup>q</sup>ALT: alanine transaminase.</p>
            </fn>
            <fn id="table2fn18">
              <p><sup>r</sup>NE: absolute neutrophils.</p>
            </fn>
            <fn id="table2fn19">
              <p><sup>s</sup>AST: aspartate transaminase.</p>
            </fn>
            <fn id="table2fn20">
              <p><sup>t</sup>Na: sodium.</p>
            </fn>
            <fn id="table2fn21">
              <p><sup>u</sup>LY: absolute lymphocytes.</p>
            </fn>
            <fn id="table2fn22">
              <p><sup>v</sup>ALK: alkaline phosphatase.</p>
            </fn>
            <fn id="table2fn23">
              <p><sup>w</sup>BG: blood glucose.</p>
            </fn>
            <fn id="table2fn24">
              <p><sup>x</sup>MCV: mean corpuscular volume.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Results from feature selection by least absolute shrinkage and selection operator (LASSO) for 3 days (area under the curve of the receiver operating characteristics are reported with the SE). The <italic>best performing model</italic> refers to the model with a lambda value associated with minimum cross-validation error. The adjusted model refers to a LASSO model with the largest value of lambda such that the error remains within 1 SE of the minimum.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="30"/>
            <col width="490"/>
            <col width="150"/>
            <col width="150"/>
            <col width="150"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Criteria, outcome, and imputation method</td>
                <td>Day 1</td>
                <td>Day 2</td>
                <td>Day 3</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="6">
                  <bold>AUROC<sup>a</sup></bold>
                  <bold>for best performing model</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="5">
                  <bold>30-day mortality</bold>
                </td>
              </tr>
              <tr valign="bottom">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>HD<sup>b</sup></td>
                <td>0.7858 (0.0033)</td>
                <td>0.7685 (0.0041)</td>
                <td>0.7302 (0.0043)</td>
              </tr>
              <tr valign="bottom">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>PMM<sup>c</sup></td>
                <td>0.7876 (0.0039)</td>
                <td>0.7708 (0.0046)</td>
                <td>0.7391 (0.0053)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="5">
                  <bold>In-hospital mortality</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>HD</td>
                <td>0.7983 (0.0040)</td>
                <td>0.7804 (0.0046)</td>
                <td>0.7476 (0.0042)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>PMM</td>
                <td>0.8007 (0.0047)</td>
                <td>0.7838 (0.0049)</td>
                <td>0.7582 (0.0054)</td>
              </tr>
              <tr valign="top">
                <td colspan="6">
                  <bold>Indicators among selected predictors by the best performing model, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="5">
                  <bold>30-day mortality</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>HD</td>
                <td>23 (43)</td>
                <td>24 (48)</td>
                <td>19 (70)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>PMM</td>
                <td>26 (45)</td>
                <td>26 (47)</td>
                <td>17 (68)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="5">
                  <bold>In-hospital mortality</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>HD</td>
                <td>28 (46)</td>
                <td>29 (48)</td>
                <td>21 (60)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>PMM</td>
                <td>29 (47)</td>
                <td>27 (49)</td>
                <td>24 (62)</td>
              </tr>
              <tr valign="top">
                <td colspan="6">
                  <bold>AUROC for adjusted model</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="5">
                  <bold>30-day mortality</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>HD</td>
                <td>0.7826 (0.0034)</td>
                <td>0.7646 (0.0043)</td>
                <td>0.7262 (0.0041)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>PMM</td>
                <td>0.7840 (0.0038)</td>
                <td>0.7667 (0.0045)</td>
                <td>0.7339 (0.0044)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="5">
                  <bold>In-hospital mortality</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>HD</td>
                <td>0.7944 (0.0043)</td>
                <td>0.7762 (0.0047)</td>
                <td>0.7439 (0.0041)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>PMM</td>
                <td>0.7961 (0.0049)</td>
                <td>0.7793 (0.0050)</td>
                <td>0.7536 (0.0045)</td>
              </tr>
              <tr valign="top">
                <td colspan="6">
                  <bold>Indicators among selected predictors by the adjusted model, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="5">
                  <bold>30-day mortality</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>HD</td>
                <td>20 (45)</td>
                <td>16 (48)</td>
                <td>22 (67)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>PMM</td>
                <td>19 (45)</td>
                <td>16 (52)</td>
                <td>31 (62)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="5">
                  <bold>In-hospital mortality</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>HD</td>
                <td>20 (47)</td>
                <td>13 (42)</td>
                <td>16 (64)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>PMM</td>
                <td>18 (50)</td>
                <td>11 (41)</td>
                <td>16 (62)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>AUROC: area under the curve of the receiver operating characteristic.</p>
            </fn>
            <fn id="table3fn2">
              <p><sup>b</sup>HD: hot deck.</p>
            </fn>
            <fn id="table3fn3">
              <p><sup>c</sup>PMM: predictive mean matching.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <fig id="figure5" position="float">
          <label>Figure 5</label>
          <caption>
            <p>The 95% CIs of the area under the curve of the receiver operating characteristic for logistic regression, decision tree, and random forest models on missingness indicators, Simplified Acute Physiology Score II, and actual variables with and without the missingness indicators.</p>
          </caption>
          <graphic xlink:href="medinform_v7i1e11605_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure6" position="float">
          <label>Figure 6</label>
          <caption>
            <p>The receiver operating characteristic curves for logistic regression 30-day mortality prediction on day 1.</p>
          </caption>
          <graphic xlink:href="medinform_v7i1e11605_fig6.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>We used missingness indicators to represent missing information in patient profiles in the ICU. The informativeness of these indicators was demonstrated in 3 sets of assessments. First, our exploratory analysis confirms that the missingness of data is associated with patient severity of illness or comorbidities. Afterward, by means of feature selection methods, the predictive power of the presence of an LT in the patient profile was found to be greater than that of the actual measured value. Finally, missingness indicators noticeably improved the performance of mortality prediction models. The high correlation observed among some of the variable indicators suggests that all the variables in a set are typically measured or ordered together. Therefore, if a patient is missing 1 variable of a set, he or she will likely be missing the others as well. This fact is well represented in all 7 groups. The first group comprises the differential WBC counts (BA, MO, NE, EO, and LY), which itemize the number of basophils, monocytes, neutrophils, eosinophils, and lymphocytes among present WBCs. The second group (RDW, MCHC, MCV, RBC, and MCH) comprises tests that are used to measure the actual number of RBCs and their physical characteristics. The third group (BE, PCO<sub>2</sub>, and PO<sub>2</sub>) consists of blood gas components and focuses on oxygen and carbon dioxide pressure as well as excess or deficit of base levels in the blood. TBil, ALT, AST, and ALK in the fourth group are liver enzymes [<xref ref-type="bibr" rid="ref65">65</xref>] that are ordered when a patient is suffering from or showing symptoms of a liver-related comorbidity. BUN and Cr mainly focus on kidney function. Bicarbonate (HCO<sub>3</sub>) and chloride (Cl) are the primary measured anions in the blood. PT and PTT are used for investigating hemostasis and are the starting points for looking into potential bleeding or clotting complications.
Therefore, the presence of a clinical variable in a patient profile can represent a comorbidity in the patient. Although LTs are mainly ordered for diagnostic and prognostic reasons, studies have shown widely diverse test-ordering behavior among clinicians for similar symptoms [<xref ref-type="bibr" rid="ref66">66</xref>-<xref ref-type="bibr" rid="ref68">68</xref>]. Therefore, indicators could also reflect the opinions, preconceptions, and biases of the treating clinicians. In other words, by using the missingness indicators, we are learning from practice patterns rather than physiologic patterns. Therefore, indicators as introduced in this study can then be used for modeling health care process in various applications such as clinical care, clinical research, health care economics, and health care policy [<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref69">69</xref>].</p>
        <p>Filter methods verified the importance of some indicators with regard to our outcomes. Results also demonstrated that indicators become more and more important on ICU days 2 and 3 (<xref ref-type="table" rid="table1">Tables 1</xref> and <xref ref-type="table" rid="table2">2</xref>). This observation aligns with clinical practice in which ICU clinicians might try to get a complete dataset on day 1 to fully investigate the patient and understand the situation but are likely to be more selective with LT ordering on subsequent days. The Lac indicator was associated with 30-day and in-hospital mortality on the second and third day. Lactate is usually used as a biomarker for shock states. The literature has consistently reported an association between lactate levels and mortality rates among critically ill patients [<xref ref-type="bibr" rid="ref70">70</xref>]. Our study demonstrated that just the presence of this information could represent the severity of a patient’s illness, as patients with profound shock have a very high mortality rate in hospitals and ICUs [<xref ref-type="bibr" rid="ref71">71</xref>]. Moreover, BUN [<xref ref-type="bibr" rid="ref72">72</xref>-<xref ref-type="bibr" rid="ref74">74</xref>], RDW [<xref ref-type="bibr" rid="ref75">75</xref>-<xref ref-type="bibr" rid="ref79">79</xref>], and AG [<xref ref-type="bibr" rid="ref80">80</xref>-<xref ref-type="bibr" rid="ref83">83</xref>] have been repeatedly identified as risk factors for all-cause mortality, and their indicators received high scores in our analysis. These results are consistent with those of Agniel et al [<xref ref-type="bibr" rid="ref21">21</xref>], who demonstrated that the presence of these tests has a significant association with the odds of 3-year survival.</p>
        <p>The LASSO model selected indicators among the clinical predictors of in-hospital mortality and 30-day mortality, implying the predictive power of indicators. More indicators than clinical variables were selected on the third day (60%-70% of selected predictors were indicators); the assessment demonstrates that indicators from the third day are more informative than those from the first, again supporting the idea that the practice patterns diverge later during ICU stays, so there is more variability in what gets measured. In other words, care on the first day is likely to be highly protocolized—all patients get the same tests regardless of their condition because their trajectory is still unclear. As time goes on, the patterns become more evident and ordering and prescribing practices change according to clinical need. This high percentage of selected indicators suggests that clinical variables are not always required in outcome prediction; instead, information about their presence would suffice.</p>
        <p>The last assessment demonstrated that models trained on indicators alone in some scenarios have reasonable performance (for instance, in 30-day mortality prediction with LR, we achieved AUROC of 0.6836 [0.012]). These results imply that by considering missing data as noise or a random artifact, we can lose valuable information about patient outcomes. Moreover, indicators improved the AUROCs in most scenarios. Researchers in this field are looking for predictors that can be included in the models to improve the prediction results. Having a low-dimensional set of typical predictors plus these missing data indicators can actually lead to performance comparable with that achieved using typical predictors plus other potentially useful predictors identified a priori by medical researchers: First, in comparison with including extra numeric predictors, the computational load for performing mathematical calculations on binary values such as indicators is usually less. Second, binary data require less computational memory than numbers when performing data mining techniques. Finally, for some important clinical variables, storing the missing data indicators instead of the actual value better protects patient privacy while preserving predictive power. In other words, less privacy concern is expected in a situation when the type of test is disclosed rather than the actual test result. The comparative analyses on the predictive models showed that missing data indicators could improve the prediction models’ performance. Although literature considers a small increase (0.01) in AUROC meaningful and of clinical interest (because of insensitivity of AUROC) [<xref ref-type="bibr" rid="ref62">62</xref>,<xref ref-type="bibr" rid="ref64">64</xref>], including the indicators in our study could improve the average AUROC by 0.0511. Thus, missing data indicators can be introduced as informative predictors and be used to learn from. 
In other words, these indicators can be representative of physicians’ and patients’ opinions during the health care process. Furthermore, the overall model performance decreased over time, perhaps implying that patients’ data from the first 24 hours have the highest level of information. The same pattern was also observed in the previous assessment. According to these observations, we can infer that the presence or absence of a variable can be used in predicting patients’ severity of illness.</p>
      </sec>
      <sec>
        <title>Strengths and Limitations of the Project</title>
        <p>A significant strength of this study is its new insight on missing data in a real-world ICU database. The results confirm the predictive power of some indicators and their advantage over actual values in predictive modeling. The findings further clarify the factors associated with lack of data collection such as the healthier status of a patient or practice patterns of clinicians. These insights, in turn, can be used to design models that consider missing data and benefit from the hidden information. On the basis of our results, missingness indicators can be introduced as potential predictors of ICU patients’ outcome.</p>
        <p>Despite the strength, significance, and novel nature of this study, there also exist limitations that cannot be overlooked. First, because of the nature of ICUs, the amount of missing data in MIMIC is less than that from a general ward. Therefore, our study may not fully demonstrate the informativeness of these indicators. Moreover, adding the indicators of interest to the actual data matrix increases the dimension of the matrix and may become computationally burdensome. Using other imputation methods, the power of missing data indicators may vary but this was beyond the scope of our study, which focused on providing evidence on missing data informativeness.</p>
      </sec>
      <sec>
        <title>Perspectives for Future Work</title>
        <p>Although our study demonstrates that missingness indicators are informative and have predictive power in mortality prediction in ICU, further studies are required to investigate their power in predicting other clinical outcomes. Future researchers can investigate the association between missingness patterns and patient diagnosis. They can also consider more sensitive criteria such as net reclassification or integrated discrimination improvements while preserving improvement in the AUROC as the first criterion. Moreover, as this study looked at the 3 days in the ICU independently, one can investigate if the missing data on a particular day are still informative given all the clinical and indicator variables from previous days. These future studies should also investigate the effect of missing rate on the predictive power of indicators. Another area of future work is examining the test-ordering behavior among clinicians, by using missingness indicators.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>Our study has demonstrated that the missingness of data itself might be informative in ICU and might have added predictive value beyond observed data alone. Moreover, indicators for variables with higher missingness rates had more predictive power. In practice, the lack of a set of symptoms might lead health professionals to conclude that a particular set of tests is not required at the current stage. Therefore, these missing data are not a random occurrence. This study showed that the number of comorbidities is associated with a decreased rate of missing data. Therefore, rudimentary treatments of missing data (eg, CCA) can cause bias toward sicker patients. The study is also notable because it provided new insight about the informativeness of missing data and described how this information could be used in predicting mortality.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Detailed results.</p>
        <media xlink:href="medinform_v7i1e11605_app1.pdf" xlink:title="PDF File  (Adobe PDF File), 165 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">ACA</term>
          <def>
            <p>available case analysis</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">AG</term>
          <def>
            <p>anion gap</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">ALK</term>
          <def>
            <p>alkaline phosphatase</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">ALT</term>
          <def>
            <p>alanine aminotransferase</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">ASA</term>
          <def>
            <p>American Society of Anesthesiologists physical status</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">AST</term>
          <def>
            <p>aspartate aminotransferase</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">AUROC</term>
          <def>
            <p>area under the curve of the receiver operating characteristic</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">BA</term>
          <def>
            <p>basophils</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">BE</term>
          <def>
            <p>base excess</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">BG</term>
          <def>
            <p>blood glucose</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">BUN</term>
          <def>
            <p>blood urea nitrogen</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb12">Ca</term>
          <def>
            <p>calcium</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb13">CCA</term>
          <def>
            <p>complete case analysis</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb14">Cl</term>
          <def>
            <p>chloride</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb15">CP</term>
          <def>
            <p>complexity parameter</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb16">Cr</term>
          <def>
            <p>creatinine</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb17">DT</term>
          <def>
            <p>decision tree</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb18">ECI</term>
          <def>
            <p>Elixhauser Comorbidity Index</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb19">EHR</term>
          <def>
            <p>electronic health record</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb20">EO</term>
          <def>
            <p>eosinophils</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb21">FiO<sub>2</sub></term>
          <def>
            <p>fraction of inspired oxygen</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb22">HCO<sub>3</sub></term>
          <def>
            <p>bicarbonate</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb23">HCT</term>
          <def>
            <p>hematocrit</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb24">HD</term>
          <def>
            <p>hot deck</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb25">HGB</term>
          <def>
            <p>hemoglobin</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb26">ICU</term>
          <def>
            <p>intensive care unit</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb27">InfGain</term>
          <def>
            <p>information gain</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb28">K</term>
          <def>
            <p>potassium</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb29">Lac</term>
          <def>
            <p>lactate</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb30">LASSO</term>
          <def>
            <p>least absolute shrinkage and selection operator</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb31">LR</term>
          <def>
            <p>logistic regression</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb32">LT</term>
          <def>
            <p>laboratory test</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb33">LY</term>
          <def>
            <p>lymphocytes</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb34">MAR</term>
          <def>
            <p>missing at random</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb35">MCAR</term>
          <def>
            <p>missing completely at random</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb36">MCH</term>
          <def>
            <p>mean corpuscular hemoglobin</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb37">MCHC</term>
          <def>
            <p>mean corpuscular hemoglobin concentration</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb38">MCV</term>
          <def>
            <p>mean corpuscular volume</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb39">Mg</term>
          <def>
            <p>magnesium</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb40">MIMIC</term>
          <def>
            <p>Medical Information Mart for Intensive Care</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb41">ML</term>
          <def>
            <p>machine learning</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb42">MO</term>
          <def>
            <p>monocytes</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb43">Na</term>
          <def>
            <p>sodium</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb44">NE</term>
          <def>
            <p>neutrophils</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb45">PaO<sub>2</sub></term>
          <def>
            <p>partial pressure of oxygen in the arterial blood</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb46">PCO<sub>2</sub></term>
          <def>
            <p>partial pressure of carbon dioxide</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb47">Phos</term>
          <def>
            <p>phosphate</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb48">PLT</term>
          <def>
            <p>platelet count</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb49">PMM</term>
          <def>
            <p>predictive mean matching</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb50">PO<sub>2</sub></term>
          <def>
            <p>partial pressure of oxygen</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb51">PT</term>
          <def>
            <p>prothrombin time</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb52">PTT</term>
          <def>
            <p>partial thromboplastin time</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb53">RBC</term>
          <def>
            <p>red blood cell</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb54">RDW</term>
          <def>
            <p>red cell distribution width</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb55">RF</term>
          <def>
            <p>random forest</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb56">SAPS-II</term>
          <def>
            <p>Simplified Acute Physiology Score II</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb57">TBil</term>
          <def>
            <p>total bilirubin</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb58">WBC</term>
          <def>
            <p>white blood cell</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This study was supported by the Natural Sciences and Engineering Research Council of Canada (NSERC) Discovery Grant (RGPIN-2014-04743, RGPIN-2014-05911) and Early Researcher Award (Ministry of Research and Innovation, Government of Ontario).</p>
    </ack>
    <fn-group>
      <fn fn-type="con">
        <p>Study conception and design were conducted by AS, JAD, DMM, and JL. AS extracted data and performed the data analysis. Interpretation of the results was provided by all authors. All authors contributed to writing the paper and approved the final version of the manuscript.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Weiskopf</surname>
              <given-names>NG</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Methods and dimensions of electronic health record data quality assessment: enabling reuse for clinical research</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2013</year>
          <month>01</month>
          <day>1</day>
          <volume>20</volume>
          <issue>1</issue>
          <fpage>144</fpage>
          <lpage>51</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://jamia.oxfordjournals.org/cgi/pmidlookup?view=long&amp;pmid=22733976"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/amiajnl-2011-000681</pub-id>
          <pub-id pub-id-type="medline">22733976</pub-id>
          <pub-id pub-id-type="pii">amiajnl-2011-000681</pub-id>
          <pub-id pub-id-type="pmcid">PMC3555312</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chan</surname>
              <given-names>KS</given-names>
            </name>
            <name name-style="western">
              <surname>Fowles</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Weiner</surname>
              <given-names>JP</given-names>
            </name>
          </person-group>
          <article-title>Review: electronic health records and the reliability and validity of quality measures: a review of the literature</article-title>
          <source>Med Care Res Rev</source>
          <year>2010</year>
          <month>10</month>
          <volume>67</volume>
          <issue>5</issue>
          <fpage>503</fpage>
          <lpage>27</lpage>
          <pub-id pub-id-type="doi">10.1177/1077558709359007</pub-id>
          <pub-id pub-id-type="medline">20150441</pub-id>
          <pub-id pub-id-type="pii">1077558709359007</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Weiskopf</surname>
              <given-names>NG</given-names>
            </name>
            <name name-style="western">
              <surname>Hripcsak</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Swaminathan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Defining and measuring completeness of electronic health records for secondary use</article-title>
          <source>J Biomed Inform</source>
          <year>2013</year>
          <month>10</month>
          <volume>46</volume>
          <issue>5</issue>
          <fpage>830</fpage>
          <lpage>6</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(13)00085-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2013.06.010</pub-id>
          <pub-id pub-id-type="medline">23820016</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(13)00085-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC3810243</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wells</surname>
              <given-names>BJ</given-names>
            </name>
            <name name-style="western">
              <surname>Chagin</surname>
              <given-names>KM</given-names>
            </name>
            <name name-style="western">
              <surname>Nowacki</surname>
              <given-names>AS</given-names>
            </name>
            <name name-style="western">
              <surname>Kattan</surname>
              <given-names>MW</given-names>
            </name>
          </person-group>
          <article-title>Strategies for handling missing data in electronic health record derived data</article-title>
          <source>EGEMS (Wash DC)</source>
          <year>2013</year>
          <volume>1</volume>
          <issue>3</issue>
          <fpage>1035</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/25848578"/>
          </comment>
          <pub-id pub-id-type="doi">10.13063/2327-9214.1035</pub-id>
          <pub-id pub-id-type="medline">25848578</pub-id>
          <pub-id pub-id-type="pii">egems1035</pub-id>
          <pub-id pub-id-type="pmcid">PMC4371484</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Little</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>D'Agostino</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Dickersin</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Emerson</surname>
              <given-names>SS</given-names>
            </name>
            <name name-style="western">
              <surname>Farrar</surname>
              <given-names>JT</given-names>
            </name>
            <name name-style="western">
              <surname>Frangakis</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Hogan</surname>
              <given-names>JW</given-names>
            </name>
            <name name-style="western">
              <surname>Molenberghs</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Murphy</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Neaton</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Rotnitzky</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Scharfstein</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Shih</surname>
              <given-names>WJ</given-names>
            </name>
            <name name-style="western">
              <surname>Siegel</surname>
              <given-names>JP</given-names>
            </name>
            <name name-style="western">
              <surname>Stern</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>The prevention and treatment of missing data in clinical trials</article-title>
          <source>N Engl J Med</source>
          <year>2012</year>
          <month>10</month>
          <day>4</day>
          <volume>367</volume>
          <issue>14</issue>
          <fpage>1355</fpage>
          <lpage>60</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/23034025"/>
          </comment>
          <pub-id pub-id-type="doi">10.1056/NEJMsr1203730</pub-id>
          <pub-id pub-id-type="medline">23034025</pub-id>
          <pub-id pub-id-type="pmcid">PMC3771340</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sterne</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>White</surname>
              <given-names>IR</given-names>
            </name>
            <name name-style="western">
              <surname>Carlin</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Spratt</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Royston</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Kenward</surname>
              <given-names>MG</given-names>
            </name>
            <name name-style="western">
              <surname>Wood</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Carpenter</surname>
              <given-names>JR</given-names>
            </name>
          </person-group>
          <article-title>Multiple imputation for missing data in epidemiological and clinical research: potential and pitfalls</article-title>
          <source>Br Med J</source>
          <year>2009</year>
          <volume>338</volume>
          <fpage>b2393</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/19564179"/>
          </comment>
          <pub-id pub-id-type="medline">19564179</pub-id>
          <pub-id pub-id-type="pmcid">PMC2714692</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Haukoos</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Newgard</surname>
              <given-names>CD</given-names>
            </name>
          </person-group>
          <article-title>Advanced statistics: missing data in clinical research—part 1: an introduction and conceptual framework</article-title>
          <source>Acad Emerg Med</source>
          <year>2007</year>
          <month>07</month>
          <volume>14</volume>
          <issue>7</issue>
          <fpage>662</fpage>
          <lpage>8</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://onlinelibrary.wiley.com/resolve/openurl?genre=article&amp;sid=nlm:pubmed&amp;issn=1069-6563&amp;date=2007&amp;volume=14&amp;issue=7&amp;spage=662"/>
          </comment>
          <pub-id pub-id-type="doi">10.1197/j.aem.2006.11.037</pub-id>
          <pub-id pub-id-type="medline">17538078</pub-id>
          <pub-id pub-id-type="pii">j.aem.2006.11.037</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Newgard</surname>
              <given-names>CD</given-names>
            </name>
            <name name-style="western">
              <surname>Haukoos</surname>
              <given-names>JS</given-names>
            </name>
          </person-group>
          <article-title>Advanced statistics: missing data in clinical research—part 2: multiple imputation</article-title>
          <source>Acad Emerg Med</source>
          <year>2007</year>
          <month>07</month>
          <volume>14</volume>
          <issue>7</issue>
          <fpage>669</fpage>
          <lpage>78</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://onlinelibrary.wiley.com/resolve/openurl?genre=article&amp;sid=nlm:pubmed&amp;issn=1069-6563&amp;date=2007&amp;volume=14&amp;issue=7&amp;spage=669"/>
          </comment>
          <pub-id pub-id-type="doi">10.1197/j.aem.2006.11.038</pub-id>
          <pub-id pub-id-type="medline">17595237</pub-id>
          <pub-id pub-id-type="pii">j.aem.2006.11.038</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pringle</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ward</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Chilvers</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Assessment of the completeness and accuracy of computer medical records in four practices committed to recording data on computer</article-title>
          <source>Br J Gen Pract</source>
          <year>1995</year>
          <month>10</month>
          <volume>45</volume>
          <issue>399</issue>
          <fpage>537</fpage>
          <lpage>41</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://bjgp.org/cgi/pmidlookup?view=long&amp;pmid=7492423"/>
          </comment>
          <pub-id pub-id-type="medline">7492423</pub-id>
          <pub-id pub-id-type="pmcid">PMC1239405</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Thiru</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>de Lusignan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hague</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Have the completeness and accuracy of computer medical records in general practice improved in the last five years? The report of a two-practice pilot study</article-title>
          <source>Health Informatics J</source>
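          <!-- Original record gave 2016-07-25, which appears to be an online-posting date; volume 5, issue 4 is the 1999 volume (the DOI also encodes "99"). TODO confirm month. -->
          <year>1999</year>
          <month>12</month>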
          <volume>5</volume>
          <issue>4</issue>
          <fpage>224</fpage>
          <lpage>232</lpage>
          <pub-id pub-id-type="doi">10.1177/146045829900500410</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Forster</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bailey</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Brinkhof</surname>
              <given-names>MW</given-names>
            </name>
            <name name-style="western">
              <surname>Graber</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Boulle</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Spohr</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Balestre</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>May</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Keiser</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Jahn</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Egger</surname>
              <given-names>M</given-names>
            </name>
            <collab>ART-LINC collaboration of International Epidemiological Databases to Evaluate AIDS</collab>
          </person-group>
          <article-title>Electronic medical record systems, data quality and loss to follow-up: survey of antiretroviral therapy programmes in resource-limited settings</article-title>
          <source>Bull World Health Organ</source>
          <year>2008</year>
          <month>12</month>
          <volume>86</volume>
          <issue>12</issue>
          <fpage>939</fpage>
          <lpage>47</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.scielosp.org/scielo.php?script=sci_arttext&amp;pid=S0042-96862008001200011&amp;lng=en&amp;nrm=iso&amp;tlng=en"/>
          </comment>
          <pub-id pub-id-type="medline">19142294</pub-id>
          <pub-id pub-id-type="pii">S0042-96862008001200011</pub-id>
          <pub-id pub-id-type="pmcid">PMC2649575</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>RB</given-names>
            </name>
            <name name-style="western">
              <surname>Hedley</surname>
              <given-names>AJ</given-names>
            </name>
          </person-group>
          <article-title>A computer in the diabetic clinic. Completeness of data in a clinical information system for diabetes</article-title>
          <source>Pract Diab Int</source>
          <year>1986</year>
          <month>11</month>
          <volume>3</volume>
          <issue>6</issue>
          <fpage>295</fpage>
          <lpage>296</lpage>
          <pub-id pub-id-type="doi">10.1002/pdi.1960030610</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Porcheret</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hughes</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Evans</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Jordan</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Whitehurst</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ogden</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Croft</surname>
              <given-names>P</given-names>
            </name>
            <collab>North Staffordshire General Practice Research Network</collab>
          </person-group>
          <article-title>Data quality of general practice electronic health records: the impact of a program of assessments, feedback, and training</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2004</year>
          <volume>11</volume>
          <issue>1</issue>
          <fpage>78</fpage>
          <lpage>86</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/14527973"/>
          </comment>
          <pub-id pub-id-type="doi">10.1197/jamia.M1362</pub-id>
          <pub-id pub-id-type="medline">14527973</pub-id>
          <pub-id pub-id-type="pii">M1362</pub-id>
          <pub-id pub-id-type="pmcid">PMC305461</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Soto</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Kleinman</surname>
              <given-names>KP</given-names>
            </name>
            <name name-style="western">
              <surname>Simon</surname>
              <given-names>SR</given-names>
            </name>
          </person-group>
          <article-title>Quality and correlates of medical record documentation in the ambulatory care setting</article-title>
          <source>BMC Health Serv Res</source>
          <year>2002</year>
          <month>12</month>
          <day>10</day>
          <volume>2</volume>
          <issue>1</issue>
          <fpage>22</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/12473161"/>
          </comment>
          <pub-id pub-id-type="medline">12473161</pub-id>
          <pub-id pub-id-type="pmcid">PMC140026</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>PC</given-names>
            </name>
            <name name-style="western">
              <surname>LaRosa</surname>
              <given-names>MP</given-names>
            </name>
            <name name-style="western">
              <surname>Gorden</surname>
              <given-names>SM</given-names>
            </name>
          </person-group>
          <article-title>Use of computer-based records, completeness of documentation, and appropriateness of documented clinical decisions</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>1999</year>
          <month>05</month>
          <day>01</day>
          <volume>6</volume>
          <issue>3</issue>
          <fpage>245</fpage>
          <lpage>251</lpage>
          <pub-id pub-id-type="doi">10.1136/jamia.1999.0060245</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jensen</surname>
              <given-names>RE</given-names>
            </name>
            <name name-style="western">
              <surname>Chan</surname>
              <given-names>KS</given-names>
            </name>
            <name name-style="western">
              <surname>Weiner</surname>
              <given-names>JP</given-names>
            </name>
            <name name-style="western">
              <surname>Fowles</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Neale</surname>
              <given-names>SM</given-names>
            </name>
          </person-group>
          <article-title>Implementing electronic health record-based quality measures for developmental screening</article-title>
          <source>Pediatrics</source>
          <year>2009</year>
          <month>10</month>
          <volume>124</volume>
          <issue>4</issue>
          <fpage>e648</fpage>
          <lpage>54</lpage>
          <pub-id pub-id-type="doi">10.1542/peds.2008-3091</pub-id>
          <pub-id pub-id-type="medline">19786425</pub-id>
          <pub-id pub-id-type="pii">peds.2008-3091</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Botsis</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Hartvigsen</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Secondary use of EHR: data quality issues and informatics opportunities</article-title>
          <source>AMIA Jt Summits Transl Sci Proc</source>
          <year>2010</year>
          <month>03</month>
          <day>01</day>
          <volume>2010</volume>
          <fpage>1</fpage>
          <lpage>5</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/21347133"/>
          </comment>
          <pub-id pub-id-type="medline">21347133</pub-id>
          <pub-id pub-id-type="pmcid">PMC3041534</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sharafoddini</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Dubin</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Patient similarity in prediction models based on health data: a scoping review</article-title>
          <source>JMIR Med Inform</source>
          <year>2017</year>
          <month>03</month>
          <day>03</day>
          <volume>5</volume>
          <issue>1</issue>
          <fpage>e7</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://medinform.jmir.org/2017/1/e7/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/medinform.6730</pub-id>
          <pub-id pub-id-type="medline">28258046</pub-id>
          <pub-id pub-id-type="pii">v5i1e7</pub-id>
          <pub-id pub-id-type="pmcid">PMC5357318</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rusanov</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Weiskopf</surname>
              <given-names>NG</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Hidden in plain sight: bias towards sick patients when sampling patients with sufficient electronic health record data for research</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2014</year>
          <month>06</month>
          <day>11</day>
          <volume>14</volume>
          <fpage>51</fpage>
          <pub-id pub-id-type="doi">10.1186/1472-6947-14-51</pub-id>
          <pub-id pub-id-type="medline">24916006</pub-id>
          <pub-id pub-id-type="pii">1472-6947-14-51</pub-id>
          <pub-id pub-id-type="pmcid">PMC4062889</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Weiskopf</surname>
              <given-names>NG</given-names>
            </name>
            <name name-style="western">
              <surname>Rusanov</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Sick patients have more data: the non-random completeness of electronic health records</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2013</year>
          <volume>2013</volume>
          <fpage>1472</fpage>
          <lpage>7</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/24551421"/>
          </comment>
          <pub-id pub-id-type="medline">24551421</pub-id>
          <pub-id pub-id-type="pmcid">PMC3900159</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Agniel</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Kohane</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Weber</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Biases in electronic health record data due to processes within the healthcare system: retrospective observational study</article-title>
          <source>Br Med J</source>
          <year>2018</year>
          <month>04</month>
          <day>30</day>
          <volume>361</volume>
          <fpage>k1479</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.bmj.com/cgi/pmidlookup?view=long&amp;pmid=29712648"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmj.k1479</pub-id>
          <pub-id pub-id-type="medline">29712648</pub-id>
          <pub-id pub-id-type="pmcid">PMC5925441</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kuhn</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <source>Applied Predictive Modeling</source>
          <year>2013</year>
          <publisher-loc>New York</publisher-loc>
          <publisher-name>Springer</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Maslove</surname>
              <given-names>DM</given-names>
            </name>
          </person-group>
          <article-title>Using information theory to identify redundancy in common laboratory tests in the intensive care unit</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2015</year>
          <month>07</month>
          <day>31</day>
          <volume>15</volume>
          <fpage>59</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/s12911-015-0187-x"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12911-015-0187-x</pub-id>
          <pub-id pub-id-type="medline">26227625</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12911-015-0187-x</pub-id>
          <pub-id pub-id-type="pmcid">PMC4521317</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Oliveira</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Oliveira</surname>
              <given-names>MV</given-names>
            </name>
            <name name-style="western">
              <surname>Souza</surname>
              <given-names>CL</given-names>
            </name>
          </person-group>
          <article-title>Prevalence of unnecessary laboratory tests and related avoidable costs in intensive care unit</article-title>
          <source>J Bras Patol Med Lab</source>
          <year>2014</year>
          <volume>50</volume>
          <fpage>410</fpage>
          <lpage>6</lpage>
          <pub-id pub-id-type="doi">10.5935/1676-2444.20140049</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cismondi</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Celi</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Fialho</surname>
              <given-names>AS</given-names>
            </name>
            <name name-style="western">
              <surname>Vieira</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Reti</surname>
              <given-names>SR</given-names>
            </name>
            <name name-style="western">
              <surname>Sousa</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Finkelstein</surname>
              <given-names>SN</given-names>
            </name>
          </person-group>
          <article-title>Reducing unnecessary lab testing in the ICU with artificial intelligence</article-title>
          <source>Int J Med Inform</source>
          <year>2013</year>
          <month>05</month>
          <volume>82</volume>
          <issue>5</issue>
          <fpage>345</fpage>
          <lpage>58</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/23273628"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2012.11.017</pub-id>
          <pub-id pub-id-type="medline">23273628</pub-id>
          <pub-id pub-id-type="pii">S1386-5056(12)00242-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC5694620</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rothwell</surname>
              <given-names>PM</given-names>
            </name>
          </person-group>
          <article-title>External validity of randomised controlled trials: “to whom do the results of this trial apply?”</article-title>
          <source>Lancet</source>
          <year>2005</year>
          <volume>365</volume>
          <issue>9453</issue>
          <fpage>82</fpage>
          <lpage>93</lpage>
          <pub-id pub-id-type="doi">10.1016/S0140-6736(04)17670-8</pub-id>
          <pub-id pub-id-type="medline">15639683</pub-id>
          <pub-id pub-id-type="pii">S0140-6736(04)17670-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Doyle</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Garmon</surname>
              <given-names>EH</given-names>
            </name>
          </person-group>
          <article-title>American Society of Anesthesiologists Classification (ASA Class)</article-title>
          <source>StatPearls</source>
          <year>2018</year>
          <pub-id pub-id-type="medline">28722969</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vesin</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Azoulay</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Ruckly</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Vignoud</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Rusinovà</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Benoit</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Soares</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Azeivedo-Maia</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Abroug</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Benbenishty</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Timsit</surname>
              <given-names>JF</given-names>
            </name>
          </person-group>
          <article-title>Reporting and handling missing values in clinical studies in intensive care units</article-title>
          <source>Intensive Care Med</source>
          <year>2013</year>
          <month>08</month>
          <volume>39</volume>
          <issue>8</issue>
          <fpage>1396</fpage>
          <lpage>404</lpage>
          <pub-id pub-id-type="doi">10.1007/s00134-013-2949-1</pub-id>
          <pub-id pub-id-type="medline">23685609</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fitzmaurice</surname>
              <given-names>GM</given-names>
            </name>
            <name name-style="western">
              <surname>Laird</surname>
              <given-names>NM</given-names>
            </name>
            <name name-style="western">
              <surname>Ware</surname>
              <given-names>JH</given-names>
            </name>
          </person-group>
          <source>Applied Longitudinal Analysis</source>
          <year>2011</year>
          <publisher-loc>Hoboken, New Jersey</publisher-loc>
          <publisher-name>Wiley</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Baraldi</surname>
              <given-names>AN</given-names>
            </name>
            <name name-style="western">
              <surname>Enders</surname>
              <given-names>CK</given-names>
            </name>
          </person-group>
          <article-title>An introduction to modern missing data analyses</article-title>
          <source>J Sch Psychol</source>
          <year>2010</year>
          <month>02</month>
          <volume>48</volume>
          <issue>1</issue>
          <fpage>5</fpage>
          <lpage>37</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jsp.2009.10.001</pub-id>
          <pub-id pub-id-type="medline">20006986</pub-id>
          <pub-id pub-id-type="pii">S0022-4405(09)00066-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Stockdale</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Royal</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Missing data as a validity threat for medical and healthcare education research: problems and solutions</article-title>
          <source>Int J Health Care</source>
          <year>2016</year>
          <month>06</month>
          <day>23</day>
          <volume>2</volume>
          <issue>2</issue>
          <pub-id pub-id-type="doi">10.5430/ijh.v2n2p67</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Myers</surname>
              <given-names>TA</given-names>
            </name>
          </person-group>
          <article-title>Goodbye, listwise deletion: presenting hot deck imputation as an easy and effective tool for handling missing data</article-title>
          <source>Communication Methods and Measures</source>
          <year>2011</year>
          <month>10</month>
          <volume>5</volume>
          <issue>4</issue>
          <fpage>297</fpage>
          <lpage>310</lpage>
          <pub-id pub-id-type="doi">10.1080/19312458.2011.624490</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pigott</surname>
              <given-names>TD</given-names>
            </name>
          </person-group>
          <article-title>A review of methods for missing data</article-title>
          <source>Educ Res Eval</source>
          <year>2001</year>
          <month>12</month>
          <day>01</day>
          <volume>7</volume>
          <issue>4</issue>
          <fpage>353</fpage>
          <lpage>383</lpage>
          <pub-id pub-id-type="doi">10.1076/edre.7.4.353.8937</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Roth</surname>
              <given-names>PL</given-names>
            </name>
          </person-group>
          <article-title>Missing data: a conceptual review for applied psychologists</article-title>
          <source>Pers Psychol</source>
          <year>1994</year>
          <volume>47</volume>
          <issue>3</issue>
          <fpage>537</fpage>
          <lpage>60</lpage>
          <pub-id pub-id-type="doi">10.1111/j.1744-6570.1994.tb01736.x</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gorelick</surname>
              <given-names>MH</given-names>
            </name>
          </person-group>
          <article-title>Bias arising from missing data in predictive models</article-title>
          <source>J Clin Epidemiol</source>
          <year>2006</year>
          <month>10</month>
          <volume>59</volume>
          <issue>10</issue>
          <fpage>1115</fpage>
          <lpage>23</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jclinepi.2004.11.029</pub-id>
          <pub-id pub-id-type="medline">16980153</pub-id>
          <pub-id pub-id-type="pii">S0895-4356(06)00264-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schulman</surname>
              <given-names>CS</given-names>
            </name>
            <name name-style="western">
              <surname>Staul</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Standards for frequency of measurement and documentation of vital signs and physical assessments</article-title>
          <source>Crit Care Nurse</source>
          <year>2010</year>
          <month>06</month>
          <volume>30</volume>
          <issue>3</issue>
          <fpage>74</fpage>
          <lpage>6</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://ccn.aacnjournals.org/cgi/pmidlookup?view=long&amp;pmid=20515885"/>
          </comment>
          <pub-id pub-id-type="doi">10.4037/ccn2010406</pub-id>
          <pub-id pub-id-type="medline">20515885</pub-id>
          <pub-id pub-id-type="pii">30/3/74</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Asiimwe</surname>
              <given-names>SB</given-names>
            </name>
            <name name-style="western">
              <surname>Okello</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Moore</surname>
              <given-names>CC</given-names>
            </name>
          </person-group>
          <article-title>Frequency of vital signs monitoring and its association with mortality among adults with severe sepsis admitted to a general medical ward in Uganda</article-title>
          <source>PLoS One</source>
          <year>2014</year>
          <volume>9</volume>
          <issue>2</issue>
          <fpage>e89879</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0089879"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0089879</pub-id>
          <pub-id pub-id-type="medline">24587094</pub-id>
          <pub-id pub-id-type="pii">PONE-D-13-40290</pub-id>
          <pub-id pub-id-type="pmcid">PMC3938537</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cardona-Morrell</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Nicholson</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hillman</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Vincent</surname>
              <given-names>JL</given-names>
            </name>
          </person-group>
          <article-title>Vital Signs: From Monitoring to Prevention of Deterioration in General Wards</article-title>
          <source>Annual Update in Intensive Care and Emergency Medicine 2015</source>
          <year>2015</year>
          <publisher-loc>Cham</publisher-loc>
          <publisher-name>Springer</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Frassica</surname>
              <given-names>JJ</given-names>
            </name>
          </person-group>
          <article-title>Frequency of laboratory test utilization in the intensive care unit and its implications for large scale data collection efforts</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2003</year>
          <fpage>844</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/14728349"/>
          </comment>
          <pub-id pub-id-type="medline">14728349</pub-id>
          <pub-id pub-id-type="pii">D030002804</pub-id>
          <pub-id pub-id-type="pmcid">PMC1480287</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>AE</given-names>
            </name>
            <name name-style="western">
              <surname>Pollard</surname>
              <given-names>TJ</given-names>
            </name>
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Lehman</surname>
              <given-names>LH</given-names>
            </name>
            <name name-style="western">
              <surname>Feng</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ghassemi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Moody</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Szolovits</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Celi</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Mark</surname>
              <given-names>RG</given-names>
            </name>
          </person-group>
          <article-title>MIMIC-III, a freely accessible critical care database</article-title>
          <source>Sci Data</source>
          <year>2016</year>
          <volume>3</volume>
          <fpage>160035</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/27219127"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/sdata.2016.35</pub-id>
          <pub-id pub-id-type="medline">27219127</pub-id>
          <pub-id pub-id-type="pii">sdata201635</pub-id>
          <pub-id pub-id-type="pmcid">PMC4878278</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Harrell</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Fabbri</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Levy</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Evaluating EHR Data Availability for Cohort Selection in Retrospective Studies</article-title>
          <year>2016</year>
          <conf-name>IEEE International Conference on Healthcare Informatics (ICHI)</conf-name>
          <conf-date>2016</conf-date>
          <conf-loc>Chicago, IL, USA</conf-loc>
          <fpage>4</fpage>
          <lpage>7</lpage>
          <pub-id pub-id-type="doi">10.1109/ICHI.2016.68</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Little</surname>
              <given-names>RJ</given-names>
            </name>
          </person-group>
          <article-title>Missing-data adjustments in large surveys</article-title>
          <source>J Bus Econ Stat</source>
          <year>1988</year>
          <month>07</month>
          <volume>6</volume>
          <issue>3</issue>
          <fpage>287</fpage>
          <lpage>296</lpage>
          <pub-id pub-id-type="doi">10.1080/07350015.1988.10509663</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>XH</given-names>
            </name>
            <name name-style="western">
              <surname>Eckert</surname>
              <given-names>GJ</given-names>
            </name>
            <name name-style="western">
              <surname>Tierney</surname>
              <given-names>WM</given-names>
            </name>
          </person-group>
          <article-title>Multiple imputation in public health research</article-title>
          <source>Stat Med</source>
          <year>2001</year>
          <volume>20</volume>
          <issue>9-10</issue>
          <fpage>1541</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="medline">11343373</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>van Buuren</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <source>Flexible Imputation of Missing Data</source>
          <year>2018</year>
          <publisher-loc>New York</publisher-loc>
          <publisher-name>Chapman and Hall/CRC</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Andridge</surname>
              <given-names>RR</given-names>
            </name>
            <name name-style="western">
              <surname>Little</surname>
              <given-names>RJ</given-names>
            </name>
          </person-group>
          <article-title>A review of hot deck imputation for survey non-response</article-title>
          <source>Int Stat Rev</source>
          <year>2010</year>
          <month>04</month>
          <volume>78</volume>
          <issue>1</issue>
          <fpage>40</fpage>
          <lpage>64</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/21743766"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/j.1751-5823.2010.00103.x</pub-id>
          <pub-id pub-id-type="medline">21743766</pub-id>
          <pub-id pub-id-type="pmcid">PMC3130338</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Abraham</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Russell</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Missing data: a review of current methods and applications in epidemiological research</article-title>
          <source>Curr Opin Psychiatr</source>
          <year>2004</year>
          <month>07</month>
          <volume>17</volume>
          <issue>4</issue>
          <fpage>315</fpage>
          <lpage>321</lpage>
          <pub-id pub-id-type="doi">10.1097/01.yco.0000133836.34543.7e</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Groenwold</surname>
              <given-names>RH</given-names>
            </name>
            <name name-style="western">
              <surname>White</surname>
              <given-names>IR</given-names>
            </name>
            <name name-style="western">
              <surname>Donders</surname>
              <given-names>AR</given-names>
            </name>
            <name name-style="western">
              <surname>Carpenter</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Altman</surname>
              <given-names>DG</given-names>
            </name>
            <name name-style="western">
              <surname>Moons</surname>
              <given-names>KG</given-names>
            </name>
          </person-group>
          <article-title>Missing covariate data in clinical research: when and when not to use the missing-indicator method for analysis</article-title>
          <source>Can Med Assoc J</source>
          <year>2012</year>
          <month>08</month>
          <day>07</day>
          <volume>184</volume>
          <issue>11</issue>
          <fpage>1265</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.cmaj.ca/cgi/pmidlookup?view=long&amp;pmid=22371511"/>
          </comment>
          <pub-id pub-id-type="doi">10.1503/cmaj.110977</pub-id>
          <pub-id pub-id-type="medline">22371511</pub-id>
          <pub-id pub-id-type="pii">cmaj.110977</pub-id>
          <pub-id pub-id-type="pmcid">PMC3414599</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Knol</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Janssen</surname>
              <given-names>KJ</given-names>
            </name>
            <name name-style="western">
              <surname>Donders</surname>
              <given-names>AR</given-names>
            </name>
            <name name-style="western">
              <surname>Egberts</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>Heerdink</surname>
              <given-names>ER</given-names>
            </name>
            <name name-style="western">
              <surname>Grobbee</surname>
              <given-names>DE</given-names>
            </name>
            <name name-style="western">
              <surname>Moons</surname>
              <given-names>KG</given-names>
            </name>
            <name name-style="western">
              <surname>Geerlings</surname>
              <given-names>MI</given-names>
            </name>
          </person-group>
          <article-title>Unpredictable bias when using the missing indicator method or complete case analysis for missing confounder values: an empirical example</article-title>
          <source>J Clin Epidemiol</source>
          <year>2010</year>
          <month>07</month>
          <volume>63</volume>
          <issue>7</issue>
          <fpage>728</fpage>
          <lpage>36</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jclinepi.2009.08.028</pub-id>
          <pub-id pub-id-type="medline">20346625</pub-id>
          <pub-id pub-id-type="pii">S0895-4356(10)00018-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Steyerberg</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <source>Clinical Prediction Models: A Practical Approach to Development, Validation, and Updating</source>
          <year>2008</year>
          <publisher-loc>New York</publisher-loc>
          <publisher-name>Springer-Verlag</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Elixhauser</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Steiner</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Harris</surname>
              <given-names>DR</given-names>
            </name>
            <name name-style="western">
              <surname>Coffey</surname>
              <given-names>RM</given-names>
            </name>
          </person-group>
          <article-title>Comorbidity measures for use with administrative data</article-title>
          <source>Med Care</source>
          <year>1998</year>
          <month>01</month>
          <volume>36</volume>
          <issue>1</issue>
          <fpage>8</fpage>
          <lpage>27</lpage>
          <pub-id pub-id-type="medline">9431328</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Charlson</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Pompei</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Ales</surname>
              <given-names>KL</given-names>
            </name>
            <name name-style="western">
              <surname>MacKenzie</surname>
              <given-names>CR</given-names>
            </name>
          </person-group>
          <article-title>A new method of classifying prognostic comorbidity in longitudinal studies: development and validation</article-title>
          <source>J Chronic Dis</source>
          <year>1987</year>
          <volume>40</volume>
          <issue>5</issue>
          <fpage>373</fpage>
          <lpage>83</lpage>
          <pub-id pub-id-type="medline">3558716</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Menendez</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Neuhaus</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>van Dijk</surname>
              <given-names>CN</given-names>
            </name>
            <name name-style="western">
              <surname>Ring</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>The Elixhauser comorbidity method outperforms the Charlson index in predicting inpatient death after orthopaedic surgery</article-title>
          <source>Clin Orthop Relat Res</source>
          <year>2014</year>
          <month>09</month>
          <volume>472</volume>
          <issue>9</issue>
          <fpage>2878</fpage>
          <lpage>86</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/24867450"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s11999-014-3686-7</pub-id>
          <pub-id pub-id-type="medline">24867450</pub-id>
          <pub-id pub-id-type="pmcid">PMC4117875</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Southern</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Quan</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Ghali</surname>
              <given-names>WA</given-names>
            </name>
          </person-group>
          <article-title>Comparison of the Elixhauser and Charlson/Deyo methods of comorbidity measurement in administrative data</article-title>
          <source>Med Care</source>
          <year>2004</year>
          <month>04</month>
          <volume>42</volume>
          <issue>4</issue>
          <fpage>355</fpage>
          <lpage>60</lpage>
          <pub-id pub-id-type="medline">15076812</pub-id>
          <pub-id pub-id-type="pii">00005650-200404000-00008</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Farley</surname>
              <given-names>JF</given-names>
            </name>
            <name name-style="western">
              <surname>Harley</surname>
              <given-names>CR</given-names>
            </name>
            <name name-style="western">
              <surname>Devine</surname>
              <given-names>JW</given-names>
            </name>
          </person-group>
          <article-title>A comparison of comorbidity measurements to predict healthcare expenditures</article-title>
          <source>Am J Manag Care</source>
          <year>2006</year>
          <month>02</month>
          <volume>12</volume>
          <issue>2</issue>
          <fpage>110</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.ajmc.com/pubMed.php?pii=3081"/>
          </comment>
          <pub-id pub-id-type="medline">16464140</pub-id>
          <pub-id pub-id-type="pii">3081</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sharabiani</surname>
              <given-names>MT</given-names>
            </name>
            <name name-style="western">
              <surname>Aylin</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Bottle</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Systematic review of comorbidity indices for administrative data</article-title>
          <source>Med Care</source>
          <year>2012</year>
          <month>12</month>
          <volume>50</volume>
          <issue>12</issue>
          <fpage>1109</fpage>
          <lpage>18</lpage>
          <pub-id pub-id-type="doi">10.1097/MLR.0b013e31825f64d0</pub-id>
          <pub-id pub-id-type="medline">22929993</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Le Gall</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Lemeshow</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Saulnier</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>A new Simplified Acute Physiology Score (SAPS II) based on a European/North American multicenter study</article-title>
          <source>J Am Med Assoc</source>
          <year>1993</year>
          <volume>270</volume>
          <issue>24</issue>
          <fpage>2957</fpage>
          <lpage>63</lpage>
          <pub-id pub-id-type="medline">8254858</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Saeys</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Inza</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Larrañaga</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>A review of feature selection techniques in bioinformatics</article-title>
          <source>Bioinformatics</source>
          <year>2007</year>
          <month>10</month>
          <day>1</day>
          <volume>23</volume>
          <issue>19</issue>
          <fpage>2507</fpage>
          <lpage>17</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://bioinformatics.oxfordjournals.org/cgi/pmidlookup?view=long&amp;pmid=17720704"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/bioinformatics/btm344</pub-id>
          <pub-id pub-id-type="medline">17720704</pub-id>
          <pub-id pub-id-type="pii">btm344</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Robnik-Sikonja</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kononenko</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Theoretical and empirical analysis of ReliefF and RReliefF</article-title>
          <source>Mach Learn</source>
          <year>2003</year>
          <volume>53</volume>
          <issue>1-2</issue>
          <fpage>23</fpage>
          <lpage>69</lpage>
          <pub-id pub-id-type="doi">10.1023/A:1025667309714</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref59">
        <label>59</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Long</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Ding</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Feature selection based on mutual information: criteria of max-dependency, max-relevance, and min-redundancy</article-title>
          <source>IEEE Trans Pattern Anal Mach Intell</source>
          <year>2005</year>
          <month>08</month>
          <volume>27</volume>
          <issue>8</issue>
          <fpage>1226</fpage>
          <lpage>38</lpage>
          <pub-id pub-id-type="doi">10.1109/TPAMI.2005.159</pub-id>
          <pub-id pub-id-type="medline">16119262</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref60">
        <label>60</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mitchell</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <source>Machine Learning</source>
          <year>1997</year>
          <publisher-loc>New York</publisher-loc>
          <publisher-name>McGraw-Hill Education</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref61">
        <label>61</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Aggarwal</surname>
              <given-names>CC</given-names>
            </name>
          </person-group>
          <source>Data Classification: Algorithms And Applications</source>
          <year>2018</year>
          <publisher-loc>New York</publisher-loc>
          <publisher-name>Chapman and Hall/CRC</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref62">
        <label>62</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Martens</surname>
              <given-names>FK</given-names>
            </name>
            <name name-style="western">
              <surname>Tonk</surname>
              <given-names>EC</given-names>
            </name>
            <name name-style="western">
              <surname>Kers</surname>
              <given-names>JG</given-names>
            </name>
            <name name-style="western">
              <surname>Janssens</surname>
              <given-names>AC</given-names>
            </name>
          </person-group>
          <article-title>Small improvement in the area under the receiver operating characteristic curve indicated small changes in predicted risks</article-title>
          <source>J Clin Epidemiol</source>
          <year>2016</year>
          <month>11</month>
          <volume>79</volume>
          <fpage>159</fpage>
          <lpage>164</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jclinepi.2016.07.002</pub-id>
          <pub-id pub-id-type="medline">27430730</pub-id>
          <pub-id pub-id-type="pii">S0895-4356(16)30194-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref63">
        <label>63</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cook</surname>
              <given-names>NR</given-names>
            </name>
          </person-group>
          <article-title>Response to letters regarding article, “use and misuse of the receiver operating characteristic curve in risk prediction”</article-title>
          <source>Circulation</source>
          <year>2007</year>
          <month>08</month>
          <day>07</day>
          <volume>116</volume>
          <issue>6</issue>
          <fpage>e134</fpage>
          <lpage>e134</lpage>
          <pub-id pub-id-type="doi">10.1161/Circulationaha.107.715359</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref64">
        <label>64</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pencina</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>D'Agostino</surname>
              <given-names>RB</given-names>
            </name>
            <name name-style="western">
              <surname>Pencina</surname>
              <given-names>KM</given-names>
            </name>
            <name name-style="western">
              <surname>Janssens</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>Greenland</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Interpreting incremental value of markers added to risk prediction models</article-title>
          <source>Am J Epidemiol</source>
          <year>2012</year>
          <month>09</month>
          <day>15</day>
          <volume>176</volume>
          <issue>6</issue>
          <fpage>473</fpage>
          <lpage>81</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/22875755"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/aje/kws207</pub-id>
          <pub-id pub-id-type="medline">22875755</pub-id>
          <pub-id pub-id-type="pii">kws207</pub-id>
          <pub-id pub-id-type="pmcid">PMC3530349</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref65">
        <label>65</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gowda</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Desai</surname>
              <given-names>PB</given-names>
            </name>
            <name name-style="western">
              <surname>Hull</surname>
              <given-names>VV</given-names>
            </name>
            <name name-style="western">
              <surname>Math</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Vernekar</surname>
              <given-names>SN</given-names>
            </name>
            <name name-style="western">
              <surname>Kulkarni</surname>
              <given-names>SS</given-names>
            </name>
          </person-group>
          <article-title>A review on laboratory liver function tests</article-title>
          <source>Pan Afr Med J</source>
          <year>2009</year>
          <month>11</month>
          <day>22</day>
          <volume>3</volume>
          <fpage>17</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.panafrican-med-journal.com/content/article/3/17/full/"/>
          </comment>
          <pub-id pub-id-type="medline">21532726</pub-id>
          <pub-id pub-id-type="pmcid">PMC2984286</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref66">
        <label>66</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wennberg</surname>
              <given-names>JE</given-names>
            </name>
          </person-group>
          <article-title>Dealing with medical practice variations: a proposal for action</article-title>
          <source>Health Aff (Millwood)</source>
          <year>1984</year>
          <volume>3</volume>
          <issue>2</issue>
          <fpage>6</fpage>
          <lpage>32</lpage>
          <pub-id pub-id-type="medline">6432667</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref67">
        <label>67</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Daniels</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Schroeder</surname>
              <given-names>SA</given-names>
            </name>
          </person-group>
          <article-title>Variation among Physicians in Use of Laboratory Tests II. Relation to Clinical Productivity and Outcomes of Care</article-title>
          <source>Med Care</source>
          <year>1977</year>
          <volume>15</volume>
          <issue>6</issue>
          <fpage>482</fpage>
          <lpage>87</lpage>
          <pub-id pub-id-type="doi">10.1097/00005650-197706000-00004</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref68">
        <label>68</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Solomon</surname>
              <given-names>DH</given-names>
            </name>
            <name name-style="western">
              <surname>Hashimoto</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Daltroy</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Liang</surname>
              <given-names>MH</given-names>
            </name>
          </person-group>
          <article-title>Techniques to improve physicians' use of diagnostic tests: a new conceptual framework</article-title>
          <source>J Am Med Assoc</source>
          <year>1998</year>
          <month>12</month>
          <day>16</day>
          <volume>280</volume>
          <issue>23</issue>
          <fpage>2020</fpage>
          <lpage>7</lpage>
          <pub-id pub-id-type="medline">9863854</pub-id>
          <pub-id pub-id-type="pii">jrv80056</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref69">
        <label>69</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sharafoddini</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Dubin</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Finding Similar Patient Subpopulations in the ICU Using Laboratory Test Ordering Patterns</article-title>
          <source>Proceedings of the 2018 7th International Conference on Bioinformatics and Biomedical Science</source>
          <year>2018</year>
          <conf-name>2018 7th International Conference on Bioinformatics and Biomedical Science</conf-name>
          <conf-date>2018</conf-date>
          <conf-loc>Shenzhen, China</conf-loc>
          <pub-id pub-id-type="doi">10.1145/3239264.3239277</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref70">
        <label>70</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>Lactate clearance is a useful biomarker for the prediction of all-cause mortality in critically ill patients: a systematic review and meta-analysis*</article-title>
          <source>Crit Care Med</source>
          <year>2014</year>
          <month>09</month>
          <volume>42</volume>
          <issue>9</issue>
          <fpage>2118</fpage>
          <lpage>25</lpage>
          <pub-id pub-id-type="doi">10.1097/CCM.0000000000000405</pub-id>
          <pub-id pub-id-type="medline">24797375</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref71">
        <label>71</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Levinson</surname>
              <given-names>AT</given-names>
            </name>
            <name name-style="western">
              <surname>Casserly</surname>
              <given-names>BP</given-names>
            </name>
            <name name-style="western">
              <surname>Levy</surname>
              <given-names>MM</given-names>
            </name>
          </person-group>
          <article-title>Reducing mortality in severe sepsis and septic shock</article-title>
          <source>Semin Respir Crit Care Med</source>
          <year>2011</year>
          <month>04</month>
          <volume>32</volume>
          <issue>2</issue>
          <fpage>195</fpage>
          <lpage>205</lpage>
          <pub-id pub-id-type="doi">10.1055/s-0031-1275532</pub-id>
          <pub-id pub-id-type="medline">21506056</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref72">
        <label>72</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Beier</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Eppanapally</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bazick</surname>
              <given-names>HS</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Mahadevappa</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Gibbons</surname>
              <given-names>FK</given-names>
            </name>
            <name name-style="western">
              <surname>Christopher</surname>
              <given-names>KB</given-names>
            </name>
          </person-group>
          <article-title>Elevation of blood urea nitrogen is predictive of long-term mortality in critically ill patients independent of “normal” creatinine</article-title>
          <source>Crit Care Med</source>
          <year>2011</year>
          <month>02</month>
          <volume>39</volume>
          <issue>2</issue>
          <fpage>305</fpage>
          <lpage>13</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/21099426"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/CCM.0b013e3181ffe22a</pub-id>
          <pub-id pub-id-type="medline">21099426</pub-id>
          <pub-id pub-id-type="pmcid">PMC3448784</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref73">
        <label>73</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cauthen</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Lipinski</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Abbate</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Appleton</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Nusca</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Varma</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Goudreau</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Cowley</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Vetrovec</surname>
              <given-names>GW</given-names>
            </name>
          </person-group>
          <article-title>Relation of blood urea nitrogen to long-term mortality in patients with heart failure</article-title>
          <source>Am J Cardiol</source>
          <year>2008</year>
          <month>06</month>
          <day>01</day>
          <volume>101</volume>
          <issue>11</issue>
          <fpage>1643</fpage>
          <lpage>7</lpage>
          <pub-id pub-id-type="doi">10.1016/j.amjcard.2008.01.047</pub-id>
          <pub-id pub-id-type="medline">18489944</pub-id>
          <pub-id pub-id-type="pii">S0002-9149(08)00256-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref74">
        <label>74</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kajimoto</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Sato</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Takano</surname>
              <given-names>T</given-names>
            </name>
            <collab>Investigators of the Acute Decompensated Heart Failure Syndromes (ATTEND) registry</collab>
          </person-group>
          <article-title>Relation between elevated blood urea nitrogen, clinical features or comorbidities, and clinical outcome in patients hospitalized for acute heart failure syndromes</article-title>
          <source>Int J Cardiol</source>
          <year>2015</year>
          <month>12</month>
          <day>15</day>
          <volume>201</volume>
          <fpage>311</fpage>
          <lpage>4</lpage>
          <pub-id pub-id-type="doi">10.1016/j.ijcard.2015.08.061</pub-id>
          <pub-id pub-id-type="medline">26301667</pub-id>
          <pub-id pub-id-type="pii">S0167-5273(15)30292-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref75">
        <label>75</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bazick</surname>
              <given-names>HS</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Mahadevappa</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Gibbons</surname>
              <given-names>FK</given-names>
            </name>
            <name name-style="western">
              <surname>Christopher</surname>
              <given-names>KB</given-names>
            </name>
          </person-group>
          <article-title>Red cell distribution width and all-cause mortality in critically ill patients</article-title>
          <source>Crit Care Med</source>
          <year>2011</year>
          <month>08</month>
          <volume>39</volume>
          <issue>8</issue>
          <fpage>1913</fpage>
          <lpage>21</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/21532476"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/CCM.0b013e31821b85c6</pub-id>
          <pub-id pub-id-type="medline">21532476</pub-id>
          <pub-id pub-id-type="pmcid">PMC4427349</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref76">
        <label>76</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hunziker</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Celi</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Howell</surname>
              <given-names>MD</given-names>
            </name>
          </person-group>
          <article-title>Red cell distribution width improves the simplified acute physiology score for risk prediction in unselected critically ill patients</article-title>
          <source>Crit Care</source>
          <year>2012</year>
          <month>05</month>
          <day>18</day>
          <volume>16</volume>
          <issue>3</issue>
          <fpage>R89</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ccforum.biomedcentral.com/articles/10.1186/cc11351"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/cc11351</pub-id>
          <pub-id pub-id-type="medline">22607685</pub-id>
          <pub-id pub-id-type="pii">cc11351</pub-id>
          <pub-id pub-id-type="pmcid">PMC3580634</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref77">
        <label>77</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Patel</surname>
              <given-names>KV</given-names>
            </name>
            <name name-style="western">
              <surname>Semba</surname>
              <given-names>RD</given-names>
            </name>
            <name name-style="western">
              <surname>Ferrucci</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Newman</surname>
              <given-names>AB</given-names>
            </name>
            <name name-style="western">
              <surname>Fried</surname>
              <given-names>LP</given-names>
            </name>
            <name name-style="western">
              <surname>Wallace</surname>
              <given-names>RB</given-names>
            </name>
            <name name-style="western">
              <surname>Bandinelli</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Phillips</surname>
              <given-names>CS</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Connelly</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Shlipak</surname>
              <given-names>MG</given-names>
            </name>
            <name name-style="western">
              <surname>Chaves</surname>
              <given-names>PH</given-names>
            </name>
            <name name-style="western">
              <surname>Launer</surname>
              <given-names>LJ</given-names>
            </name>
            <name name-style="western">
              <surname>Ershler</surname>
              <given-names>WB</given-names>
            </name>
            <name name-style="western">
              <surname>Harris</surname>
              <given-names>TB</given-names>
            </name>
            <name name-style="western">
              <surname>Longo</surname>
              <given-names>DL</given-names>
            </name>
            <name name-style="western">
              <surname>Guralnik</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>Red cell distribution width and mortality in older adults: a meta-analysis</article-title>
          <source>J Gerontol A Biol Sci Med Sci</source>
          <year>2010</year>
          <month>03</month>
          <volume>65</volume>
          <issue>3</issue>
          <fpage>258</fpage>
          <lpage>65</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/19880817"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/gerona/glp163</pub-id>
          <pub-id pub-id-type="medline">19880817</pub-id>
          <pub-id pub-id-type="pii">glp163</pub-id>
          <pub-id pub-id-type="pmcid">PMC2822283</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref78">
        <label>78</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Purtle</surname>
              <given-names>SW</given-names>
            </name>
            <name name-style="western">
              <surname>Moromizato</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>McKane</surname>
              <given-names>CK</given-names>
            </name>
            <name name-style="western">
              <surname>Gibbons</surname>
              <given-names>FK</given-names>
            </name>
            <name name-style="western">
              <surname>Christopher</surname>
              <given-names>KB</given-names>
            </name>
          </person-group>
          <article-title>The association of red cell distribution width at hospital discharge and out-of-hospital mortality following critical illness</article-title>
          <source>Crit Care Med</source>
          <year>2014</year>
          <month>04</month>
          <volume>42</volume>
          <issue>4</issue>
          <fpage>918</fpage>
          <lpage>29</lpage>
          <pub-id pub-id-type="doi">10.1097/CCM.0000000000000118</pub-id>
          <pub-id pub-id-type="medline">24448196</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref79">
        <label>79</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Şenol</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Saylam</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Kocaay</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Tez</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Red cell distribution width as a predictor of mortality in acute pancreatitis</article-title>
          <source>Am J Emerg Med</source>
          <year>2013</year>
          <month>04</month>
          <volume>31</volume>
          <issue>4</issue>
          <fpage>687</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1016/j.ajem.2012.12.015</pub-id>
          <pub-id pub-id-type="medline">23399348</pub-id>
          <pub-id pub-id-type="pii">S0735-6757(12)00654-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref80">
        <label>80</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ahn</surname>
              <given-names>SY</given-names>
            </name>
            <name name-style="western">
              <surname>Ryu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Baek</surname>
              <given-names>SH</given-names>
            </name>
            <name name-style="western">
              <surname>Han</surname>
              <given-names>JW</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Ahn</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Chin</surname>
              <given-names>HJ</given-names>
            </name>
            <name name-style="western">
              <surname>Na</surname>
              <given-names>KY</given-names>
            </name>
            <name name-style="western">
              <surname>Chae</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>KW</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Serum anion gap is predictive of mortality in an elderly population</article-title>
          <source>Exp Gerontol</source>
          <year>2014</year>
          <month>02</month>
          <volume>50</volume>
          <fpage>122</fpage>
          <lpage>7</lpage>
          <pub-id pub-id-type="doi">10.1016/j.exger.2013.12.002</pub-id>
          <pub-id pub-id-type="medline">24333141</pub-id>
          <pub-id pub-id-type="pii">S0531-5565(13)00351-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref81">
        <label>81</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>YH</given-names>
            </name>
            <name name-style="western">
              <surname>Sol</surname>
              <given-names>IS</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>SY</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>HY</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>KW</given-names>
            </name>
            <name name-style="western">
              <surname>Sohn</surname>
              <given-names>MH</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Serum anion gap at admission as a predictor of mortality in the pediatric intensive care unit</article-title>
          <source>Sci Rep</source>
          <year>2017</year>
          <month>05</month>
          <day>03</day>
          <volume>7</volume>
          <issue>1</issue>
          <fpage>1456</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.doi.org/10.1038/s41598-017-01681-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-017-01681-9</pub-id>
          <pub-id pub-id-type="medline">28469150</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-017-01681-9</pub-id>
          <pub-id pub-id-type="pmcid">PMC5431089</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref82">
        <label>82</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>SW</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Na</surname>
              <given-names>KY</given-names>
            </name>
            <name name-style="western">
              <surname>Cha</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Kang</surname>
              <given-names>SW</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>CW</given-names>
            </name>
            <name name-style="western">
              <surname>Cha</surname>
              <given-names>DR</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>SG</given-names>
            </name>
            <name name-style="western">
              <surname>Yoon</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Han</surname>
              <given-names>SY</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Lim</surname>
              <given-names>CS</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>YS</given-names>
            </name>
          </person-group>
          <article-title>Serum anion gap predicts all-cause mortality in patients with advanced chronic kidney disease: a retrospective analysis of a randomized controlled study</article-title>
          <source>PLoS One</source>
          <year>2016</year>
          <volume>11</volume>
          <issue>6</issue>
          <fpage>e0156381</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0156381"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0156381</pub-id>
          <pub-id pub-id-type="medline">27249416</pub-id>
          <pub-id pub-id-type="pii">PONE-D-16-10738</pub-id>
          <pub-id pub-id-type="pmcid">PMC4889106</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref83">
        <label>83</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sahu</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Cooper</surname>
              <given-names>HA</given-names>
            </name>
            <name name-style="western">
              <surname>Panza</surname>
              <given-names>JA</given-names>
            </name>
          </person-group>
          <article-title>The initial anion gap is a predictor of mortality in acute myocardial infarction</article-title>
          <source>Coron Artery Dis</source>
          <year>2006</year>
          <month>08</month>
          <volume>17</volume>
          <issue>5</issue>
          <fpage>409</fpage>
          <lpage>12</lpage>
          <pub-id pub-id-type="medline">16845247</pub-id>
          <pub-id pub-id-type="pii">00019501-200608000-00002</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
