<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id>
      <journal-title>JMIR Medical Informatics</journal-title>
      <issn pub-type="epub">2291-9694</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v12i1e42271</article-id>
      <article-id pub-id-type="pmid">38354033</article-id>
      <article-id pub-id-type="doi">10.2196/42271</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Improving Prediction of Survival for Extremely Premature Infants Born at 23 to 29 Weeks Gestational Age in the Neonatal Intensive Care Unit: Development and Evaluation of Machine Learning Models</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Lovis</surname>
            <given-names>Christian</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Casal-Guisande</surname>
            <given-names>Manuel</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Meza</surname>
            <given-names>Francisco</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Li</surname>
            <given-names>Angie</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Department of Biomedical Informatics</institution>
            <institution>Jacobs School of Medicine and Biomedical Sciences</institution>
            <institution>University at Buffalo</institution>
            <addr-line>77 Goodell Street</addr-line>
            <addr-line>Suite 540</addr-line>
            <addr-line>Buffalo, NY, 14203</addr-line>
            <country>United States</country>
            <phone>1 716 888 4858</phone>
            <email>ali83@buffalo.edu</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8828-7402</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Mullin</surname>
            <given-names>Sarah</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-5246-2202</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Elkin</surname>
            <given-names>Peter L</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9616-6811</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Department of Biomedical Informatics</institution>
        <institution>Jacobs School of Medicine and Biomedical Sciences</institution>
        <institution>University at Buffalo</institution>
        <addr-line>Buffalo, NY</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Angie Li <email>ali83@buffalo.edu</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2024</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>14</day>
        <month>2</month>
        <year>2024</year>
      </pub-date>
      <volume>12</volume>
      <elocation-id>e42271</elocation-id>
      <history>
        <date date-type="received">
          <day>30</day>
          <month>8</month>
          <year>2022</year>
        </date>
        <date date-type="rev-request">
          <day>17</day>
          <month>11</month>
          <year>2022</year>
        </date>
        <date date-type="rev-recd">
          <day>2</day>
          <month>2</month>
          <year>2023</year>
        </date>
        <date date-type="accepted">
          <day>28</day>
          <month>12</month>
          <year>2023</year>
        </date>
      </history>
      <copyright-statement>©Angie Li, Sarah Mullin, Peter L Elkin. Originally published in JMIR Medical Informatics (https://medinform.jmir.org), 14.02.2024.</copyright-statement>
      <copyright-year>2024</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on https://medinform.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://medinform.jmir.org/2024/1/e42271" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Infants born at extremely preterm gestational ages are typically admitted to the neonatal intensive care unit (NICU) after initial resuscitation. The subsequent hospital course can be highly variable, and despite counseling aided by available risk calculators, there are significant challenges with shared decision-making regarding life support and transition to end-of-life care. Improving predictive models can help providers and families navigate these unique challenges.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>Machine learning methods have previously demonstrated added predictive value for determining intensive care unit outcomes, and their use allows consideration of a greater number of factors that potentially influence newborn outcomes, such as maternal characteristics. Machine learning–based models were analyzed for their ability to predict the survival of extremely preterm neonates at initial admission.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>Maternal and newborn information was extracted from the health records of infants born between 23 and 29 weeks of gestation in the Medical Information Mart for Intensive Care III (MIMIC-III) critical care database. Applicable machine learning models predicting survival during the initial NICU admission were developed and compared. The same type of model was also examined using only features that would be available prepartum for the purpose of survival prediction prior to an anticipated preterm birth. Features most correlated with the predicted outcome were determined when possible for each model.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Of included patients, 37 of 459 (8.1%) expired. The resulting random forest model showed higher predictive performance than the frequently used Score for Neonatal Acute Physiology With Perinatal Extension II (SNAPPE-II) NICU model when considering extremely preterm infants of very low birth weight. Several other machine learning models were found to have good performance but did not show a statistically significant difference from previously available models in this study. Feature importance varied by model, and those of greater importance included gestational age; birth weight; initial oxygenation level; elements of the APGAR (appearance, pulse, grimace, activity, and respiration) score; and amount of blood pressure support. Important prepartum features also included maternal age, steroid administration, and the presence of pregnancy complications.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Machine learning methods have the potential to provide robust prediction of survival in the context of extremely preterm births and allow for consideration of additional factors such as maternal clinical and socioeconomic information. Evaluation of larger, more diverse data sets may provide additional clarity on comparative performance.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>reproductive informatics</kwd>
        <kwd>pregnancy complications</kwd>
        <kwd>premature birth</kwd>
        <kwd>neonatal mortality</kwd>
        <kwd>machine learning</kwd>
        <kwd>clinical decision support</kwd>
        <kwd>preterm</kwd>
        <kwd>pediatrics</kwd>
        <kwd>intensive care unit outcome</kwd>
        <kwd>health care outcome</kwd>
        <kwd>survival prediction</kwd>
        <kwd>maternal health</kwd>
        <kwd>decision tree model</kwd>
        <kwd>socioeconomic</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Preterm birth has long been a leading cause of infant mortality, with the lowest gestational age births associated with the highest rates of mortality [<xref ref-type="bibr" rid="ref1">1</xref>]. In 2019, 59,506 infants were born at 31 weeks or less in the United States, and the infant mortality rate in this cohort was 18% [<xref ref-type="bibr" rid="ref2">2</xref>]. When a patient is expected to deliver an extremely preterm infant, counseling on possible outcomes, methods of resuscitation, and anticipated course in the neonatal intensive care unit (NICU) ideally begins prior to birth. Many providers have used the National Institute of Child Health and Human Development (NICHD) risk calculator to initiate this discussion on the chances of infant mortality and severe morbidity after birth. The calculator is based on a logistic regression model using 5 prepartum factors (gestational age, estimated weight, sex, antenatal steroids, and multiple birth), derived from the preterm birth data of a network of US hospitals. With advances in NICU care and more knowledge about long-term outcomes, the calculator was updated in 2020 and maintains a similar performance (mean 0.744, SD 0.005) [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref4">4</xref>]. After initial resuscitation, several scoring systems are also available to predict mortality after a neonate arrives in the NICU [<xref ref-type="bibr" rid="ref5">5</xref>-<xref ref-type="bibr" rid="ref7">7</xref>]. However, they are less predictive with extremely low birth weight infants, as evidenced by the Score for Neonatal Acute Physiology With Perinatal Extension II (SNAPPE-II) survival model having a mean performance of 0.78 (SD 0.01) for infants weighing less than 1500 g at birth versus 0.91 (SD 0.01) overall. On review of several models, Clinical Risk Index for Babies (CRIB) had the highest performance in predicting very low birth weight neonate survival, with a mean of 0.88 (SD 0.02), although the CRIB and SNAPPE models were developed with data from geographically separate populations (Europe vs North America) [<xref ref-type="bibr" rid="ref8">8</xref>].</p>
      <p>Despite counseling supported by available risk calculators, decisions surrounding the continuation of life support and redirection to end-of-life care remain extremely difficult in the context of birth at the periviable preterm gestational ages because the postnatal course can be highly variable [<xref ref-type="bibr" rid="ref9">9</xref>-<xref ref-type="bibr" rid="ref11">11</xref>]. In addition, perceptions regarding the clinical situation can differ among providers and family members, and consideration of clinical and social context may be helpful [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>].</p>
      <p>Numerous machine learning models have been tested to improve the prediction of adult intensive care unit outcomes. The Medical Information Mart for Intensive Care III (MIMIC-III) database, which contains electronic health record (EHR) information of critical care patients at the Beth Israel Deaconess Medical Center from 2001 to 2012, has often been a source of data used in their development and testing [<xref ref-type="bibr" rid="ref14">14</xref>-<xref ref-type="bibr" rid="ref17">17</xref>]. Using the NICU data from MIMIC-III, this study builds and compares different types of machine learning algorithms that predict neonatal mortality and examines the value of incorporating features representing both structured and unstructured clinical elements for extremely preterm infants.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Ethical Considerations</title>
        <p>The institutional review board of the University at Buffalo determined the study (ID STUDY00003721) to be exempt as a secondary analysis of a publicly available data set. A data use agreement was obtained for the MIMIC-III database, which contains deidentified protected health information freely available for secondary analysis. The primary data collection for MIMIC-III was originally approved by the institutional review boards of Beth Israel Deaconess Medical Center and Massachusetts Institute of Technology with a waiver of individual patient consent, and no compensation was provided at that time.</p>
      </sec>
      <sec>
        <title>Data Selection</title>
        <p>Records of extremely preterm neonates admitted to the NICU in the MIMIC-III database were extracted using PostgreSQL (The PostgreSQL Global Development Group). A query was performed for admissions with <italic>ICD-9</italic> (<italic>International Classification of Diseases, Ninth Revision</italic>) codes corresponding to extremely preterm delivery less than 30 weeks as well as very low birth weight. From the resulting records, those of neonates born outside of 23 to 29 weeks were excluded, as well as duplicate records and readmissions. Some records corresponded to nonneonatal admissions, for example, where an infant had a prior history of preterm birth, and they were excluded. When the remaining records were reviewed, it was found that some neonates were transferred outside of the hospital for surgery and had an unknown outcome. These records were also excluded (<xref rid="figure1" ref-type="fig">Figure 1</xref>).</p>
        <p>From the 459 neonatal admission records that were selected, the patients’ demographics, vital signs, laboratory results, medications, procedures, and clinical text were queried from the database and reviewed. Of the available information, relevant elements were extracted based on factors found to be pertinent in previous scoring systems and expert knowledge. By manually curating the clinical text, including completed admission and discharge notes, we were able to incorporate features found only in unstructured form, including maternal clinical comorbidities and pregnancy complications. For this study, consideration of neonatal assessment and treatment was limited to data found initially at the time of NICU admission. The nonnumerical elements were encoded. Data that varied by clinical severity were encoded in that order, and the remaining categorical data underwent binary encoding. Median imputation was used to complete missing data.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Flowchart of selection criteria. GA: gestational age; MIMIC-III: Medical Information Mart for Intensive Care III; NICU: neonatal intensive care unit.</p>
          </caption>
          <graphic xlink:href="medinform_v12i1e42271_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>Ultimately, 83 features that could be used in machine learning algorithms were generated, of which approximately half represented maternal clinical and demographic information, with the remaining features representing infant findings at the time of admission (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p>
      </sec>
      <sec>
        <title>Model Analysis</title>
        <p>Several machine learning classification algorithms were implemented using Python 3.8 scikit-learn 1.2, and the resulting models were tested for their efficacy in predicting mortality. The same algorithms were also examined considering only prepartum features, assuming birth weight would be an estimated weight, to produce models that could be of assistance for clinicians counseling patients prior to an extremely preterm birth.</p>
        <p>The performance of each model was endeavored to be optimized. To ensure that feature value range did not drive performance, standard scaling as well as min-max scaling were applied to quantitative features and used for models that were dependent upon distance calculations (eg, logistic regression, neural network, and support vector machine [SVM]). The final reported models used standard scaling due to improved performance over min-max scaling. Scaling was not performed for models invariant to monotonic transformations, such as random forest [<xref ref-type="bibr" rid="ref18">18</xref>]. For the decision tree–based models, the hyperparameters of number of trees and maximum depth were adjusted. Number of trees began at 50 estimators and was increased by 50 until performance plateaued, which was at 250 trees with a maximum depth of 6 for the random forest method and 350 trees with a maximum depth of 5 for AdaBoost. The k value in the k-nearest neighbor algorithm was adjusted from the default value of 3 up to 20 (approximating the square root of the number of samples), and performance peaked at 4 in the final model. Because of the expected relatively small and imbalanced class sizes (8.1% in the minority class), a held-out test set was not used, and 10-fold stratified cross-validation with an 80:20 training and testing ratio was performed to ensure similar ratios across folds [<xref ref-type="bibr" rid="ref19">19</xref>]. Mean performance metrics for <italic>F</italic><sub>1</sub>-score, area under the receiver operating characteristic (AUROC), and average precision are reported, as well as log loss and Brier score, where a smaller value is ideal when considering imbalanced classification.</p>
        <p>Features most correlated with the predicted outcome were determined for the higher-performing methods. For the logistic regression model, coefficients most positively and negatively associated with mortality could be determined. For the remaining machine learning models, the most influential features were either directly queried using an available scikit-learn method or through the calculation of feature permutation importance.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <p>Of the included neonatal patients, 37 of 459 (8.1%) expired during the admission period after birth. The average length of stay for infants who survived after initial admission was 62.5 (SD 37.3) days. The average gestational age of the neonates at birth was 27 (SD 1.67) weeks, and 236 (51.4%) were male versus 223 (48.6%) female. Birth weights ranged from 365 to 2165 g, with the average birth weight being 1016 (SD 278) g, and 441 neonates were considered to have a very low birth weight (&#60;1500 g). The average maternal age was 31.4 (SD 6.02) years. In terms of race and ethnicity, the majority of the included infants were in a category considered to be White (n=278, 60.1%), followed by Black (n=69, 15%), unknown (n=42, 9.2%), other (n=25, 5.4%), Hispanic (n=25, 5.4%), Asian (n=16, 3.5%), and Native American (n=4, 0.9%; <xref ref-type="table" rid="table1">Table 1</xref>).</p>
      <table-wrap position="float" id="table1">
        <label>Table 1</label>
        <caption>
          <p>Demographics of patients whose records were included in the study.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="30"/>
          <col width="230"/>
          <col width="220"/>
          <col width="260"/>
          <col width="260"/>
          <thead>
            <tr valign="top">
              <td colspan="2">
                <break/>
              </td>
              <td>Total (N=459), n (%)</td>
              <td>Survived (n=422, 91.9%), n (%)</td>
              <td>Expired (n=37, 8.1%), n (%)</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td colspan="5">
                <bold>Gestational age (weeks)</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>23</td>
              <td>7 (1.5)</td>
              <td>2 (28.6)</td>
              <td>5 (71.4)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>24</td>
              <td>40 (8.7)</td>
              <td>28 (70)</td>
              <td>12 (30)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>25</td>
              <td>41 (8.9)</td>
              <td>36 (87.8)</td>
              <td>5 (12.2)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>26</td>
              <td>52 (11.3)</td>
              <td>49 (94.2)</td>
              <td>3 (5.8)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>27</td>
              <td>87 (19)</td>
              <td>84 (96.6)</td>
              <td>3 (3.4)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>28</td>
              <td>106 (23.1)</td>
              <td>98 (92.5)</td>
              <td>8 (7.5)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>29</td>
              <td>126 (27.5)</td>
              <td>125 (99.2)</td>
              <td>1 (0.8)</td>
            </tr>
            <tr valign="top">
              <td colspan="5">
                <bold>Sex</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Male</td>
              <td>236 (51.4)</td>
              <td>214 (90.7)</td>
              <td>22 (9.3)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Female</td>
              <td>223 (48.6)</td>
              <td>208 (93.3)</td>
              <td>15 (6.7)</td>
            </tr>
            <tr valign="top">
              <td colspan="5">
                <bold>Race</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Asian</td>
              <td>16 (3.5)</td>
              <td>15 (93.7)</td>
              <td>1 (6.3)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Black</td>
              <td>69 (15)</td>
              <td>62 (89.9)</td>
              <td>7 (10.1)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Hispanic</td>
              <td>25 (5.4)</td>
              <td>23 (92)</td>
              <td>2 (8)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Native American</td>
              <td>4 (0.9)</td>
              <td>3 (75)</td>
              <td>1 (25)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>White</td>
              <td>278 (60.1)</td>
              <td>255 (91.7)</td>
              <td>23 (8.3)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Other</td>
              <td>25 (5.4)</td>
              <td>23 (92)</td>
              <td>2 (8)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Unknown</td>
              <td>42 (9.2)</td>
              <td>41 (97.6)</td>
              <td>1 (2.4)</td>
            </tr>
            <tr valign="top">
              <td colspan="5">
                <bold>Insurance</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Private</td>
              <td>343 (74.7)</td>
              <td>311 (90.7)</td>
              <td>32 (9.3)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Government</td>
              <td>116 (25.3)</td>
              <td>113 (97.4)</td>
              <td>3 (2.6)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Uninsured</td>
              <td>2 (0.4)</td>
              <td>0 (0)</td>
              <td>2 (100)</td>
            </tr>
            <tr valign="top">
              <td colspan="5">
                <bold>Family religion</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Catholic</td>
              <td>100 (21.8)</td>
              <td>91 (91)</td>
              <td>9 (9)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Protestant</td>
              <td>24 (5.2)</td>
              <td>22 (91.7)</td>
              <td>2 (8.3)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Jewish</td>
              <td>16 (3.5)</td>
              <td>15 (93.7)</td>
              <td>1 (6.3)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Other</td>
              <td>30 (6.5)</td>
              <td>25 (83.3)</td>
              <td>5 (16.7)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Unknown</td>
              <td>289 (63)</td>
              <td>269 (93.1)</td>
              <td>20 (6.9)</td>
            </tr>
            <tr valign="top">
              <td colspan="5">
                <bold>Type of delivery</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Cesarean section</td>
              <td>356 (77.6)</td>
              <td>331 (93)</td>
              <td>25 (7)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Vaginal delivery</td>
              <td>103 (22.4)</td>
              <td>91 (88.3)</td>
              <td>12 (11.7)</td>
            </tr>
            <tr valign="top">
              <td colspan="5">
                <bold>Pregnancy type</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Singleton</td>
              <td>247 (53.8)</td>
              <td>230 (93.1)</td>
              <td>17 (6.9)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Multiple</td>
              <td>212 (46.2)</td>
              <td>192 (90.6)</td>
              <td>20 (9.4)</td>
            </tr>
            <tr valign="top">
              <td colspan="5">
                <bold>Antenatal steroids</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Received</td>
              <td>369 (80.4)</td>
              <td>347 (94)</td>
              <td>22 (6)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Partially received</td>
              <td>71 (15.5)</td>
              <td>65 (91.5)</td>
              <td>6 (8.5)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Not received</td>
              <td>19 (4.1)</td>
              <td>14 (73.7)</td>
              <td>5 (26.3)</td>
            </tr>
          </tbody>
        </table>
      </table-wrap>
      <p>Logistic regression, Naïve Bayes, k-nearest neighbor, SVM, random forest, AdaBoost, and neural network classifiers were compared for efficacy in predicting mortality (<xref rid="figure2" ref-type="fig">Figure 2</xref> and <xref ref-type="table" rid="table2">Table 2</xref>). Standard scaling transformation improved performance only for the logistic regression, SVM, and neural network methods. The random forest model had the highest predictive performance when considering overall AUROC (mean 0.91, SD 0.07), <italic>F</italic><sub>1</sub>-score (0.67), and Brier score (0.06). The AdaBoost model had the next highest AUROC (mean 0.88, SD 0.10); however, the <italic>F</italic><sub>1</sub>-score (0.45) was low due to poor precision. On the other hand, the neural network model yielded the top <italic>F</italic><sub>1</sub>-score (0.67) and Brier score (0.05) despite having a lower AUROC (mean 0.84, SD 0.16). SVM was overall next best performing model (mean 0.86, SD 0.13; <italic>F</italic><sub>1</sub>-score 0.62; Brier score 0.06), followed by logistic regression (mean 0.82, SD 0.16; <italic>F</italic><sub>1</sub>-score 0.61; Brier score 0.08). The Naïve Bayes (mean 0.74, SD 0.22; <italic>F</italic><sub>1</sub>-score 0.40; Brier score 0.25) and k-nearest neighbor (mean 0.64, SD 0.13; <italic>F</italic><sub>1</sub>-score 0.34; Brier score 0.07) methods were the worst performing.</p>
      <fig id="figure2" position="float">
        <label>Figure 2</label>
        <caption>
          <p>Receiver operating characteristic curves for the highest-performing models in <xref ref-type="table" rid="table2">Table 2</xref>. A: Logistic regression; B: SVM (support vector machine); C: Random forest; D: AdaBoost; E: Neural networks, F: Naïve Bayes; AUROC: area under the receiver operating characteristic; FP: false positive; TP: true positive.</p>
        </caption>
        <graphic xlink:href="medinform_v12i1e42271_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
      <table-wrap position="float" id="table2">
        <label>Table 2</label>
        <caption>
          <p>AUROC<sup>a</sup>, average precision, F1-score, log loss, and Brier scores for 10-fold stratified cross-validation predicting mortality using initial neonatal intensive care unit admission features (lower log loss and Brier scores are ideal when considering imbalanced classification).</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="240"/>
          <col width="200"/>
          <col width="200"/>
          <col width="120"/>
          <col width="120"/>
          <col width="120"/>
          <thead>
            <tr valign="top">
              <td>Method</td>
              <td>AUROC, mean (SD)</td>
              <td>Precision, mean (SD)</td>
              <td><italic>F</italic><sub>1</sub>-score</td>
              <td>Log loss score</td>
              <td>Brier score</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td>Logistic regression</td>
              <td>0.82 (0.16)</td>
              <td>0.55 (0.25)</td>
              <td>0.61</td>
              <td>0.35</td>
              <td>0.08</td>
            </tr>
            <tr valign="top">
              <td>SVM<sup>b</sup></td>
              <td>0.86 (0.13)</td>
              <td>0.61 (0.24)</td>
              <td>0.62</td>
              <td>0.20</td>
              <td>0.06</td>
            </tr>
            <tr valign="top">
              <td>Random forest</td>
              <td>0.91 (0.07)</td>
              <td>0.61 (0.22)</td>
              <td>0.67</td>
              <td>0.19</td>
              <td>0.06</td>
            </tr>
            <tr valign="top">
              <td>AdaBoost</td>
              <td>0.88 (0.10)</td>
              <td>0.55 (0.25)</td>
              <td>0.45</td>
              <td>0.80</td>
              <td>0.07</td>
            </tr>
            <tr valign="top">
              <td>Neural network</td>
              <td>0.84 (0.16)</td>
              <td>0.65 (0.24)</td>
              <td>0.67</td>
              <td>0.30</td>
              <td>0.05</td>
            </tr>
            <tr valign="top">
              <td>Naïve Bayes</td>
              <td>0.74 (0.22)</td>
              <td>0.39 (0.17)</td>
              <td>0.40</td>
              <td>3.90</td>
              <td>0.25</td>
            </tr>
            <tr valign="top">
              <td>K-nearest neighbor</td>
              <td>0.64 (0.13)</td>
              <td>0.24 (0.16)</td>
              <td>0.34</td>
              <td>1.74</td>
              <td>0.07</td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn id="table2fn1">
            <p><sup>a</sup>AUROC: area under the receiver operating characteristic.</p>
          </fn>
          <fn id="table2fn2">
            <p><sup>b</sup>SVM: support vector machine.</p>
          </fn>
        </table-wrap-foot>
      </table-wrap>
      <p>On post hoc chi-square analysis of the categorical variables, the factors that most influenced the outcome were insurance status, initial breathing assessment of the infant, and presence of a serious fetal anomaly (<xref ref-type="table" rid="table3">Table 3</xref>). When examining Pearson correlation of continuous variables, higher levels of ventilation and blood pressure support as well as higher arterial blood gas base deficit were properties mildly to moderately correlated with mortality. Larger gestational age, birth weight, and higher APGAR (appearance, pulse, grimace, activity, and respiration) scores at birth negatively correlated with mortality to a similar degree (<xref ref-type="table" rid="table4">Table 4</xref>).</p>
      <p>Similar features were most strongly associated with outcome in the machine learning–based models, although they varied in importance (<xref ref-type="table" rid="table5">Table 5</xref>). For example, in the random forest model, gestational age, birth weight, and initial oxygen level were of higher importance, whereas in the neural network model, initial blood pressure support and activity level were the most influential features.</p>
      <p>Evaluation of classifiers using only prepartum features, assuming birth weight as the estimated weight, also yielded the highest performance measures with the random forest method (<xref ref-type="table" rid="table6">Table 6</xref>). The random forest features that were consistently of highest importance included gestational age, weight, and maternal age (<xref ref-type="table" rid="table7">Table 7</xref>).</p>
      <table-wrap position="float" id="table3">
        <label>Table 3</label>
        <caption>
          <p>Chi-square: categorical features significantly associated with outcome.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="300"/>
          <col width="450"/>
          <col width="250"/>
          <thead>
            <tr valign="top">
              <td>Feature</td>
              <td>Description</td>
              <td>Chi-square (<italic>df</italic>)</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td>un_ins</td>
              <td>Uninsured</td>
              <td>22.8 (1)</td>
            </tr>
            <tr valign="top">
              <td>breathing1</td>
              <td>Initial breathing assessment</td>
              <td>21.4 (2)</td>
            </tr>
            <tr valign="top">
              <td>anomaly</td>
              <td>Serious fetal anomaly</td>
              <td>20.8 (1)</td>
            </tr>
            <tr valign="top">
              <td>airway1</td>
              <td>Initial type of airway or ventilation</td>
              <td>17.1 (4)</td>
            </tr>
            <tr valign="top">
              <td>religion_jehovahs</td>
              <td>Religion Jehovah’s Witness</td>
              <td>11.4 (1)</td>
            </tr>
            <tr valign="top">
              <td>twintwin</td>
              <td>Twin-twin transfusion syndrome</td>
              <td>9.4 (1)</td>
            </tr>
            <tr valign="top">
              <td>uncertain</td>
              <td>Uncertain pregnancy dating</td>
              <td>7.9 (1)</td>
            </tr>
            <tr valign="top">
              <td>religion_other</td>
              <td>Religion other</td>
              <td>4.9 (1)</td>
            </tr>
            <tr valign="top">
              <td>gov_ins</td>
              <td>Medicaid or Medicare insurance</td>
              <td>4.7 (1)</td>
            </tr>
            <tr valign="top">
              <td>muscle1</td>
              <td>Muscle tone</td>
              <td>4.6 (4)</td>
            </tr>
          </tbody>
        </table>
      </table-wrap>
      <table-wrap position="float" id="table4">
        <label>Table 4</label>
        <caption>
          <p>Pearson correlation: correlation of continuous features with mortality.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="300"/>
          <col width="450"/>
          <col width="250"/>
          <thead>
            <tr valign="top">
              <td>Feature</td>
              <td>Description</td>
              <td>Correlation</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td>FiO2_1</td>
              <td>Initial amount of oxygen ventilation</td>
              <td>0.28</td>
            </tr>
            <tr valign="top">
              <td>BD1</td>
              <td>Initial arterial blood gas base deficit</td>
              <td>0.23</td>
            </tr>
            <tr valign="top">
              <td>dopa1</td>
              <td>Initial IV<sup>a</sup> dopamine rate</td>
              <td>0.20</td>
            </tr>
            <tr valign="top">
              <td>temp1</td>
              <td>Initial temperature</td>
              <td>0.14</td>
            </tr>
            <tr valign="top">
              <td>pCO2_1</td>
              <td>Initial arterial blood gas pCO<sub>2</sub><sup>b</sup></td>
              <td>0.13</td>
            </tr>
            <tr valign="top">
              <td>G</td>
              <td>Maternal gravidity</td>
              <td>0.07</td>
            </tr>
            <tr valign="top">
              <td>P</td>
              <td>Maternal parity</td>
              <td>0.06</td>
            </tr>
            <tr valign="top">
              <td>PRBC1</td>
              <td>Initial IV blood transfusion amount</td>
              <td>0.06</td>
            </tr>
            <tr valign="top">
              <td>maternal_age</td>
              <td>Maternal age</td>
              <td>0.05</td>
            </tr>
            <tr valign="top">
              <td>gluc1</td>
              <td>Initial glucose</td>
              <td>0.03</td>
            </tr>
            <tr valign="top">
              <td>bands1</td>
              <td>Initial bands</td>
              <td>0.03</td>
            </tr>
            <tr valign="top">
              <td>multiple</td>
              <td>Number of fetuses at delivery</td>
              <td>0.02</td>
            </tr>
            <tr valign="top">
              <td>pO2_1</td>
              <td>Initial arterial blood gas pO<sub>2</sub><sup>c</sup></td>
              <td>–0.01<sup>d</sup></td>
            </tr>
            <tr valign="top">
              <td>wbc1</td>
              <td>Initial white blood cells</td>
              <td>–0.02</td>
            </tr>
            <tr valign="top">
              <td>BPmean1</td>
              <td>Initial mean blood pressure</td>
              <td>–0.04</td>
            </tr>
            <tr valign="top">
              <td>monos1</td>
              <td>Initial monocytes</td>
              <td>–0.05</td>
            </tr>
            <tr valign="top">
              <td>HR1</td>
              <td>Initial heart rate</td>
              <td>–0.05</td>
            </tr>
            <tr valign="top">
              <td>hct1</td>
              <td>Initial hematocrit</td>
              <td>–0.07</td>
            </tr>
            <tr valign="top">
              <td>neuts1</td>
              <td>Initial neutrophil count</td>
              <td>–0.07</td>
            </tr>
            <tr valign="top">
              <td>SaO2_1</td>
              <td>Initial oxygen saturation</td>
              <td>–0.20</td>
            </tr>
            <tr valign="top">
              <td>birth_wt</td>
              <td>Birth weight</td>
              <td>–0.22</td>
            </tr>
            <tr valign="top">
              <td>GA</td>
              <td>Gestational age at birth</td>
              <td>–0.32</td>
            </tr>
            <tr valign="top">
              <td>apgar1</td>
              <td>One-minute APGAR<sup>e</sup> score</td>
              <td>–0.32</td>
            </tr>
            <tr valign="top">
              <td>apgar5</td>
              <td>Five-minute APGAR score</td>
              <td>–0.35</td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn id="table4fn1">
            <p><sup>a</sup>IV: intravenous.</p>
          </fn>
          <fn id="table4fn2">
            <p><sup>b</sup>pCO<sub>2</sub>: partial pressure of carbon dioxide</p>
          </fn>
          <fn id="table4fn3">
            <p><sup>c</sup>pO<sub>2</sub>: partial pressure of oxygen.</p>
          </fn>
          <fn id="table4fn4">
            <p><sup>d</sup>Negative correlations with mortality imply a correlation with survival.</p>
          </fn>
          <fn id="table4fn5">
            <p><sup>e</sup>APGAR: appearance, pulse, grimace, activity, and respiration.</p>
          </fn>
        </table-wrap-foot>
      </table-wrap>
      <table-wrap position="float" id="table5">
        <label>Table 5</label>
        <caption>
          <p>Features of highest importance in various models, listed in order of importance. Positive and negative associations with mortality can be calculated only in logistic regression models. For the tree-based random forest and AdaBoost algorithms, an impurity-based method was used to determine overall feature importance. For the remaining algorithms, importance was found via feature permutation<sup>a</sup>.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="260"/>
          <col width="260"/>
          <col width="120"/>
          <col width="120"/>
          <col width="120"/>
          <col width="120"/>
          <thead>
            <tr valign="top">
              <td>Logistic regression: positively associated with mortality</td>
              <td>Logistic regression: negatively associated with mortality</td>
              <td>Random forest</td>
              <td>AdaBoost</td>
              <td>SVM<sup>b</sup></td>
              <td>Neural network</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td>race_hispanic</td>
              <td>GA</td>
              <td>GA</td>
              <td>neuts1</td>
              <td>activity1</td>
              <td>dopa1</td>
            </tr>
            <tr valign="top">
              <td>color1</td>
              <td>race_unk</td>
              <td>birth_wt</td>
              <td>hct1</td>
              <td>GA</td>
              <td>activity1</td>
            </tr>
            <tr valign="top">
              <td>anomaly</td>
              <td>apgar1</td>
              <td>SaO2_1</td>
              <td>SaO2_1</td>
              <td>HTN</td>
              <td>multiple</td>
            </tr>
            <tr valign="top">
              <td>race_asian</td>
              <td>gov_ins</td>
              <td>BD1</td>
              <td>wbc1</td>
              <td>anomaly</td>
              <td>uncertain</td>
            </tr>
            <tr valign="top">
              <td>un_ins</td>
              <td>activity1</td>
              <td>apgar1</td>
              <td>apgar1</td>
              <td>breathL1</td>
              <td>race_unk</td>
            </tr>
            <tr valign="top">
              <td>dopa1</td>
              <td>monos1</td>
              <td>gluc1</td>
              <td>monos1</td>
              <td>breathR1</td>
              <td>twintwin</td>
            </tr>
            <tr valign="top">
              <td>abdomen1</td>
              <td>breathL1</td>
              <td>dopa1</td>
              <td>temp1</td>
              <td>twintwin</td>
              <td>anomaly</td>
            </tr>
            <tr valign="top">
              <td>pvt_ins</td>
              <td>PRBC1</td>
              <td>apgar5</td>
              <td>HR1</td>
              <td>birth_wt</td>
              <td>muscle1</td>
            </tr>
            <tr valign="top">
              <td>multiple</td>
              <td>infert</td>
              <td>FiO2_1</td>
              <td>FiO2_1</td>
              <td>antfont1</td>
              <td>wbc1</td>
            </tr>
            <tr valign="top">
              <td>FiO2_1</td>
              <td>dm</td>
              <td>neuts</td>
              <td>bands1</td>
              <td>caprefill1</td>
              <td>abdomen1</td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn id="table5fn1">
            <p><sup>a</sup>The descriptions of variable names are present in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p>
          </fn>
          <fn id="table5fn2">
            <p><sup>b</sup>SVM: support vector machine.</p>
          </fn>
        </table-wrap-foot>
      </table-wrap>
      <table-wrap position="float" id="table6">
        <label>Table 6</label>
        <caption>
          <p>AUROC<sup>a</sup>, average precision, F1-score, log loss, and Brier scores for 10-fold stratified cross-validation predicting mortality when only prepartum features are available (lower log loss and Brier scores are ideal when considering imbalanced classification).</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="240"/>
          <col width="200"/>
          <col width="200"/>
          <col width="120"/>
          <col width="120"/>
          <col width="120"/>
          <thead>
            <tr valign="top">
              <td>Method</td>
              <td>AUROC, mean (SD)</td>
              <td>Precision, mean (SD)</td>
              <td><italic>F</italic><sub>1</sub>-score</td>
              <td>Log loss score</td>
              <td>Brier score</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td>Logistic regression</td>
              <td>0.77 (0.14)</td>
              <td>0.41 (0.18)</td>
              <td>0.51</td>
              <td>0.29</td>
              <td>0.07</td>
            </tr>
            <tr valign="top">
              <td>SVM<sup>b</sup></td>
              <td>0.76 (0.10)</td>
              <td>0.37 (0.15)</td>
              <td>0.46</td>
              <td>0.25</td>
              <td>0.07</td>
            </tr>
            <tr valign="top">
              <td>Random forest</td>
              <td>0.80 (0.14)</td>
              <td>0.54 (0.27)</td>
              <td>0.59</td>
              <td>0.22</td>
              <td>0.06</td>
            </tr>
            <tr valign="top">
              <td>AdaBoost</td>
              <td>0.75 (0.17)</td>
              <td>0.44 (0.29)</td>
              <td>0.54</td>
              <td>0.27</td>
              <td>0.07</td>
            </tr>
            <tr valign="top">
              <td>Neural network</td>
              <td>0.76 (0.11)</td>
              <td>0.44 (0.18)</td>
              <td>0.53</td>
              <td>0.31</td>
              <td>0.07</td>
            </tr>
            <tr valign="top">
              <td>Naïve Bayes</td>
              <td>0.68 (0.21)</td>
              <td>0.30 (0.11)</td>
              <td>0.19</td>
              <td>6.09</td>
              <td>0.59</td>
            </tr>
            <tr valign="top">
              <td>K-nearest neighbor</td>
              <td>0.62 (0.12)</td>
              <td>0.20 (0.12)</td>
              <td>0.30</td>
              <td>1.77</td>
              <td>0.09</td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn id="table6fn1">
            <p><sup>a</sup>AUROC: area under the receiver operating characteristic.</p>
          </fn>
          <fn id="table6fn2">
            <p><sup>b</sup>SVM: support vector machine.</p>
          </fn>
        </table-wrap-foot>
      </table-wrap>
      <table-wrap position="float" id="table7">
        <label>Table 7</label>
        <caption>
          <p>Prepartum features of highest importance in various models, listed in order of importance<sup>a</sup>.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="260"/>
          <col width="260"/>
          <col width="120"/>
          <col width="120"/>
          <col width="120"/>
          <col width="120"/>
          <thead>
            <tr valign="top">
              <td>Logistic regression: positively associated with mortality</td>
              <td>Logistic regression: negatively associated with mortality</td>
              <td>Random forest</td>
              <td>AdaBoost</td>
              <td>SVM<sup>b</sup></td>
              <td>Neural network</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td>maternal_age</td>
              <td>GA</td>
              <td>GA</td>
              <td>birth_wt</td>
              <td>GA</td>
              <td>un_ins</td>
            </tr>
            <tr valign="top">
              <td>anomaly</td>
              <td>race_unk</td>
              <td>birth_wt</td>
              <td>maternal_age</td>
              <td>steroids</td>
              <td>steroids</td>
            </tr>
            <tr valign="top">
              <td>un_ins</td>
              <td>dm</td>
              <td>maternal_age</td>
              <td>GA</td>
              <td>P</td>
              <td>HTN</td>
            </tr>
            <tr valign="top">
              <td>asthma</td>
              <td>depression</td>
              <td>anomaly</td>
              <td>G</td>
              <td>infert</td>
              <td>GA</td>
            </tr>
            <tr valign="top">
              <td>religion_jehovahs</td>
              <td>PTL</td>
              <td>G</td>
              <td>multiple</td>
              <td>G</td>
              <td>anomaly</td>
            </tr>
            <tr valign="top">
              <td>pvt_ins</td>
              <td>steroids</td>
              <td>P</td>
              <td>religion_unk</td>
              <td>uncertain</td>
              <td>twintwin</td>
            </tr>
            <tr valign="top">
              <td>race_hispanic</td>
              <td>gov_ins</td>
              <td>un_ins</td>
              <td>steroids</td>
              <td>birth_wt</td>
              <td>race_unk</td>
            </tr>
            <tr valign="top">
              <td>twintwin</td>
              <td>HTN</td>
              <td>steroids</td>
              <td>sex</td>
              <td>sex</td>
              <td>sex</td>
            </tr>
            <tr valign="top">
              <td>uncertain</td>
              <td>infert</td>
              <td>uncertain</td>
              <td>anomaly</td>
              <td>multiple</td>
              <td>P</td>
            </tr>
            <tr valign="top">
              <td>multiple</td>
              <td>P</td>
              <td>twintwin</td>
              <td>P</td>
              <td>anomaly</td>
              <td>SVD</td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn id="table7fn1">
            <p><sup>a</sup>The descriptions of variable names are present in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p>
          </fn>
          <fn id="table7fn2">
            <p><sup>b</sup>SVM: support vector machine.</p>
          </fn>
        </table-wrap-foot>
      </table-wrap>
      <p>Several of the important features found in the top-performing models were among those manually curated in unstructured form, including the presence of maternal hypertensive disease and diabetes, uncertain pregnancy dating (uncertain), fetal anomaly (anomaly), and twin-twin transfusion syndrome.</p>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>There is a potential for existing risk calculators to be outperformed by tree-based machine learning algorithms, as indicated by the higher performance of our random forest model versus SNAPPE-II in the context of extremely premature or very low birth weight infants (in fact AUROC increased to mean 0.92, SD 0.05 when only the neonates &#60;1500 g were considered in the random forest model to directly compare to SNAPPE-II). Performance difference compared with CRIB is inconclusive, however. In terms of estimating neonatal mortality prior to preterm birth, although the point estimates of several of the machine learning algorithms using additional features extracted from the EHR were higher than that of the NICHD calculator, overlapping CIs preclude any conclusion about significant differences in performance.</p>
      </sec>
      <sec>
        <title>Comparison to Prior Work</title>
        <p>Examination of prior work further points to the importance of using data available from the EHR, including unstructured health data. For example, the relatively high-performing CRIB score includes the presence of fetal malformation as a variable. Saria et al [<xref ref-type="bibr" rid="ref20">20</xref>] incorporated signal processing of short-term time series data from neonatal vital sign sensors to produce a model classifying infants at high risk for severe morbidity or mortality. To maintain accuracy over time, Meadow et al [<xref ref-type="bibr" rid="ref11">11</xref>] proposed a longitudinal NICU survival model combining adverse events, imaging report information, and caretaker intuition. Hamilton et al [<xref ref-type="bibr" rid="ref21">21</xref>] more recently applied tree-based machine learning in the context of preterm birth to determine clusters of pregnancy characteristics that were at the highest risk for severe neonatal morbidity or mortality.</p>
      </sec>
      <sec>
        <title>Strengths and Limitations</title>
        <p>This study is limited by a small data set with data from a single institution, which in turn limits the ability to establish statistical significance in performance differences and the variety of machine learning methods that can be examined. Because of the retrospective nature of the study, there is less control over the format of the data and the amount of missing data. Although a single-institution data set is usually considered a limitation, Rysavy et al [<xref ref-type="bibr" rid="ref4">4</xref>] emphasized that extremely preterm neonatal outcomes are significantly influenced by the hospital of birth and suggested maintaining ongoing and updated prediction models from outcomes within hospital systems. Using machine learning would be ideal for this task, allowing for consideration of a number of features retrievable from the EHR with a high tolerance for missing or outlier data as the volume of data increases. Tree-based machine learning algorithms may be additionally advantageous due to their ability to iteratively combine numerous weakly predictive features into stronger predictors.</p>
        <p>Knowledge of the most influential features, which was possible to visualize in the majority of the presented models, provides transparency. Understanding which factors contribute most to the prediction of outcomes in a model can help clinical providers derive greater intuition regarding how applicable the model is to a particular patient.</p>
        <p>The inclusion of maternal information and pregnancy characteristics found in unstructured form in the MIMIC-III database allowed for consideration of factors beyond the numerical neonatal data. Some of these additional variables, such as the presence of fetal anomalies or twin-twin transfusion syndrome, were found to be of high importance in several top-performing models, especially in those used in the prepartum period prior to an anticipated extremely preterm delivery. This illustrates that machine learning–based models could potentially be helpful for continuity of care, starting in the prepartum timeframe with ongoing predictive ability after birth. Maternal demographic information had an influence on mortality prediction in some of the higher-performing models but not others. Although demographic data can provide additional knowledge of social context, unintended bias can also be introduced into the resulting model [<xref ref-type="bibr" rid="ref22">22</xref>].</p>
      </sec>
      <sec>
        <title>Future Directions</title>
        <p>Future work anticipates further evaluation of these methods on larger, more diverse data sets to determine if there is a significant and reproducible performance advantage. Expanding the study to include additional data would also allow the evaluation of more powerful machine learning methods such as deep learning methods. Eventually, the maintenance of a more representative and up-to-date cohort for training could potentially be accomplished via collaborative or federated learning techniques across institutions [<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref23">23</xref>]. To address the possibility of algorithmic bias, further work could include a comparison of prediction results using models with and without protected demographic features and a calculation of the level of discrimination that could result. Assessment of more data from underrepresented groups may also aid in producing increasingly accurate and less discriminatory models [<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref25">25</xref>].</p>
        <p>In this study, unstructured information was manually extracted from admission and discharge notes in the MIMIC-III database and allowed for consideration of additional relevant features in our models. This suggests that the use of natural language processing to better understand clinical context may further improve the prediction of outcomes of extremely preterm births. As automated natural language processing of clinical notes becomes more mature and prevalent, the use of these features gleaned from unstructured EHR data will be increasingly applicable [<xref ref-type="bibr" rid="ref26">26</xref>].</p>
        <p>Additional potential future directions include integrating with or adding functionalities found in other intensive care unit models, such as time series modeling, and predicting outcomes other than mortality, such as the development of comorbidities, discharge location, length of stay, and likelihood of readmission.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>This study examined machine learning models produced from the MIMIC-III NICU data set and their predictive ability in the clinically challenging situation of extremely preterm birth. The tree-based random forest model was found to have higher performance than the SNAPPE-II model when predicting the survival of extremely preterm infants of very low birth weight. Several other models, including those using only features that would be known prepartum, also appeared to have good predictive performance but failed to show a statistically significant difference from prior models. Features of highest importance in these models were explored and included traditional variables, such as gestational age and birth weight, but also information that may be found in unstructured form in the EHR. Evaluation of these and even more advanced machine learning methods on larger data sets may offer further clarity about performance differences, and natural language processing techniques would allow for greater use of unstructured clinical information.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Categorical and continuous features.</p>
        <media xlink:href="medinform_v12i1e42271_app1.docx" xlink:title="DOCX File , 21 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>TRIPOD checklist for model development.</p>
        <media xlink:href="medinform_v12i1e42271_app2.pdf" xlink:title="PDF File  (Adobe PDF File), 825 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">APGAR</term>
          <def>
            <p>appearance, pulse, grimace, activity, and respiration</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">AUROC</term>
          <def>
            <p>area under the receiver operating characteristic</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">CRIB</term>
          <def>
            <p>Clinical Risk Index for Babies</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">EHR</term>
          <def>
            <p>electronic health record</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">
            <italic>ICD-9</italic>
          </term>
          <def>
            <p>
              <italic>International Classification of Diseases, Ninth Revision</italic>
            </p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">MIMIC-III</term>
          <def>
            <p>Medical Information Mart for Intensive Care III</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">NICHD</term>
          <def>
            <p>National Institute of Child Health and Human Development</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">NICU</term>
          <def>
            <p>neonatal intensive care unit</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">SNAPPE-II</term>
          <def>
            <p>Score for Neonatal Acute Physiology With Perinatal Extension II</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">SVM</term>
          <def>
            <p>support vector machine</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This work was supported by a National Institutes of Health National Library of Medicine training grant (T15 LM012495-02). Generative artificial intelligence was not used in any portion of the paper writing.</p>
    </ack>
    <notes>
      <sec>
        <title>Data Availability</title>
        <p>The data sets analyzed in this study are available in the Medical Information Mart for Intensive Care III (MIMIC-III) Clinical Database [<xref ref-type="bibr" rid="ref14">14</xref>].</p>
      </sec>
    </notes>
    <fn-group>
      <fn fn-type="con">
        <p>AL and PLE conceptualized study methodology. AL and SM participated in data curation, statistical analysis, and writing. All authors reviewed the final paper.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Stoll</surname>
              <given-names>BJ</given-names>
            </name>
            <name name-style="western">
              <surname>Hansen</surname>
              <given-names>NI</given-names>
            </name>
            <name name-style="western">
              <surname>Bell</surname>
              <given-names>EF</given-names>
            </name>
            <name name-style="western">
              <surname>Walsh</surname>
              <given-names>MC</given-names>
            </name>
            <name name-style="western">
              <surname>Carlo</surname>
              <given-names>WA</given-names>
            </name>
            <name name-style="western">
              <surname>Shankaran</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Laptook</surname>
              <given-names>AR</given-names>
            </name>
            <name name-style="western">
              <surname>Sánchez</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Van Meurs</surname>
              <given-names>KP</given-names>
            </name>
            <name name-style="western">
              <surname>Wyckoff</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Das</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hale</surname>
              <given-names>EC</given-names>
            </name>
            <name name-style="western">
              <surname>Ball</surname>
              <given-names>MB</given-names>
            </name>
            <name name-style="western">
              <surname>Newman</surname>
              <given-names>NS</given-names>
            </name>
            <name name-style="western">
              <surname>Schibler</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Poindexter</surname>
              <given-names>BB</given-names>
            </name>
            <name name-style="western">
              <surname>Kennedy</surname>
              <given-names>KA</given-names>
            </name>
            <name name-style="western">
              <surname>Cotten</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Watterberg</surname>
              <given-names>KL</given-names>
            </name>
            <name name-style="western">
              <surname>D'Angio</surname>
              <given-names>CT</given-names>
            </name>
            <name name-style="western">
              <surname>DeMauro</surname>
              <given-names>SB</given-names>
            </name>
            <name name-style="western">
              <surname>Truog</surname>
              <given-names>WE</given-names>
            </name>
            <name name-style="western">
              <surname>Devaskar</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Higgins</surname>
              <given-names>RD</given-names>
            </name>
          </person-group>
          <article-title>Trends in care practices, morbidity, and mortality of extremely preterm neonates, 1993-2012</article-title>
          <source>JAMA</source>
          <year>2015</year>
          <volume>314</volume>
          <issue>10</issue>
          <fpage>1039</fpage>
          <lpage>1051</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/26348753"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jama.2015.10244</pub-id>
          <pub-id pub-id-type="medline">26348753</pub-id>
          <pub-id pub-id-type="pii">2434683</pub-id>
          <pub-id pub-id-type="pmcid">PMC4787615</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ely</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Driscoll</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Infant mortality in the United States, 2019: data from the period linked birth/infant death file</article-title>
          <source>Natl Vital Stat Rep</source>
          <year>2021</year>
          <volume>70</volume>
          <issue>14</issue>
          <fpage>1</fpage>
          <lpage>17</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://stacks.cdc.gov/view/cdc/111053"/>
          </comment>
          <pub-id pub-id-type="doi">10.15620/cdc:111053</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dance</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Survival of the littlest: the long-term impacts of being born extremely early</article-title>
          <source>Nature</source>
          <year>2020</year>
          <volume>582</volume>
          <issue>7810</issue>
          <fpage>20</fpage>
          <lpage>23</lpage>
          <pub-id pub-id-type="doi">10.1038/d41586-020-01517-z</pub-id>
          <pub-id pub-id-type="medline">32488165</pub-id>
          <pub-id pub-id-type="pii">10.1038/d41586-020-01517-z</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rysavy</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Horbar</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Bell</surname>
              <given-names>EF</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Greenberg</surname>
              <given-names>LT</given-names>
            </name>
            <name name-style="western">
              <surname>Tyson</surname>
              <given-names>JE</given-names>
            </name>
            <name name-style="western">
              <surname>Patel</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Carlo</surname>
              <given-names>WA</given-names>
            </name>
            <name name-style="western">
              <surname>Younge</surname>
              <given-names>NE</given-names>
            </name>
            <name name-style="western">
              <surname>Green</surname>
              <given-names>CE</given-names>
            </name>
            <name name-style="western">
              <surname>Edwards</surname>
              <given-names>EM</given-names>
            </name>
            <name name-style="western">
              <surname>Hintz</surname>
              <given-names>SR</given-names>
            </name>
            <name name-style="western">
              <surname>Walsh</surname>
              <given-names>MC</given-names>
            </name>
            <name name-style="western">
              <surname>Buzas</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Das</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Higgins</surname>
              <given-names>RD</given-names>
            </name>
          </person-group>
          <article-title>Assessment of an updated neonatal research network extremely preterm birth outcome model in the Vermont Oxford Network</article-title>
          <source>JAMA Pediatr</source>
          <year>2020</year>
          <volume>174</volume>
          <issue>5</issue>
          <fpage>e196294</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32119065"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jamapediatrics.2019.6294</pub-id>
          <pub-id pub-id-type="medline">32119065</pub-id>
          <pub-id pub-id-type="pii">2761306</pub-id>
          <pub-id pub-id-type="pmcid">PMC7052789</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Richardson</surname>
              <given-names>DK</given-names>
            </name>
            <name name-style="western">
              <surname>Corcoran</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Escobar</surname>
              <given-names>GJ</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>SK</given-names>
            </name>
          </person-group>
          <article-title>SNAP-II and SNAPPE-II: simplified newborn illness severity and mortality risk scores</article-title>
          <source>J Pediatr</source>
          <year>2001</year>
          <volume>138</volume>
          <issue>1</issue>
          <fpage>92</fpage>
          <lpage>100</lpage>
          <pub-id pub-id-type="doi">10.1067/mpd.2001.109608</pub-id>
          <pub-id pub-id-type="medline">11148519</pub-id>
          <pub-id pub-id-type="pii">S0022347601516017</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Parry</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Tucker</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Tarnow-Mordi</surname>
              <given-names>W</given-names>
            </name>
            <collab>UK Neonatal Staffing Study Collaborative Group</collab>
          </person-group>
          <article-title>CRIB II: an update of the clinical risk index for babies score</article-title>
          <source>Lancet</source>
          <year>2003</year>
          <volume>361</volume>
          <issue>9371</issue>
          <fpage>1789</fpage>
          <lpage>1791</lpage>
          <pub-id pub-id-type="doi">10.1016/S0140-6736(03)13397-1</pub-id>
          <pub-id pub-id-type="medline">12781540</pub-id>
          <pub-id pub-id-type="pii">S0140-6736(03)13397-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Groenendaal</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>de Vos</surname>
              <given-names>MC</given-names>
            </name>
            <name name-style="western">
              <surname>Derks</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Mulder</surname>
              <given-names>EJH</given-names>
            </name>
          </person-group>
          <article-title>Improved SNAPPE-II and CRIB II scores over a 15-year period</article-title>
          <source>J Perinatol</source>
          <year>2017</year>
          <volume>37</volume>
          <issue>5</issue>
          <fpage>547</fpage>
          <lpage>551</lpage>
          <pub-id pub-id-type="doi">10.1038/jp.2016.276</pub-id>
          <pub-id pub-id-type="medline">28125092</pub-id>
          <pub-id pub-id-type="pii">jp2016276</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>McLeod</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Menon</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Matusko</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Weiner</surname>
              <given-names>GM</given-names>
            </name>
            <name name-style="western">
              <surname>Gadepalli</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Barks</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Mychaliska</surname>
              <given-names>GB</given-names>
            </name>
            <name name-style="western">
              <surname>Perrone</surname>
              <given-names>EE</given-names>
            </name>
          </person-group>
          <article-title>Comparing mortality risk models in VLBW and preterm infants: systematic review and meta-analysis</article-title>
          <source>J Perinatol</source>
          <year>2020</year>
          <volume>40</volume>
          <issue>5</issue>
          <fpage>695</fpage>
          <lpage>703</lpage>
          <pub-id pub-id-type="doi">10.1038/s41372-020-0650-0</pub-id>
          <pub-id pub-id-type="medline">32203174</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41372-020-0650-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Andrews</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Myers</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Lagatta</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Meadow</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>A comparison of prenatal and postnatal models to predict outcomes at the border of viability</article-title>
          <source>J Pediatr</source>
          <year>2016</year>
          <volume>173</volume>
          <fpage>96</fpage>
          <lpage>100</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jpeds.2016.02.042</pub-id>
          <pub-id pub-id-type="medline">26995702</pub-id>
          <pub-id pub-id-type="pii">S0022-3476(16)00264-X</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dupont-Thibodeau</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Barrington</surname>
              <given-names>KJ</given-names>
            </name>
            <name name-style="western">
              <surname>Farlow</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Janvier</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>End-of-life decisions for extremely low-gestational-age infants: why simple rules for complicated decisions should be avoided</article-title>
          <source>Semin Perinatol</source>
          <year>2014</year>
          <volume>38</volume>
          <issue>1</issue>
          <fpage>31</fpage>
          <lpage>37</lpage>
          <pub-id pub-id-type="doi">10.1053/j.semperi.2013.07.006</pub-id>
          <pub-id pub-id-type="medline">24468567</pub-id>
          <pub-id pub-id-type="pii">S0146-0005(13)00105-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Meadow</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Lagatta</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Andrews</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Lantos</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>The mathematics of morality for neonatal resuscitation</article-title>
          <source>Clin Perinatol</source>
          <year>2012</year>
          <volume>39</volume>
          <issue>4</issue>
          <fpage>941</fpage>
          <lpage>956</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/23164189"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.clp.2012.09.013</pub-id>
          <pub-id pub-id-type="medline">23164189</pub-id>
          <pub-id pub-id-type="pii">S0095-5108(12)00109-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC4506790</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hellmann</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Knighton</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>PS</given-names>
            </name>
            <collab>Canadian Neonatal Network End of Life Study Group</collab>
          </person-group>
          <article-title>Neonatal deaths: prospective exploration of the causes and process of end-of-life decisions</article-title>
          <source>Arch Dis Child Fetal Neonatal Ed</source>
          <year>2016</year>
          <volume>101</volume>
          <issue>2</issue>
          <fpage>F102</fpage>
          <lpage>F107</lpage>
          <pub-id pub-id-type="doi">10.1136/archdischild-2015-308425</pub-id>
          <pub-id pub-id-type="medline">26253166</pub-id>
          <pub-id pub-id-type="pii">archdischild-2015-308425</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Steurer</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Anderson</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Baer</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Oltman</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Franck</surname>
              <given-names>LS</given-names>
            </name>
            <name name-style="western">
              <surname>Kuppermann</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Rand</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Ryckman</surname>
              <given-names>KK</given-names>
            </name>
            <name name-style="western">
              <surname>Partridge</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Jelliffe-Pawlowski</surname>
              <given-names>LL</given-names>
            </name>
            <name name-style="western">
              <surname>Rogers</surname>
              <given-names>EE</given-names>
            </name>
          </person-group>
          <article-title>Dynamic outcome prediction in a socio-demographically diverse population-based cohort of extremely preterm neonates</article-title>
          <source>J Perinatol</source>
          <year>2017</year>
          <volume>37</volume>
          <issue>6</issue>
          <fpage>709</fpage>
          <lpage>715</lpage>
          <pub-id pub-id-type="doi">10.1038/jp.2017.9</pub-id>
          <pub-id pub-id-type="medline">28206998</pub-id>
          <pub-id pub-id-type="pii">jp20179</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>AEW</given-names>
            </name>
            <name name-style="western">
              <surname>Pollard</surname>
              <given-names>TJ</given-names>
            </name>
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Lehman</surname>
              <given-names>LWH</given-names>
            </name>
            <name name-style="western">
              <surname>Feng</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ghassemi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Moody</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Szolovits</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Celi</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Mark</surname>
              <given-names>RG</given-names>
            </name>
          </person-group>
          <article-title>MIMIC-III, a freely accessible critical care database</article-title>
          <source>Sci Data</source>
          <year>2016</year>
          <volume>3</volume>
          <fpage>160035</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.nature.com/articles/sdata201635"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/sdata.2016.35</pub-id>
          <pub-id pub-id-type="medline">27219127</pub-id>
          <pub-id pub-id-type="pii">sdata201635</pub-id>
          <pub-id pub-id-type="pmcid">PMC4878278</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Xiao</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Predictive modeling in urgent care: a comparative study of machine learning approaches</article-title>
          <source>JAMIA Open</source>
          <year>2018</year>
          <volume>1</volume>
          <issue>1</issue>
          <fpage>87</fpage>
          <lpage>98</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/31984321"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamiaopen/ooy011</pub-id>
          <pub-id pub-id-type="medline">31984321</pub-id>
          <pub-id pub-id-type="pii">ooy011</pub-id>
          <pub-id pub-id-type="pmcid">PMC6951928</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Purushotham</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Meng</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Che</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Benchmarking deep learning models on large healthcare datasets</article-title>
          <source>J Biomed Inform</source>
          <year>2018</year>
          <volume>83</volume>
          <fpage>112</fpage>
          <lpage>134</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(18)30071-6"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2018.04.007</pub-id>
          <pub-id pub-id-type="medline">29879470</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(18)30071-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Caicedo-Torres</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Gutierrez</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>ISeeU: visually interpretable deep learning for mortality prediction inside the ICU</article-title>
          <source>J Biomed Inform</source>
          <year>2019</year>
          <volume>98</volume>
          <fpage>103269</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(19)30188-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2019.103269</pub-id>
          <pub-id pub-id-type="medline">31430550</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(19)30188-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ahsan</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Mahmud</surname>
              <given-names>MAP</given-names>
            </name>
            <name name-style="western">
              <surname>Saha</surname>
              <given-names>PK</given-names>
            </name>
            <name name-style="western">
              <surname>Gupta</surname>
              <given-names>KD</given-names>
            </name>
            <name name-style="western">
              <surname>Siddique</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Effect of data scaling methods on machine learning algorithms and model performance</article-title>
          <source>Technologies</source>
          <year>2021</year>
          <volume>9</volume>
          <issue>3</issue>
          <fpage>52</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/2227-7080/9/3/52"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/technologies9030052</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pedregosa</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Varoquaux</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Gramfort</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Michel</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Thirion</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Grisel</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Blondel</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Prettenhofer</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Weiss</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Dubourg</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Vanderplas</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Passos</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Cournapeau</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Brucher</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Perrot</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Duchesnay</surname>
              <given-names>É</given-names>
            </name>
          </person-group>
          <article-title>Scikit-learn: machine learning in Python</article-title>
          <source>J Mach Learn Res</source>
          <year>2011</year>
          <volume>12</volume>
          <issue>85</issue>
          <fpage>2825</fpage>
          <lpage>2830</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmlr.org/papers/v12/pedregosa11a.html"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Saria</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Rajani</surname>
              <given-names>AK</given-names>
            </name>
            <name name-style="western">
              <surname>Gould</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Koller</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Penn</surname>
              <given-names>AA</given-names>
            </name>
          </person-group>
          <article-title>Integration of early physiological responses predicts later illness severity in preterm infants</article-title>
          <source>Sci Transl Med</source>
          <year>2010</year>
          <volume>2</volume>
          <issue>48</issue>
          <fpage>48ra65</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/20826840"/>
          </comment>
          <pub-id pub-id-type="doi">10.1126/scitranslmed.3001304</pub-id>
          <pub-id pub-id-type="medline">20826840</pub-id>
          <pub-id pub-id-type="pii">2/48/48ra65</pub-id>
          <pub-id pub-id-type="pmcid">PMC3564961</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hamilton</surname>
              <given-names>EF</given-names>
            </name>
            <name name-style="western">
              <surname>Dyachenko</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ciampi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Maurel</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Warrick</surname>
              <given-names>PA</given-names>
            </name>
            <name name-style="western">
              <surname>Garite</surname>
              <given-names>TJ</given-names>
            </name>
          </person-group>
          <article-title>Estimating risk of severe neonatal morbidity in preterm births under 32 weeks of gestation</article-title>
          <source>J Matern Fetal Neonatal Med</source>
          <year>2020</year>
          <volume>33</volume>
          <issue>1</issue>
          <fpage>73</fpage>
          <lpage>80</lpage>
          <pub-id pub-id-type="doi">10.1080/14767058.2018.1487395</pub-id>
          <pub-id pub-id-type="medline">29886760</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Crowson</surname>
              <given-names>MG</given-names>
            </name>
            <name name-style="western">
              <surname>Moukheiber</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Arévalo</surname>
              <given-names>AR</given-names>
            </name>
            <name name-style="western">
              <surname>Lam</surname>
              <given-names>BD</given-names>
            </name>
            <name name-style="western">
              <surname>Mantena</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Rana</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Goss</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Bates</surname>
              <given-names>DW</given-names>
            </name>
            <name name-style="western">
              <surname>Celi</surname>
              <given-names>LA</given-names>
            </name>
          </person-group>
          <article-title>A systematic review of federated learning applications for biomedical data</article-title>
          <source>PLOS Digit Health</source>
          <year>2022</year>
          <volume>1</volume>
          <issue>5</issue>
          <fpage>e0000033</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/36812504"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pdig.0000033</pub-id>
          <pub-id pub-id-type="medline">36812504</pub-id>
          <pub-id pub-id-type="pii">PDIG-D-22-00011</pub-id>
          <pub-id pub-id-type="pmcid">PMC9931322</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nguyen</surname>
              <given-names>TV</given-names>
            </name>
            <name name-style="western">
              <surname>Dakka</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Diakiw</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>VerMilyea</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Perugini</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hall</surname>
              <given-names>JMM</given-names>
            </name>
            <name name-style="western">
              <surname>Perugini</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>A novel decentralized federated learning approach to train on globally distributed, poor quality, and protected private medical data</article-title>
          <source>Sci Rep</source>
          <year>2022</year>
          <volume>12</volume>
          <issue>1</issue>
          <fpage>8888</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.nature.com/articles/s41598-022-12833-x"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-022-12833-x</pub-id>
          <pub-id pub-id-type="medline">35614106</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-022-12833-x</pub-id>
          <pub-id pub-id-type="pmcid">PMC9133021</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>IY</given-names>
            </name>
            <name name-style="western">
              <surname>Johansson</surname>
              <given-names>FD</given-names>
            </name>
            <name name-style="western">
              <surname>Sontag</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Why is my classifier discriminatory?</article-title>
          <year>2018</year>
          <conf-name>Proceedings of the 32nd International Conference on Neural Information Processing Systems</conf-name>
          <conf-date>December 3-8, 2018</conf-date>
          <conf-loc>Montréal, Canada</conf-loc>
          <fpage>3543</fpage>
          <lpage>3554</lpage>
          <pub-id pub-id-type="doi">10.5555/3327144.3327272</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>IY</given-names>
            </name>
            <name name-style="western">
              <surname>Pierson</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Rose</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Joshi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ferryman</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Ghassemi</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Ethical machine learning in healthcare</article-title>
          <source>Annu Rev Biomed Data Sci</source>
          <year>2021</year>
          <volume>4</volume>
          <fpage>123</fpage>
          <lpage>144</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34396058"/>
          </comment>
          <pub-id pub-id-type="doi">10.1146/annurev-biodatasci-092820-114757</pub-id>
          <pub-id pub-id-type="medline">34396058</pub-id>
          <pub-id pub-id-type="pmcid">PMC8362902</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Seinen</surname>
              <given-names>TM</given-names>
            </name>
            <name name-style="western">
              <surname>Fridgeirsson</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Ioannou</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Jeannetot</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>John</surname>
              <given-names>LH</given-names>
            </name>
            <name name-style="western">
              <surname>Kors</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Markus</surname>
              <given-names>AF</given-names>
            </name>
            <name name-style="western">
              <surname>Pera</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Rekkas</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>RD</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>van Mulligen</surname>
              <given-names>EM</given-names>
            </name>
            <name name-style="western">
              <surname>Rijnbeek</surname>
              <given-names>PR</given-names>
            </name>
          </person-group>
          <article-title>Use of unstructured text in prognostic clinical prediction models: a systematic review</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2022</year>
          <volume>29</volume>
          <issue>7</issue>
          <fpage>1292</fpage>
          <lpage>1302</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35475536"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocac058</pub-id>
          <pub-id pub-id-type="medline">35475536</pub-id>
          <pub-id pub-id-type="pii">6574714</pub-id>
          <pub-id pub-id-type="pmcid">PMC9196702</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
