<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id>
      <journal-title>JMIR Medical Informatics</journal-title>
      <issn pub-type="epub">2291-9694</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v10i5e38241</article-id>
      <article-id pub-id-type="pmid">35536634</article-id>
      <article-id pub-id-type="doi">10.2196/38241</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Predicting Postoperative Mortality With Deep Neural Networks and Natural Language Processing: Model Development and Validation</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Eysenbach</surname>
            <given-names>Gunther</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Elbattah</surname>
            <given-names>Mahmoud</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Chen</surname>
            <given-names>Pei-Fu</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff01" ref-type="aff">1</xref>
          <xref rid="aff02" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0192-5377</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Chen</surname>
            <given-names>Lichin</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff03" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-2122-1625</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Lin</surname>
            <given-names>Yow-Kuan</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff01" ref-type="aff">1</xref>
          <xref rid="aff04" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8026-5671</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Li</surname>
            <given-names>Guo-Hung</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff01" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-1803-3682</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Lai</surname>
            <given-names>Feipei</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff01" ref-type="aff">1</xref>
          <xref rid="aff05" ref-type="aff">5</xref>
          <xref rid="aff06" ref-type="aff">6</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7147-8122</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Lu</surname>
            <given-names>Cheng-Wei</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff02" ref-type="aff">2</xref>
          <xref rid="aff07" ref-type="aff">7</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-2217-3231</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Yang</surname>
            <given-names>Chi-Yu</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff08" ref-type="aff">8</xref>
          <xref rid="aff09" ref-type="aff">9</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-5793-0397</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author">
          <name name-style="western">
            <surname>Chen</surname>
            <given-names>Kuan-Chih</given-names>
          </name>
          <degrees>MD, MSc</degrees>
          <xref rid="aff01" ref-type="aff">1</xref>
          <xref rid="aff10" ref-type="aff">10</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6526-8097</ext-link>
        </contrib>
        <contrib id="contrib9" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Lin</surname>
            <given-names>Tzu-Yu</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff02" ref-type="aff">2</xref>
          <address>
            <institution>Department of Anesthesiology</institution>
            <institution>Far Eastern Memorial Hospital</institution>
            <addr-line>No 21, Sec 2, Nanya S Rd</addr-line>
            <addr-line>Banciao Dist</addr-line>
            <addr-line>New Taipei City, 220216</addr-line>
            <country>Taiwan</country>
            <fax>886 2 89665567</fax>
            <phone>886 2 89667000</phone>
            <email>drlin1971@gmail.com</email>
          </address>
          <xref rid="aff07" ref-type="aff">7</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-1374-5189</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff01">
        <label>1</label>
        <institution>Graduate Institute of Biomedical Electronics and Bioinformatics</institution>
        <institution>National Taiwan University</institution>
        <addr-line>Taipei</addr-line>
        <country>Taiwan</country>
      </aff>
      <aff id="aff02">
        <label>2</label>
        <institution>Department of Anesthesiology</institution>
        <institution>Far Eastern Memorial Hospital</institution>
        <addr-line>New Taipei City</addr-line>
        <country>Taiwan</country>
      </aff>
      <aff id="aff03">
        <label>3</label>
        <institution>Research Center for Information Technology Innovation</institution>
        <institution>Academia Sinica</institution>
        <addr-line>Taipei</addr-line>
        <country>Taiwan</country>
      </aff>
      <aff id="aff04">
        <label>4</label>
        <institution>Department of Computer Science</institution>
        <institution>Columbia University</institution>
        <addr-line>New York, NY</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff05">
        <label>5</label>
        <institution>Department of Computer Science and Information Engineering</institution>
        <institution>National Taiwan University</institution>
        <addr-line>Taipei</addr-line>
        <country>Taiwan</country>
      </aff>
      <aff id="aff06">
        <label>6</label>
        <institution>Department of Electrical Engineering</institution>
        <institution>National Taiwan University</institution>
        <addr-line>Taipei</addr-line>
        <country>Taiwan</country>
      </aff>
      <aff id="aff07">
        <label>7</label>
        <institution>Department of Mechanical Engineering</institution>
        <institution>Yuan Ze University</institution>
        <addr-line>Taoyuan</addr-line>
        <country>Taiwan</country>
      </aff>
      <aff id="aff08">
        <label>8</label>
        <institution>Department of Information Technology</institution>
        <institution>Far Eastern Memorial Hospital</institution>
        <addr-line>New Taipei City</addr-line>
        <country>Taiwan</country>
      </aff>
      <aff id="aff09">
        <label>9</label>
        <institution>Section of Cardiovascular Medicine</institution>
        <institution>Cardiovascular Center</institution>
        <institution>Far Eastern Memorial Hospital</institution>
        <addr-line>New Taipei City</addr-line>
        <country>Taiwan</country>
      </aff>
      <aff id="aff10">
        <label>10</label>
        <institution>Department of Internal Medicine</institution>
        <institution>Far Eastern Memorial Hospital</institution>
        <addr-line>New Taipei City</addr-line>
        <country>Taiwan</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Tzu-Yu Lin <email>drlin1971@gmail.com</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>5</month>
        <year>2022</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>10</day>
        <month>5</month>
        <year>2022</year>
      </pub-date>
      <volume>10</volume>
      <issue>5</issue>
      <elocation-id>e38241</elocation-id>
      <history>
        <date date-type="received">
          <day>24</day>
          <month>3</month>
          <year>2022</year>
        </date>
        <date date-type="rev-request">
          <day>14</day>
          <month>4</month>
          <year>2022</year>
        </date>
        <date date-type="rev-recd">
          <day>18</day>
          <month>4</month>
          <year>2022</year>
        </date>
        <date date-type="accepted">
          <day>26</day>
          <month>4</month>
          <year>2022</year>
        </date>
      </history>
      <copyright-statement>©Pei-Fu Chen, Lichin Chen, Yow-Kuan Lin, Guo-Hung Li, Feipei Lai, Cheng-Wei Lu, Chi-Yu Yang, Kuan-Chih Chen, Tzu-Yu Lin. Originally published in JMIR Medical Informatics (https://medinform.jmir.org), 10.05.2022.</copyright-statement>
      <copyright-year>2022</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on https://medinform.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://medinform.jmir.org/2022/5/e38241" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Machine learning (ML) achieves better predictions of postoperative mortality than previous prediction tools. Free-text descriptions of the preoperative diagnosis and the planned procedure are available preoperatively. Because reading these descriptions helps anesthesiologists evaluate the risk of the surgery, we hypothesized that deep learning (DL) models with unstructured text could improve postoperative mortality prediction. However, it is challenging to extract meaningful concept embeddings from this unstructured clinical text.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study aims to develop a fusion DL model containing structured and unstructured features to predict the in-hospital 30-day postoperative mortality before surgery. ML models for predicting postoperative mortality using preoperative data with or without free clinical text were assessed.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We retrospectively collected preoperative anesthesia assessments, surgical information, and discharge summaries of patients undergoing general and neuraxial anesthesia from electronic health records (EHRs) from 2016 to 2020. We first compared the deep neural network (DNN) with other models using the same input features to demonstrate effectiveness. Then, we combined the DNN model with bidirectional encoder representations from transformers (BERT) to extract information from clinical texts. The effects of adding text information on the model performance were compared using the area under the receiver operating characteristic curve (AUROC) and the area under the precision-recall curve (AUPRC). Statistical significance was evaluated using <italic>P</italic>&#60;.05.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>The final cohort contained 121,313 patients who underwent surgeries. A total of 1562 (1.29%) patients died within 30 days of surgery. Our BERT-DNN model achieved the highest AUROC (0.964, 95% CI 0.961-0.967) and AUPRC (0.336, 95% CI 0.276-0.402). The AUROC of the BERT-DNN was significantly higher compared to logistic regression (AUROC=0.952, 95% CI 0.949-0.955) and the American Society of Anesthesiologist Physical Status (ASAPS AUROC=0.892, 95% CI 0.887-0.896) but not significantly higher compared to the DNN (AUROC=0.959, 95% CI 0.956-0.962) and the random forest (AUROC=0.961, 95% CI 0.958-0.964). The AUPRC of the BERT-DNN was significantly higher compared to the DNN (AUPRC=0.319, 95% CI 0.260-0.384), the random forest (AUPRC=0.296, 95% CI 0.239-0.360), logistic regression (AUPRC=0.276, 95% CI 0.220-0.339), and the ASAPS (AUPRC=0.149, 95% CI 0.107-0.203).</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Our BERT-DNN model has an AUPRC significantly higher compared to previously proposed models using no text and an AUROC significantly higher compared to logistic regression and the ASAPS. This technique helps identify patients with higher risk from the surgical description text in EHRs.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>bidirectional encoder representations from transformers</kwd>
        <kwd>deep neural network</kwd>
        <kwd>natural language processing</kwd>
        <kwd>postoperative mortality prediction</kwd>
        <kwd>unstructured text</kwd>
        <kwd>machine learning</kwd>
        <kwd>preoperative medicine</kwd>
        <kwd>anesthesia</kwd>
        <kwd>prediction model</kwd>
        <kwd>anesthesiologist</kwd>
        <kwd>deep learning model</kwd>
        <kwd>electronic health record</kwd>
        <kwd>neural network</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>The prevalence of postoperative mortality is 0.5%-2.8 % in patients undergoing elective surgery [<xref ref-type="bibr" rid="ref1">1</xref>]. The risks are attributable to the patient’s condition and can be modulated with adequate evaluation and planning during surgery and anesthesia. Several tools have been developed to predict postoperative mortality, including the American College of Surgeons’ (ACS) National Surgical Quality Improvement Program (NSQIP) risk calculator, the American Society of Anesthesiologist Physical Status (ASAPS), the risk quantification index, the risk stratification index, and the preoperative score [<xref ref-type="bibr" rid="ref2">2</xref>-<xref ref-type="bibr" rid="ref5">5</xref>]. Although these classification systems consider the patient’s general condition and surgery category, preoperative vital signs and laboratory data—which are critical in predicting postoperative mortality—are not typically included [<xref ref-type="bibr" rid="ref6">6</xref>]. Moreover, a patient’s surgical information is commonly written as text in the medical record. Although reading this information helps anesthesiologists evaluate the risk of the surgery, it is difficult to include it in a classification tool. These deficiencies make it challenging to identify the small groups of patients with higher risks. Better tools for predicting postoperative mortality remain under investigation.</p>
      <p>Machine learning (ML) is widely applied to medical problems, including for predicting postoperative mortality [<xref ref-type="bibr" rid="ref6">6</xref>-<xref ref-type="bibr" rid="ref11">11</xref>]. ML models can automatically predict postoperative mortality using electronic health records (EHRs) before surgery, and they achieve a superior area under the receiver operating characteristic curve (AUROC) than previous methods [<xref ref-type="bibr" rid="ref6">6</xref>]. To stratify surgery types, previous studies have used the Current Procedural Terminology (CPT) codes or <italic>International Classification of Diseases</italic> (ICD) codes for surgical information [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref12">12</xref>]. These methods are not widely applicable, because the CPT is not implemented worldwide and ICD codes are seldom recorded before surgery. In addition, because this surgical information is written in the medical record by surgeons before surgery, using this text in models may improve the prediction of postoperative mortality.</p>
      <p>Compared to structured EHRs, unstructured clinical text requires meaningful concept embeddings to be extracted before model training, making it more challenging [<xref ref-type="bibr" rid="ref13">13</xref>]. However, including this unstructured text improves the advanced prediction of unfavorable clinical outcomes [<xref ref-type="bibr" rid="ref14">14</xref>-<xref ref-type="bibr" rid="ref16">16</xref>]. Bidirectional encoder representations from transformers (BERT) is a contextualized embedding method that preserves the distance of meanings with multihead attention [<xref ref-type="bibr" rid="ref17">17</xref>]. After pretrained on the relevant corpora and proper architecture modification, BERT extracts meaningful embeddings from clinical text [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref19">19</xref>].</p>
      <p>This study aims to develop a model to predict 30-day postoperative mortality before surgery that performs better than state-of-the-art models. Our contribution is including free (ie, unstructured) text in postoperative mortality prediction by proposing a deep neural network (DNN) model with BERT. We investigate the effectiveness of unstructured clinical texts (eg, preoperative diagnosis and proposed procedures) in predicting postoperative mortality.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Data Extraction</title>
        <p>This study aims to predict in-hospital 30-day postoperative mortality using preoperative anesthesia assessments. Data were collected from the electronic health system of the Far Eastern Memorial Hospital, a large academic medical center in Taiwan. Preoperative anesthesia assessment records and discharge summaries were included. Overall, 5 years’ worth of retrospective data were collected from January 1, 2016, to December 30, 2020. The last version of the anesthesia assessment was included for each surgery. Patients over 18 years of age who underwent at least 1 surgical procedure under general or neuraxial anesthesia were included. Cases with an ASAPS of 6 were excluded. Records lacking entry time, exit time, preoperative diagnosis, or proposed procedure text were excluded. The in-hospital 30-day postoperative mortality was defined by a discharged route of “expired” and “critical against-advice discharge” (when the patient wants to die at home) without future admission. Discharges within 30 days after surgery were identified and labeled as “true”; those occurring outside this window were marked as “false.” The end date of the testing set was November 30, 2020, 30 days before the end of the collected data, to ensure complete 30-day mortality detection (<xref rid="figure1" ref-type="fig">Figure 1</xref>).</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Flow diagram. ASAPS: American Society of Anesthesiologist Physical Status.</p>
          </caption>
          <graphic xlink:href="medinform_v10i5e38241_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Ethical Approval</title>
        <p>The Institutional Review Board of the Far Eastern Memorial Hospital approved this retrospective study and waived the requirement of informed consent (#109129-F and #110028-F).</p>
      </sec>
      <sec>
        <title>Data Description</title>
        <p>We collected 123,718 surgery results for patients aged over 18 years. After applying the exclusion criteria, a cohort of 123,515 (99.8%) patients who underwent surgeries remained. A final cohort of 121,313 (98.2%) patients was used after removing those who underwent surgeries after November 30, 2020 (<xref rid="figure1" ref-type="fig">Figure 1</xref>). The training, validation, and testing cohorts finally contained 79,324 (68.7%), 19,832 (17.2%), and 16,267 (14.1%) of 115,423 patients. Patient characteristics of the training, validation, and testing cohorts are listed in <xref ref-type="table" rid="table1">Table 1</xref>. In the overall cohort, most patients had an ASAPS of 2 or 3. Overall, 107,176 (88.5%) of patients were under general anesthesia. The most prevalent comorbidities were hypertension (n=43,391, 35.8%), followed by diabetes (n=24,314, 20.0%). A total of 1562 (1.3%), 997 (1.3%), 249 (1.3%), and 215 (1.3%) patients died within 30 days of surgery in the overall, training, validation, and testing cohorts, respectively. <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> present a summary of the laboratory data and preoperative vital signs.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Characteristics of the cohort. Categorical variables are represented as frequency (%). Continuous variables are represented as the median (25th, 75th percentile). The testing cohort was split by time between the training and validation cohorts, and those cases arising from the training and validation cohorts were removed to prevent data leakage (n=5890, 4.9%).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="320"/>
            <col width="0"/>
            <col width="150"/>
            <col width="0"/>
            <col width="150"/>
            <col width="0"/>
            <col width="130"/>
            <col width="0"/>
            <col width="220"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Feature</td>
                <td colspan="2">Training cohort (N=79,324)</td>
                <td colspan="2">Validation cohort (N=19,832)</td>
                <td colspan="2">Testing cohort (N=16,267)</td>
                <td>Overall cohort (N=121,313)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="3">Age (years), median (25th, 75th percentile)</td>
                <td colspan="2">54 (40, 66)</td>
                <td colspan="2">54 (40, 66)</td>
                <td colspan="2">53 (39, 65)</td>
                <td>55 (41, 66)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">Male sex, n (%)</td>
                <td colspan="2">40,444 (51.0)</td>
                <td colspan="2">9922 (50.0)</td>
                <td colspan="2">8101 (49.8)</td>
                <td>61,485 (50.7)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">Height (cm), median (25th, 75th percentile)</td>
                <td colspan="2">162 (157, 168)</td>
                <td colspan="2">162 (156, 168)</td>
                <td colspan="2">162 (157, 169)</td>
                <td>162 (157, 168)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">Weight (kg), median (25th, 75th percentile)</td>
                <td colspan="2">64 (56, 74)</td>
                <td colspan="2">64 (56, 74)</td>
                <td colspan="2">65 (56, 75)</td>
                <td>64 (56, 74)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">BMI, median (25th, 75th percentile)</td>
                <td colspan="2">24 (22, 27)</td>
                <td colspan="2">24 (22, 27)</td>
                <td colspan="2">24 (22, 27)</td>
                <td>24 (22, 27)</td>
              </tr>
              <tr valign="top">
                <td colspan="10">
                  <bold>ASAPS<sup>a</sup>, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>1</td>
                <td colspan="2">2925 (3.7)</td>
                <td colspan="2">739 (3.7)</td>
                <td colspan="2">660 (4.1)</td>
                <td colspan="2">4404 (3.6)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>2</td>
                <td colspan="2">54,056 (68.15)</td>
                <td colspan="2">13,549 (68.3)</td>
                <td colspan="2">11,508 (70.7)</td>
                <td colspan="2">82,588 (68.1)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>3</td>
                <td colspan="2">20,842 (26.3)</td>
                <td colspan="2">5155 (26.0)</td>
                <td colspan="2">,654 (22.5)</td>
                <td colspan="2">31,878 (26.3)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>4</td>
                <td colspan="2">1345 (1.70)</td>
                <td colspan="2">355 (1.8)</td>
                <td colspan="2">397 (2.4)</td>
                <td colspan="2">2204 (1.8)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>5</td>
                <td colspan="2">156 (0.2)</td>
                <td colspan="2">34 (0.2)</td>
                <td colspan="2">48 (0.3)</td>
                <td colspan="2">239 (0.2)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">ASA<sup>b</sup> emergency, n (%)</td>
                <td colspan="2">6379 (8.0)</td>
                <td colspan="2">1615 (8.1)</td>
                <td colspan="2">1678 (10.3)</td>
                <td>9942 (8.2)</td>
              </tr>
              <tr valign="top">
                <td colspan="10">
                  <bold>Anesthesia type, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>General</td>
                <td colspan="2">69,898 (88.3)</td>
                <td colspan="2">17,497 (88.4)</td>
                <td colspan="2">14,486 (89.2)</td>
                <td colspan="2">107,176 (88.5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Neuraxial</td>
                <td colspan="2">9297 (11.7)</td>
                <td colspan="2">2303 (11.6)</td>
                <td colspan="2">1748 (10.8)</td>
                <td colspan="2">13,929 (11.5)</td>
              </tr>
              <tr valign="top">
                <td colspan="10">
                  <bold>Emergency level of surgery, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Elective</td>
                <td colspan="2">62,226 (78.5)</td>
                <td colspan="2">15,455 (77.9)</td>
                <td colspan="2">12,000 (73.8)</td>
                <td colspan="2">94,816 (78.2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Urgent</td>
                <td colspan="2">13,800 (17.4)</td>
                <td colspan="2">3,567 (18.0)</td>
                <td colspan="2">3,356 (20.6)</td>
                <td colspan="2">21,342 (17.6)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Emergency</td>
                <td colspan="2">2849 (3.6)</td>
                <td colspan="2">708 (3.6)</td>
                <td colspan="2">801 (4.9)</td>
                <td colspan="2">4484 (3.7)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Immediate</td>
                <td colspan="2">449 (0.57)</td>
                <td colspan="2">102 (0.51)</td>
                <td colspan="2">110 (0.7)</td>
                <td colspan="2">671 (0.6)</td>
              </tr>
              <tr valign="top">
                <td colspan="10">
                  <bold>Preoperative location, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Ward</td>
                <td colspan="2">47,187 (59.5)</td>
                <td colspan="2">11,788 (59.4)</td>
                <td colspan="2">9824 (60.4)</td>
                <td colspan="2">72,045 (59.4)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Outpatient</td>
                <td colspan="2">18,386 (23.2)</td>
                <td colspan="2">4463 (22.5)</td>
                <td colspan="2">2995 (18.4)</td>
                <td colspan="2">27,830 (22.9)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Emergency department</td>
                <td colspan="2">10,083 (12.7)</td>
                <td colspan="2">2592 (13.1)</td>
                <td colspan="2">2283 (14.0)</td>
                <td colspan="2">15,247 (12.6)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Intensive care unit</td>
                <td colspan="2">3668 (4.6)</td>
                <td colspan="2">989 (5.0)</td>
                <td colspan="2">1165 (7.2)</td>
                <td colspan="2">6191 (5.1)</td>
              </tr>
              <tr valign="top">
                <td colspan="10">
                  <bold>Surgery department, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Urology</td>
                <td colspan="2">14,760 (18.6)</td>
                <td colspan="2">3630 (18.3)</td>
                <td colspan="2">2665 (16.4)</td>
                <td colspan="2">22,471 (18.5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>General</td>
                <td colspan="2">11,416 (14.4)</td>
                <td colspan="2">2926 (14.8)</td>
                <td colspan="2">2457 (15.1)</td>
                <td colspan="2">17,608 (14.5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Orthopedics</td>
                <td colspan="2">10,976 (13.8)</td>
                <td colspan="2">2748 (13.9)</td>
                <td colspan="2">2338 (14.4)</td>
                <td colspan="2">16,772 (13.8)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Gynecology<sup>c</sup></td>
                <td colspan="2">10,206 (12.9)</td>
                <td colspan="2">2,578 (13.0)</td>
                <td colspan="2">2,302 (14.2)</td>
                <td colspan="2">15,679 (12.9)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Cardiovascular</td>
                <td colspan="2">8692 (11.0)</td>
                <td colspan="2">2086 (10.5)</td>
                <td colspan="2">1491 (9.2)</td>
                <td colspan="2">13,049 (10.8)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Otolaryngology</td>
                <td colspan="2">6193 (7.8)</td>
                <td colspan="2">1505 (7.6)</td>
                <td colspan="2">1223 (7.5)</td>
                <td colspan="2">9427 (7.8)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Plastic surgery</td>
                <td colspan="2">5116 (6.5)</td>
                <td colspan="2">1294 (6.5)</td>
                <td colspan="2">1077 (6.6)</td>
                <td colspan="2">7821 (6.4)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Neurosurgery</td>
                <td colspan="2">3233 (4.1)</td>
                <td colspan="2">833 (4.2)</td>
                <td colspan="2">727 (4.5)</td>
                <td colspan="2">4955 (4.1)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Traumatology</td>
                <td colspan="2">2808 (3.5)</td>
                <td colspan="2">740 (3.7)</td>
                <td colspan="2">722 (4.4)</td>
                <td colspan="2">4357 (3.6)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Thoracic surgery</td>
                <td colspan="2">2006 (2.5)</td>
                <td colspan="2">514 (2.6)</td>
                <td colspan="2">430 (2.6)</td>
                <td colspan="2">3104 (2.6)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Colorectal surgery</td>
                <td colspan="2">1679 (2.1)</td>
                <td colspan="2">423 (2.1)</td>
                <td colspan="2">331 (2.0)</td>
                <td colspan="2">2574 (2.1)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Others</td>
                <td colspan="2">2239 (2.8)</td>
                <td colspan="2">555 (2.8)</td>
                <td colspan="2">504 (3.1)</td>
                <td colspan="2">3496 (2.9)</td>
              </tr>
              <tr valign="top">
                <td colspan="10">
                  <bold>Comorbidity, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Diabetes mellitus</td>
                <td colspan="2">15,906 (20.1)</td>
                <td colspan="2">3863 (19.5)</td>
                <td colspan="2">2812 (17.3)</td>
                <td colspan="2">24,314 (20.0)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Hyperlipidemia</td>
                <td colspan="2">8704 (11.0)</td>
                <td colspan="2">2119 (10.7)</td>
                <td colspan="2">1740 (10.7)</td>
                <td colspan="2">13,678 (11.3)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Hypertension</td>
                <td colspan="2">28,462 (35.9)</td>
                <td colspan="2">7055 (35.6)</td>
                <td colspan="2">4999 (30.7)</td>
                <td colspan="2">43,391 (35.8)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Prior cerebrovascular accident</td>
                <td colspan="2">4355 (5.5)</td>
                <td colspan="2">1028 (5.2)</td>
                <td colspan="2">717 (4.4)</td>
                <td colspan="2">6564 (5.4)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Cardiac disease</td>
                <td colspan="2">13,215 (16.7)</td>
                <td colspan="2">3254 (16.4)</td>
                <td colspan="2">2227 (13.7)</td>
                <td colspan="2">20,156 (16.6)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Chronic obstructive pulmonary disease</td>
                <td colspan="2">1549 (2.0)</td>
                <td colspan="2">380 (1.9)</td>
                <td colspan="2">286 (1.8)</td>
                <td colspan="2">2428 (2.0)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Asthma</td>
                <td colspan="2">3024 (3.8)</td>
                <td colspan="2">762 (3.8)</td>
                <td colspan="2">592 (3.6)</td>
                <td colspan="2">4626 (3.8)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Hepatic disease</td>
                <td colspan="2">9118 (11.5)</td>
                <td colspan="2">2299 (11.6)</td>
                <td colspan="2">1664 (10.2)</td>
                <td colspan="2">13,887 (11.4)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Renal disease</td>
                <td colspan="2">12,471 (15.7)</td>
                <td colspan="2">3095 (15.6)</td>
                <td colspan="2">1466 (9.0)</td>
                <td colspan="2">18,874 (15.6)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Bleeding disorder</td>
                <td colspan="2">11,243 (14.2)</td>
                <td colspan="2">2684 (13.5)</td>
                <td colspan="2">2122 (13.0)</td>
                <td colspan="2">17,543 (14.5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Prior major operations</td>
                <td colspan="2">54,356 (68.5)</td>
                <td colspan="2">13,592 (68.5)</td>
                <td colspan="2">10,040 (61.7)</td>
                <td colspan="2">83,490 (68.8)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Smoking</td>
                <td colspan="2">20,235 (25.5)</td>
                <td colspan="2">5098 (25.7)</td>
                <td colspan="2">3719 (22.9)</td>
                <td colspan="2">30,433 (25.1)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Drug allergy</td>
                <td colspan="2">11,662 (14.7)</td>
                <td colspan="2">2959 (14.9)</td>
                <td colspan="2">2190 (13.5)</td>
                <td colspan="2">18,092 (14.9)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Consciousness</td>
                <td colspan="2">69,858 (88.1)</td>
                <td colspan="2">17,461 (88.0)</td>
                <td colspan="2">15,107 (92.9)</td>
                <td colspan="2">107,906 (88.9)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">30-day mortality, n (%)</td>
                <td colspan="2">997 (1.3)</td>
                <td colspan="2">249 (1.3)</td>
                <td colspan="2">215 (1.3)</td>
                <td>1562 (1.3)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>ASAPS: American Society of Anesthesiologist Physical Status.</p>
            </fn>
            <fn id="table1fn2">
              <p><sup>b</sup>ASA: American Society of Anesthesiologists.</p>
            </fn>
            <fn id="table1fn3">
              <p><sup>c</sup>The gynecology department consists of gynecology and obstetrics.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Data Preparation</title>
        <p>The input features included patient characteristics (age, height, weight, BMI, sex, ASAPS, ASA emergency status, department, preoperative location, and anesthesia type), surgery characteristics (emergency level, preoperative diagnosis, and proposed procedure), comorbidities (diabetes mellitus, hyperlipidemia, hypertension, cerebrovascular accident, cardiac disease, chronic obstructive pulmonary disease, asthma, hepatic disease, renal disease, bleeding disorder, major operations, smoking, and drug allergy), preoperative laboratory data (hemoglobin, platelet, international normalized ratio, prothrombin time, activated partial thromboplastin time, creatinine, aspartate transaminase, alanine transaminase, blood sugar, serum sodium, and serum potassium), and preoperative vital signs (body temperature, oxygen saturation, heart rate, respiratory rate, systolic and diastolic blood pressure, and consciousness status); see <xref ref-type="table" rid="table2">Table 2</xref>.</p>
        <p>Continuous features (eg, age, height, weight, latest laboratory data before surgery, and preoperative vital signs) were standardized by subtracting the mean and scaling to variance. Outliers were regarded as input errors and treated as missing data. <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref> lists the definitions of the outliers. Missing values were imputed with the median value of the data set for continuous features.</p>
        <p>Categorical features with only 2 classes (eg, sex, comorbidities, ASA emergency status, and consciousness status) were converted into binary encoding. All other categorical features (eg, ASAPS [5 classes], department [22 classes], emergency level [4 classes], preoperative location [4 classes], and anesthesia type [4 classes]) were transformed into one-hot encodings. Missing data were imputed with the majority category of the training data set. The preoperative diagnoses and proposed procedures were expressed as free text. Characters other than alphabetical and numerical ones were removed (eg, Chinese characters [typically notes for colleagues only] and punctuation). English stop words providing no helpful information to the model (eg, “a,” “in,” and “the”) were removed using the Natural Language Toolkit [<xref ref-type="bibr" rid="ref20">20</xref>].</p>
        <p>We used the previous 4 years’ surgery results to predict the last year results. Patients who underwent surgeries between January 1, 2016, and December 31, 2019, were selected and split into training and validation sets in a 4:1 ratio; those who underwent surgeries between January 1, 2020, and November 30, 2020, were selected as the testing set (<xref rid="figure1" ref-type="fig">Figure 1</xref>). Patients in the training or validation set were removed from the testing set to prevent information leakage [<xref ref-type="bibr" rid="ref6">6</xref>].</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Feature groups included in the models.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="180"/>
            <col width="790"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Feature type</td>
                <td>Feature classes<sup>a</sup></td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="3">
                  <bold>Patient characteristics</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Continuous</td>
                <td>Age, height, weight, BMI</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Categorical</td>
                <td>Sex (2), ASAPS<sup>b</sup> (5), ASA<sup>c</sup> emergency (2), department (22), preoperative location (4), anesthesia type (4)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Surgery characteristics</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Categorical</td>
                <td>Emergency level (4)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Free text</td>
                <td>Preoperative diagnosis, proposed procedure</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Comorbid conditions</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Categorical</td>
                <td>Diabetes mellitus (2), hyperlipidemia (2), hypertension (2), cerebrovascular accident (2), cardiac disease (2), chronic obstructive pulmonary disease (2), asthma (2), hepatic disease (2), renal disease (2), bleeding disorder (2), major operations (2), smoking (2), drug allergy (2)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Preoperative laboratory values</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Continuous</td>
                <td>Hemoglobin, platelet, international normalized ratio, prothrombin time, activated partial thromboplastin time, creatinine, aspartate transaminase, alanine transaminase, blood sugar, serum sodium, serum potassium</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Preoperative vital signs</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Continuous</td>
                <td>Body temperature, oxygen saturation, heart rate, respiratory rate, systolic and diastolic blood pressure</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Categorical</td>
                <td>Consciousness status (2)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>The number of classes is shown in parentheses.</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>ASAPS: American Society of Anesthesiologist Physical Status.</p>
            </fn>
            <fn id="table2fn3">
              <p><sup>c</sup>ASA: American Society of Anesthesiologists.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Study Design</title>
        <p>Our results were compared with state-of-the-art models, using patient preoperative vital signs and laboratory data to predict in-hospital 30-day mortality [<xref ref-type="bibr" rid="ref6">6</xref>]. Meanwhile, to demonstrate the effect of adding preoperative diagnoses and proposed procedures to the prediction model, we added text features and compared the performances of the highest-performing models.</p>
        <p>First, we compared the state-of-the-art models using patient and surgery characteristics (without text), comorbidities, preoperative vital signs, and laboratory data to predict the in-hospital 30-day mortality. <xref rid="figure2" ref-type="fig">Figure 2</xref>B shows our proposed DNN model with 4 fully connected (FC) layers and a Softmax layer output function. We compared our DNN model with other ML models, including a random forest classifier (with 2000 estimators and Gini impurity as the splitting criterion) [<xref ref-type="bibr" rid="ref21">21</xref>], extreme gradient boosting (XGBoost, with a learning rate of 0.3 and a maximum depth of 6) [<xref ref-type="bibr" rid="ref22">22</xref>], and logistic regression (with an L2 penalty); see <xref rid="figure2" ref-type="fig">Figure 2</xref>A. To balance the data while training the ML models, oversampling by 78 times was performed on the training set via the synthetic minority oversampling technique; this produced synthetic samples along a straight line between randomly selected samples in the feature space [<xref ref-type="bibr" rid="ref23">23</xref>]. While training our DNN model, we adjusted the weight to compensate for the imbalanced classes. We added the text of preoperative diagnoses and proposed procedures to the DNN model architecture (denoted as BERT-DNN; see <xref rid="figure2" ref-type="fig">Figure 2</xref>C) and compared its performance with those of other models.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Architectures of models. BERT: bidirectional encoder representations from transformers: DNN: deep neural network; FC: fully connected; ML: machine learning; ReLU: rectified linear unit; XGBoost: extreme gradient boosting.</p>
          </caption>
          <graphic xlink:href="medinform_v10i5e38241_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Language Model and BERT-DNN Model Design</title>
        <p>The language model extracted features from the preprocessed text. <xref rid="figure2" ref-type="fig">Figure 2</xref>C shows the architecture of the language model. The preprocessed texts were tokenized using the BERT tokenizer, which transformed each word fragment into a unique token designed for use in BERT’s pretraining process [<xref ref-type="bibr" rid="ref17">17</xref>]. Then, these tokens were embedded by Bio+Clinical BERT, a variant of BERT pretrained on text from PubMed and Medical Information Mart for Intensive Care III [<xref ref-type="bibr" rid="ref24">24</xref>]. The text information was transformed into a 768-dimension vector (the “word embeddings”) at the pooler output layer [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref24">24</xref>]. These word embeddings were input into 2 FC layers before concatenation with other structured features. The concatenated vectors were input into 3 FC layers and a Softmax layer output function. <xref rid="figure2" ref-type="fig">Figure 2</xref>C shows the architecture of the BERT-DNN model.</p>
        <p>Cross-entropy was used as the loss function. Class weight imbalances were compensated for by setting the weights as the inverses of the different classes’ frequencies (~1:78). Further, the training data were split into training and validating sets in a 4:1 ratio to train the deep learning (DL) model. We used AdamW from the PyTorch package as the optimizer, setting a learning rate of 0.00002 for both DL models. We trained our BERT-DNN and DNN models with batch sizes of 64 and 512, respectively, until the 100th epoch. The DL model with the smallest validation loss was selected for performance comparison.</p>
      </sec>
      <sec>
        <title>Model Evaluation</title>
        <p>The models were evaluated using the AUROC, the area under the precision-recall curve (AUPRC), sensitivity (also referred to as recall), specificity, precision (also called the positive predictive value), and the F1 score. The F1 score was a harmonic mean of recall and precision and was calculated as 2/[(1/recall) + (1/precision)]. Because postoperative mortalities accounted for 1.3% (1562/121,313) of our data set, classes were extremely imbalanced between the positive and negative groups. Here, the AUPRC (which calculated the average precision) was better than the AUROC for evaluating the discrimination of models [<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref26">26</xref>]. For comparison of AUROCs, we applied a nonparametric approach proposed by DeLong et al [<xref ref-type="bibr" rid="ref27">27</xref>] to calculate the SE of the area and the <italic>P</italic> value. <italic>P</italic>&#60;.05 was regarded statistically significant. We calculated exact binomial 95% CIs for the AUROC. For comparison of AUPRCs, we performed bootstrapping 1000 times in the testing set to calculate the difference in areas and the 95% CI [<xref ref-type="bibr" rid="ref28">28</xref>]. If the 95% CI for the difference in areas does not include 0, it can be concluded that these 2 areas are significantly different (<italic>P</italic>&#60;.05). We performed bootstrapping 1000 times in the testing set to calculate the 95% CI for other metrics [<xref ref-type="bibr" rid="ref6">6</xref>]. The predicted probabilities were calibrated using the histogram bins technique, using the same observed mortality in each bin of the validation set [<xref ref-type="bibr" rid="ref8">8</xref>]. After calibration, the mean observed incidences of mortality were plotted against the mean predicted probabilities within groups in the testing set.</p>
      </sec>
      <sec>
        <title>Visualization of Word Embeddings</title>
        <p>To show the correlation between increased prediction probabilities and text inputs, the <italic>t</italic> distributed stochastic neighbor embedding (SNE) was implemented by reducing the 768 dimensions of the language model’s pool output to 2 into a plane [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref30">30</xref>]. Thus, we showed the clustering of word embeddings using assorted colors for different predicted probabilities and different icons for observed mortalities. We randomly resampled 10,000 and 5000 patients who underwent surgeries in the training and testing sets, respectively, to construct this visualization. The language-model-predicted probabilities and observed mortalities for randomly selected text inputs were calculated and listed.</p>
        <p>The study was implemented using Python 3.9, Scikit-learn 0.24 [<xref ref-type="bibr" rid="ref31">31</xref>], imbalanced-learn 0.8.0 [<xref ref-type="bibr" rid="ref23">23</xref>], PyTorch 1.8 [<xref ref-type="bibr" rid="ref32">32</xref>], and transformers 4.9 (Hugging Face) [<xref ref-type="bibr" rid="ref24">24</xref>]. Our models were trained and validated on the NVIDIA Tesla P100-PCIE-16GB graphics processing unit (GPU). The statistical significances of AUROCs and AUPRCs were calculated using MedCalc software (Ostend, Belgium).</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Comparison of Machine Learning Models</title>
        <p>The BERT-DNN had the highest AUROC of 0.964 (95% CI 0.961-0.967) and the highest AUPRC of 0.336 (95% CI 0.276-0.402); see <xref ref-type="table" rid="table3">Table 3</xref> and <xref rid="figure3" ref-type="fig">Figure 3</xref>. The random forest achieved the second-highest AUROC of 0.961 (95% CI 0.958-0.964), and the DNN achieved the second-highest AUPRC of 0.319 (95% CI 0.260-0.384). The BERT-DNN model had the highest F1 score of 0.347 (95% CI 0.305-0.388).</p>
        <p>The BERT-DNN had a significantly higher AUROC compared to XGBoost, logistic regression, and ASAPS but not a significantly higher AUROC compared to the DNN and the random forest (<xref ref-type="table" rid="table4">Table 4</xref>). The BERT-DNN also had a significantly higher AUPRC compared to the DNN, random forest, XGBoost, logistic regression, and ASAPS (<xref ref-type="table" rid="table5">Table 5</xref>).</p>
        <p>In the BERT-DNN model, when the predicted probability of mortality increased from 0.2% to 39.4%, the observed incidence increased from 0.2% to 42.7% (<xref rid="figure4" ref-type="fig">Figure 4</xref>).</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Prediction performances of ML<sup>a</sup> models and ASAPS<sup>b</sup> on the testing cohort with 95% CIs.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="120"/>
            <col width="130"/>
            <col width="120"/>
            <col width="130"/>
            <col width="120"/>
            <col width="130"/>
            <col width="120"/>
            <col width="130"/>
            <thead>
              <tr valign="top">
                <td>Model</td>
                <td>AUROC<sup>c</sup> (95% CI)</td>
                <td>AUPRC<sup>d</sup> (95% CI)</td>
                <td>Accuracy<sup>e</sup> (95% CI)</td>
                <td>Sensitivity<sup>e</sup> (95% CI)</td>
                <td>Specificity<sup>e</sup> (95% CI)</td>
                <td>Precision<sup>a</sup> (95% CI)</td>
                <td>F1 score<sup>e</sup> (95% CI)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>BERT<sup>f</sup>-DNN<sup>g</sup></td>
                <td>0.964 (0.961-0.967)</td>
                <td>0.336 (0.276-0.402)</td>
                <td>0.955 (0.952-0.958)</td>
                <td>0.749 (0.689-0.805)</td>
                <td>0.958 (0.955-0.961)</td>
                <td>0.193 (0.166-0.219)</td>
                <td>0.307 (0.269-0.342)</td>
              </tr>
              <tr valign="top">
                <td>DNN</td>
                <td>0.959 (0.956-0.962)</td>
                <td>0.319 (0.260-0.384)</td>
                <td>0.913 (0.909-0.917)</td>
                <td>0.885 (0.841-0.926)</td>
                <td>0.913 (0.909-0.918)</td>
                <td>0.120 (0.104-0.136)</td>
                <td>0.212 (0.187-0.236)</td>
              </tr>
              <tr valign="top">
                <td>Random forest</td>
                <td>0.961 (0.958-0.964)</td>
                <td>0.296 (0.239-0.360)</td>
                <td>0.986 (0.984-0.988)</td>
                <td>0.167 (0.122-0.222)</td>
                <td>0.997 (0.996-0.998)</td>
                <td>0.445 (0.341-0.557)</td>
                <td>0.242 (0.182-0.314)</td>
              </tr>
              <tr valign="top">
                <td>XGBoost<sup>h</sup></td>
                <td>0.950 (0.946-0.953)</td>
                <td>0.281 (0.225-0.345)</td>
                <td>0.986 (0.984-0.987)</td>
                <td>0.195 (0.144-0.249)</td>
                <td>0.996 (0.995-0.997)</td>
                <td>0.409 (0.312-0.500)</td>
                <td>0.263 (0.201-0.326)</td>
              </tr>
              <tr valign="top">
                <td>Logistic regression</td>
                <td>0.952 (0.949-0.955)</td>
                <td>0.276 (0.220-0.339)</td>
                <td>0.904 (0.900-0.909)</td>
                <td>0.833 (0.780-0.882)</td>
                <td>0.905 (0.901-0.910)</td>
                <td>0.105 (0.091-0.119)</td>
                <td>0.187 (0.164-0.210)</td>
              </tr>
              <tr valign="top">
                <td>ASAPS</td>
                <td>0.892 (0.887-0.896)</td>
                <td>0.149 (0.107-0.203)</td>
                <td>0.970 (0.968-0.973)</td>
                <td>0.409 (0.342-0.478)</td>
                <td>0.978 (0.975-0.980)</td>
                <td>0.197 (0.160-0.235)</td>
                <td>0.266 (0.220-0.310)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>ML: machine learning.</p>
            </fn>
            <fn id="table3fn2">
              <p><sup>b</sup>ASAPS: American Society of Anesthesiologist Physical Status.</p>
            </fn>
            <fn id="table3fn3">
              <p><sup>c</sup>AUROC: area under the receiver operating characteristic.</p>
            </fn>
            <fn id="table3fn4">
              <p><sup>d</sup>AUPRC: area under the precision-recall curve.</p>
            </fn>
            <fn id="table3fn5">
              <p><sup>e</sup>These metrics were calculated without adjusting the threshold (using 0.5 as the cut-off).</p>
            </fn>
            <fn id="table3fn6">
              <p><sup>f</sup>BERT: bidirectional encoder representations from transformers.</p>
            </fn>
            <fn id="table3fn7">
              <p><sup>g</sup>DNN: deep neural network.</p>
            </fn>
            <fn id="table3fn8">
              <p><sup>h</sup>XGBoost: extreme gradient boosting.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Comparison of discrimination of different models. (A) AUROC. (B) AUPRC. ASAPS: American Society of Anesthesiologist Physical Status; AUPRC: area under the precision-recall curve; AUROC: area under the receiver operating characteristic curve; BERT: bidirectional encoder representations from transformers; DNN: deep neural network; XGBoost: extreme gradient boosting.</p>
          </caption>
          <graphic xlink:href="medinform_v10i5e38241_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>Statistical significances of AUROCs<sup>a</sup> of different models. Values are <italic>P</italic> values. We applied a nonparametric approach proposed by DeLong et al [<xref ref-type="bibr" rid="ref27">27</xref>] to calculate the SE of the area and the <italic>P</italic> value.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="190"/>
            <col width="160"/>
            <col width="150"/>
            <col width="160"/>
            <col width="170"/>
            <col width="170"/>
            <thead>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>BERT<sup>b</sup>-DNN<sup>c</sup></td>
                <td>DNN</td>
                <td>Random forest</td>
                <td>XGBoost<sup>d</sup></td>
                <td>Logistic regression</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>ASAPS<sup>e</sup></td>
                <td>&#60;0.0001<sup>f</sup></td>
                <td>&#60;0.0001<sup>f</sup></td>
                <td>&#60;0.0001<sup>f</sup></td>
                <td>&#60;0.0001<sup>f</sup></td>
                <td>&#60;0.0001<sup>f</sup></td>
              </tr>
              <tr valign="top">
                <td>Logistic regression</td>
                <td>0.0005<sup>f</sup></td>
                <td>0.0711</td>
                <td>0.0351<sup>f</sup></td>
                <td>0.6451</td>
                <td>N/A<sup>g</sup></td>
              </tr>
              <tr valign="top">
                <td>XGBoost</td>
                <td>0.0025<sup>f</sup></td>
                <td>0.0939</td>
                <td>0.0262<sup>f</sup></td>
                <td>N/A</td>
                <td>N/A</td>
              </tr>
              <tr valign="top">
                <td>Random forest</td>
                <td>0.3816</td>
                <td>0.5972</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
              </tr>
              <tr valign="top">
                <td>DNN</td>
                <td>0.0944</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table4fn1">
              <p><sup>a</sup>AUROC: area under the receiver operating characteristic.</p>
            </fn>
            <fn id="table4fn2">
              <p><sup>b</sup>BERT: bidirectional encoder representations from transformers.</p>
            </fn>
            <fn id="table4fn3">
              <p><sup>c</sup>DNN: deep neural network.</p>
            </fn>
            <fn id="table4fn4">
              <p><sup>d</sup>XGBoost: extreme gradient boosting.</p>
            </fn>
            <fn id="table4fn5">
              <p><sup>e</sup>ASAPS: American Society of Anesthesiologist Physical Status.</p>
            </fn>
            <fn id="table4fn6">
              <p><sup>f</sup>The difference in areas achieved statistical significance (<italic>P</italic>&#60;.05).</p>
            </fn>
            <fn id="table4fn7">
              <p><sup>g</sup>N/A: not applicable.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table5">
          <label>Table 5</label>
          <caption>
            <p>Statistical significances of AUPRCs<sup>a</sup> of different models. Values are differences in areas with 95% CIs calculated by bootstrapping 1000 times [<xref ref-type="bibr" rid="ref28">28</xref>]. If the 95% CI for the difference in areas does not include 0, it can be concluded that these 2 areas are significantly different (<italic>P</italic>&#60;.05).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="150"/>
            <col width="170"/>
            <col width="150"/>
            <col width="180"/>
            <col width="160"/>
            <col width="190"/>
            <thead>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>BERT<sup>b</sup>-DNN<sup>c</sup>, difference in areas (95% CI)</td>
                <td>DNN, difference in areas (95% CI)</td>
                <td>Random forest, difference in areas (95% CI)</td>
                <td>XGBoost<sup>d</sup>, difference in areas (95% CI)</td>
                <td>Logistic regression, difference in areas (95% CI)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>ASAPS<sup>e</sup></td>
                <td>0.188 (0.159-0.221)<sup>f</sup></td>
                <td>0.170 (0.137-0.201)<sup>f</sup></td>
                <td>0.147 (0.122-0.177)<sup>f</sup></td>
                <td>0.133 (0.107-0.162)<sup>f</sup></td>
                <td>0.127 (0.101-0.154)<sup>f</sup></td>
              </tr>
              <tr valign="top">
                <td>Logistic regression</td>
                <td>0.061 (0.051-0.073)<sup>f</sup></td>
                <td>0.043 (0.021-0.056)<sup>f</sup></td>
                <td>0.020 (0.006-0.031)<sup>f</sup></td>
                <td>0.006 (–0.006 to 0.014)</td>
                <td>N/A<sup>g</sup></td>
              </tr>
              <tr valign="top">
                <td>XGBoost</td>
                <td>0.055 (0.044-0.068)<sup>f</sup></td>
                <td>0.038 (0.024-0.046)<sup>f</sup></td>
                <td>0.015 (0.005-0.022)<sup>f</sup></td>
                <td>N/A</td>
                <td>N/A</td>
              </tr>
              <tr valign="top">
                <td>Random forest</td>
                <td>0.040 (0.030-0.054)<sup>f</sup></td>
                <td>0.023 (0.010-0.032)<sup>f</sup></td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
              </tr>
              <tr valign="top">
                <td>DNN</td>
                <td>0.018 (0.008-0.037)<sup>f</sup></td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table5fn1">
              <p><sup>a</sup>AUPRC: area under the precision-recall curve.</p>
            </fn>
            <fn id="table5fn2">
              <p><sup>b</sup>BERT: bidirectional encoder representations from transformers.</p>
            </fn>
            <fn id="table5fn3">
              <p><sup>c</sup>DNN: deep neural network.</p>
            </fn>
            <fn id="table5fn4">
              <p><sup>d</sup>XGBoost: extreme gradient boosting.</p>
            </fn>
            <fn id="table5fn5">
              <p><sup>e</sup>ASAPS: American Society of Anesthesiologist Physical Status.</p>
            </fn>
            <fn id="table5fn6">
              <p><sup>f</sup>The difference in areas achieved statistical significance (<italic>P</italic>&#60;.05).</p>
            </fn>
            <fn id="table5fn7">
              <p><sup>g</sup>N/A: not applicable.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>Calibration plot. The observed incidence of mortality was plotted against the calibrated predicted probability of mortality among patients in the test cohort (n=16,267, 14.1%). Predicted probabilities were calibrated by applying the histogram binning technique in the validation cohort using 5 bins. Mean predicted probabilities of in-hospital 30-day mortality were calculated within each group.</p>
          </caption>
          <graphic xlink:href="medinform_v10i5e38241_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Visualization of Word Embeddings</title>
        <p>Because the observed mortalities were distributed concordantly with increased prediction probabilities, the annotated scatter plots showed that the text contributed to low- and high-probability predictions (<xref rid="figure5" ref-type="fig">Figure 5</xref>, <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>). <xref ref-type="table" rid="table6">Table 6</xref> lists the probabilities predicted by the language model and the mortalities observed for a randomly selected text input.</p>
        <fig id="figure5" position="float">
          <label>Figure 5</label>
          <caption>
            <p>Word embeddings visualized by t distributed stochastic neighbor embedding. (A) Word embeddings of the training set. (B) Word embeddings of the testing set. “Probs” indicates probabilities predicated by the BERT-DNN model. The intensity of color increased with the probability. “Labels” indicates mortalities by “x” and survivors by “•”. ards: acute respiratory distress syndrome; atfl: anterior talofibular ligament; avg: arteriovenous graft; avp: aortic valvuloplasty; BERT: bidirectional encoder representations from transformers; bct: breast-conserving therapy; bil: bilateral; bph: benign prostate hypertrophy; bx: biopsy; chr: chronic hypertrophic rhinitis; cps: chronic paranasal sinusitis; dbj: double J stent; DNN: deep neural network; ecmo: extracorporeal membrane oxygenation; emh: endometrial hemorrhage; esrd: end-stage renal disease; fess: functional endoscopic sinus surgery; itc: intertrochanter; ivg: intravenous general anesthesia; lih: left inguinal hernia; mvr: mitral valve replacement; nsd: nasal septum deviation; p: post; pcnl: percutaneous nephrolithotomy; perm cath: permanent catheter; psa: prostate-specific antigen; r: rule out; r’t: right; rirs: retrograde intrarenal surgery; rv: right ventricle; slnd: sentinel lymph node dissection; SNE: stochastic neighbor embedding; t colon: transverse colon; tee: transesophageal echocardiography; tep: total extraperitoneal approach; trus: transrectal ultrasound; turp: transurethral resection of the prostate; urs: ureteroscopy; vats: video-assisted thoracic surgery; vhd: valvular heart disease. Higher-resolution version of this figure available in <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>.</p>
          </caption>
          <graphic xlink:href="medinform_v10i5e38241_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table6">
          <label>Table 6</label>
          <caption>
            <p>Texts and their predicted probabilities by language model. Values are probabilities or mortalities.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="200"/>
            <col width="280"/>
            <col width="520"/>
            <thead>
              <tr valign="top">
                <td>Predicted probability</td>
                <td>Observed mortality (1=mortality; 0=no mortality)</td>
                <td>Original free text combining preoperative diagnosis and proposed procedures</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>0.951</td>
                <td>1</td>
                <td>IHCA<sup>a</sup> p<sup>b</sup> CPR<sup>c</sup> ECMO<sup>d</sup> ACS<sup>e</sup> AR<sup>f</sup> full sternotomy CABG<sup>g</sup> AVR<sup>h</sup></td>
              </tr>
              <tr valign="top">
                <td>0.948</td>
                <td>0</td>
                <td>AMI<sup>i</sup> cardiogenic shock p ECMO remove ECMO TEE<sup>j</sup></td>
              </tr>
              <tr valign="top">
                <td>0.940</td>
                <td>1</td>
                <td>hollow organ perforation r<sup>k</sup> PPU<sup>l</sup> related LPPU<sup>m</sup> possible EXP LAP<sup>n</sup></td>
              </tr>
              <tr valign="top">
                <td>0.936</td>
                <td>1</td>
                <td>intra-abdominal bleeding EXP LAP</td>
              </tr>
              <tr valign="top">
                <td>0.932</td>
                <td>1</td>
                <td>ischemic bowel laparoscopic diagnosis possible EXP LAP</td>
              </tr>
              <tr valign="top">
                <td>0.927</td>
                <td>0</td>
                <td>acute pulmonary embolism IHCA p ECMO angiography TEE</td>
              </tr>
              <tr valign="top">
                <td>0.925</td>
                <td>1</td>
                <td>duodenal ulcer perforation p duodenorrhaphy leakage bleeding EXP LAP</td>
              </tr>
              <tr valign="top">
                <td>0.912</td>
                <td>0</td>
                <td>respiratory failure tracheostomy</td>
              </tr>
              <tr valign="top">
                <td>0.880</td>
                <td>0</td>
                <td>hallow organ perforation r PPU LPPU</td>
              </tr>
              <tr valign="top">
                <td>0.815</td>
                <td>0</td>
                <td>acute kidney failure perm cath<sup>o</sup> insertion</td>
              </tr>
              <tr valign="top">
                <td>0.760</td>
                <td>0</td>
                <td>post UPPP<sup>p</sup> wound bleeding check bleeding</td>
              </tr>
              <tr valign="top">
                <td>0.680</td>
                <td>0</td>
                <td>ESRD<sup>q</sup> HD<sup>r</sup> via right perm cath<sup>s</sup> qw2 4 6 perm cath dysfunction perm cath insertion change perm cath right neck</td>
              </tr>
              <tr valign="top">
                <td>0.527</td>
                <td>0</td>
                <td>ESRD left AVG<sup>t</sup> occlusion left AVG thrombectomy</td>
              </tr>
              <tr valign="top">
                <td>0.415</td>
                <td>0</td>
                <td>left lower leg soft tissue infection suspect necrotizing fasciitis debridement</td>
              </tr>
              <tr valign="top">
                <td>0.353</td>
                <td>0</td>
                <td>ESRD right AVF<sup>u</sup> dysfunction upper arm angiography PTA<sup>v</sup></td>
              </tr>
              <tr valign="top">
                <td>0.250</td>
                <td>0</td>
                <td>RLL<sup>w</sup> lung tumor r lung cancer vats RLL lobectomy wedge first send frozen exam</td>
              </tr>
              <tr valign="top">
                <td>0.186</td>
                <td>0</td>
                <td>left lower extremity NF<sup>x</sup> open BK<sup>y</sup></td>
              </tr>
              <tr valign="top">
                <td>0.114</td>
                <td>0</td>
                <td>left anterior mediastinal tumor multiple lung nodules rectal cancer p CCRT<sup>z</sup> VATS<sup>aa</sup> mediastinal tumor excision LAR<sup>ab</sup></td>
              </tr>
              <tr valign="top">
                <td>0.042</td>
                <td>0</td>
                <td>right ACL<sup>ac</sup> MCL<sup>ad</sup> injury arthroscopy ACL reconstruction</td>
              </tr>
              <tr valign="top">
                <td>0.041</td>
                <td>0</td>
                <td>1 C4 5 6 spondylosis 2 right carpal tunnel 1 ACDF<sup>ae</sup> C4 5 6 2 right median nerve decompression</td>
              </tr>
              <tr valign="top">
                <td>0.031</td>
                <td>0</td>
                <td>bil<sup>af</sup> ov<sup>ag</sup> teratoma laparoscopy adnexectomy</td>
              </tr>
              <tr valign="top">
                <td>0.030</td>
                <td>0</td>
                <td>left ureter stone URSL<sup>ah</sup> laser left</td>
              </tr>
              <tr valign="top">
                <td>0.029</td>
                <td>0</td>
                <td>uterine myoma robotic myomectomy</td>
              </tr>
              <tr valign="top">
                <td>0.029</td>
                <td>0</td>
                <td>acute appendicitis laparoscopic appendectomy</td>
              </tr>
              <tr valign="top">
                <td>0.029</td>
                <td>0</td>
                <td>hemorrhoids hemorrhoidectomy</td>
              </tr>
              <tr valign="top">
                <td>0.029</td>
                <td>0</td>
                <td>nontoxic goiter thyroidectomy</td>
              </tr>
              <tr valign="top">
                <td>0.027</td>
                <td>0</td>
                <td>infertility TVOR<sup>ai</sup></td>
              </tr>
              <tr valign="top">
                <td>0.027</td>
                <td>0</td>
                <td>endometrial polyp TCR<sup>aj</sup></td>
              </tr>
              <tr valign="top">
                <td>0.027</td>
                <td>0</td>
                <td>GA<sup>ak</sup> 38 weeks breech caesarean section</td>
              </tr>
              <tr valign="top">
                <td>0.025</td>
                <td>0</td>
                <td>rt<sup>al</sup> breast lesion MRI<sup>am</sup> guided biopsy</td>
              </tr>
              <tr valign="top">
                <td>0.025</td>
                <td>0</td>
                <td>right inguinal hernia TEP<sup>an</sup> right</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table6fn1">
              <p><sup>a</sup>IHCA: intrahospital cardiac arrest.</p>
            </fn>
            <fn id="table6fn2">
              <p><sup>b</sup>p: post.</p>
            </fn>
            <fn id="table6fn3">
              <p><sup>c</sup>CPR: cardiopulmonary resuscitation.</p>
            </fn>
            <fn id="table6fn4">
              <p><sup>d</sup>ECMO: extracorporeal membrane oxygenation.</p>
            </fn>
            <fn id="table6fn5">
              <p><sup>e</sup>ACS: acute coronary syndrome.</p>
            </fn>
            <fn id="table6fn6">
              <p><sup>f</sup>AR: aortic regurgitation.</p>
            </fn>
            <fn id="table6fn7">
              <p><sup>g</sup>CABG: coronary artery bypass graft.</p>
            </fn>
            <fn id="table6fn8">
              <p><sup>h</sup>AVR: aortic valve replacement.</p>
            </fn>
            <fn id="table6fn9">
              <p><sup>i</sup>AMI: acute myocardial infarction.</p>
            </fn>
            <fn id="table6fn10">
              <p><sup>j</sup>TEE: transesophageal echocardiography.</p>
            </fn>
            <fn id="table6fn11">
              <p><sup>k</sup>r: rule out.</p>
            </fn>
            <fn id="table6fn12">
              <p><sup>l</sup>PPU: perforated peptic ulcer.</p>
            </fn>
            <fn id="table6fn13">
              <p><sup>m</sup>LPPU: laparoscopic perforated peptic ulcer surgery.</p>
            </fn>
            <fn id="table6fn14">
              <p><sup>n</sup>EXP LAP: exploratory laparotomy.</p>
            </fn>
            <fn id="table6fn15">
              <p><sup>o</sup>cath: catheter.</p>
            </fn>
            <fn id="table6fn16">
              <p><sup>p</sup>UPPP: uvulopalatopharyngoplasty.</p>
            </fn>
            <fn id="table6fn17">
              <p><sup>q</sup>ESRD, end-stage renal disease.</p>
            </fn>
            <fn id="table6fn18">
              <p><sup>r</sup>HD: hemodialysis.</p>
            </fn>
            <fn id="table6fn19">
              <p><sup>s</sup>perm cath: permanent catheter.</p>
            </fn>
            <fn id="table6fn20">
              <p><sup>t</sup>AVG: arteriovenous graft.</p>
            </fn>
            <fn id="table6fn21">
              <p><sup>u</sup>AVF: arteriovenous fistula.</p>
            </fn>
            <fn id="table6fn22">
              <p><sup>v</sup>PTA: percutaneous transluminal angioplasty.</p>
            </fn>
            <fn id="table6fn23">
              <p><sup>w</sup>RLL: right lower lobe.</p>
            </fn>
            <fn id="table6fn24">
              <p><sup>x</sup>NF: necrotizing fasciitis.</p>
            </fn>
            <fn id="table6fn25">
              <p><sup>y</sup>BK: below-knee amputation.</p>
            </fn>
            <fn id="table6fn26">
              <p><sup>z</sup>CCRT: concurrent chemoradiotherapy.</p>
            </fn>
            <fn id="table6fn27">
              <p><sup>aa</sup>VATS: video-assisted thoracic surgery.</p>
            </fn>
            <fn id="table6fn28">
              <p><sup>ab</sup>LAR: low anterior resection.</p>
            </fn>
            <fn id="table6fn29">
              <p><sup>ac</sup>ACL: anterior cruciate ligament.</p>
            </fn>
            <fn id="table6fn30">
              <p><sup>ad</sup>MCL: medial collateral ligament.</p>
            </fn>
            <fn id="table6fn31">
              <p><sup>ae</sup>ACDF: anterior cervical discectomy and fusion.</p>
            </fn>
            <fn id="table6fn32">
              <p><sup>af</sup>bil: bilateral.</p>
            </fn>
            <fn id="table6fn33">
              <p><sup>ag</sup>ov: ovarian.</p>
            </fn>
            <fn id="table6fn34">
              <p><sup>ah</sup>URSL: ureteroscopic lithotomy.</p>
            </fn>
            <fn id="table6fn35">
              <p><sup>ai</sup>TVOR: transvaginal oocyte retrieval.</p>
            </fn>
            <fn id="table6fn36">
              <p><sup>aj</sup>TCR: transcervical resectoscope.</p>
            </fn>
            <fn id="table6fn37">
              <p><sup>ak</sup>GA: gestational age.</p>
            </fn>
            <fn id="table6fn38">
              <p><sup>al</sup>rt: right.</p>
            </fn>
            <fn id="table6fn39">
              <p><sup>am</sup>MRI: magnetic resonance imaging.</p>
            </fn>
            <fn id="table6fn40">
              <p><sup>an</sup>TEP: total extraperitoneal approach.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>The DNN-BERT model predicted the in-hospital 30-day mortality with the highest AUROC of 0.964 (95% CI 0.961-0.967) and an AUPRC of 0.336 (95% CI 0.276-0.402); see <xref ref-type="table" rid="table3">Table 3</xref> and <xref rid="figure3" ref-type="fig">Figure 3</xref>. The BERT-DNN had an AUROC significantly higher compared to XGBoost, logistic regression, and ASAPS but not the DNN or random forest. The BERT-DNN also had an AUPRC significantly higher compared to the DNN, random forest, XGBoost, logistic regression, and ASAPS.</p>
        <p>Hill et al [<xref ref-type="bibr" rid="ref6">6</xref>] proposed an ML model that outperformed previous tools (eg, preoperative score to predict postoperative mortality, Charlson comorbidity, and ASAPS) and could be used independently by clinicians. Our BERT-DNN model outperformed Hill et al’s [<xref ref-type="bibr" rid="ref6">6</xref>] model, obtaining a higher AUROC, sensitivity, and F1 score than their results (0.964, 95% CI 0.961-0.967 vs 0.932, 95% CI 0.910-0.951; 0.650, 95% CI 0.587-0.719 vs 0.239, 95% CI 0.127-0.379; and 0.347, 95% CI 0.305-0.388 vs 0.302, 95% CI 0.172-0.449, respectively); see <xref ref-type="table" rid="table3">Table 3</xref>. The preoperative diagnosis text features and proposed procedure information might contribute to our BERT-DNN model and enhance its sensitivity and F1 score. Unlike Hill et al [<xref ref-type="bibr" rid="ref6">6</xref>], who focused on patients undergoing general anesthesia, we trained and tested our model on both general and neuraxial anesthesia. The DL model with clinical text predicted postoperative mortality significantly more discriminatively than logistic regression and ASAPS (<xref ref-type="table" rid="table4">Table 4</xref>).</p>
        <p>DL methods predict postoperative mortality using preoperative and intraoperative features [<xref ref-type="bibr" rid="ref7">7</xref>-<xref ref-type="bibr" rid="ref9">9</xref>]. Using a summary of intraoperative features alongside the ASAPS, Lee et al [<xref ref-type="bibr" rid="ref7">7</xref>] presented a DNN model that achieved an AUROC of 0.91 (95% CI 0.88-0.93). Our DNN model obtained a higher AUROC than their model because we included key features such as preoperative location and surgical department, the importance of which was also verified in previous studies [<xref ref-type="bibr" rid="ref6">6</xref>]. Fritz et al [<xref ref-type="bibr" rid="ref8">8</xref>] proposed a multipath convolutional neural network model to predict postoperative mortality using intraoperative time-series data and preoperative features. Their model achieved an AUROC of 0.910 (95% CI 0.897-0.924) and an AUPRC of 0.325 (95% CI 0.280-0.372) [<xref ref-type="bibr" rid="ref33">33</xref>]. In contrast, our model can be used preoperatively and achieve a higher AUROC and AUPRC (<xref ref-type="table" rid="table3">Table 3</xref>).</p>
        <p>Previous studies used <italic>ICD</italic> and CPT codes as categorical features to stratify surgery risk [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref12">12</xref>]. This input feature has many classes, which resulted in a sparse input matrix; this made it difficult for the model to learn helpful information. However, because <italic>ICD</italic> codes were typically recorded after surgery, including them in the preoperative model was impractical. Furthermore, the CPT code was not used globally. For this reason, we could not compare a model including word embeddings with one including CPT codes. However, our results exhibited excellent discrimination with a high AUROC and AUPRC. The AUPRC is significantly higher than models without text. The calibration plot also strongly correlated the predicted probabilities and observed mortalities (<xref rid="figure4" ref-type="fig">Figure 4</xref>). Word embedding visualizations showed that the increased predicted probabilities were concordant with high-risk surgery and an increased mortality rate (<xref rid="figure5" ref-type="fig">Figure 5</xref> and <xref ref-type="table" rid="table6">Table 6</xref>). We showed that word embeddings for surgery information could be used in DL models to predict postoperative mortality before surgery without requiring CPT or <italic>ICD</italic> codes.</p>
        <p>The fusion of neural networks, combining diverse types of data (eg, image [<xref ref-type="bibr" rid="ref34">34</xref>] and time-series [<xref ref-type="bibr" rid="ref8">8</xref>] data) with 1D data (eg, categorical, and continuous data), improved the model’s performance. Including unstructured clinical text via natural language procession can improve intensive care unit (ICU) mortality predictions [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref16">16</xref>]. The DL model that combined unstructured and structured data outperformed models using either type of data alone [<xref ref-type="bibr" rid="ref15">15</xref>]. Moreover, the performance of the clinical pretrained DL language model could be maintained between different institutions [<xref ref-type="bibr" rid="ref35">35</xref>].</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>Our study has several limitations. First, postoperative mortality accounted for 1.3% (1562/121,313) of our cohort, and the classes were highly imbalanced. The model training and performance metric evaluations were difficult to apply with these sparse positive labels. To compensate for the class imbalance via an algorithmic method, we applied cost-sensitive learning by balancing the weights of the loss function to emphasize the minority group [<xref ref-type="bibr" rid="ref36">36</xref>]. We evaluated the discrimination of our model with the AUPRC, which is more informative than the AUROC for imbalanced data [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref26">26</xref>]. Second, our model predicted mortality using EHRs. The errors in the records and missing values affected the prediction results. Typos of text interfered with the word-embedding process. Outliers were detected and input using the defined rules (<xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>). Third, all records were collected from a single large medical center. Although the pipeline we created ensured that the DL model could be reproduced in other institutes, the model weights might vary for a different data set. The generalizability of our results must be examined in future studies.</p>
      </sec>
      <sec>
        <title>Conclusion</title>
        <p>In conclusion, descriptive surgical text was essential for predicting postoperative mortality. The word embeddings of preoperative diagnoses and proposed procedures, via the contextualized language model BERT, were combined in DL models to predict postoperative mortality. This predictive capacity can help identify patients with higher risk from structure data and text of EHRs.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Summary of laboratory values and vital sign values.</p>
        <media xlink:href="medinform_v10i5e38241_app1.doc" xlink:title="DOC File , 45 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>Continuous feature limits to define outliers.</p>
        <media xlink:href="medinform_v10i5e38241_app2.doc" xlink:title="DOC File , 33 KB"/>
      </supplementary-material>
      <supplementary-material id="app3">
        <label>Multimedia Appendix 3</label>
        <p>Higher resolution of <xref rid="figure5" ref-type="fig">Figure 5</xref>. Word embeddings visualized by t distributed stochastic neighbor embedding. (A) Word embeddings of the training set. (B) Word embeddings of the testing set. “Probs” indicates probabilities predicated by the BERT-DNN model. The intensity of color increased with the probability. “Labels” indicates mortalities by “x” and survivors by “•”. ards: acute respiratory distress syndrome; atfl: anterior talofibular ligament; avg: arteriovenous graft; avp: aortic valvuloplasty; BERT: bidirectional encoder representations from transformers; bct: breast-conserving therapy; bil: bilateral; bph: benign prostate hypertrophy; bx: biopsy; chr: chronic hypertrophic rhinitis; cps: chronic paranasal sinusitis; dbj: double J stent; DNN: deep neural network; ecmo: extracorporeal membrane oxygenation; emh: endometrial hemorrhage; esrd: end-stage renal disease; fess: functional endoscopic sinus surgery; itc: intertrochanter; ivg: intravenous general anesthesia; lih: left inguinal hernia; mvr: mitral valve replacement; nsd: nasal septum deviation; p: post; pcnl: percutaneous nephrolithotomy; perm cath: permanent catheter; psa: prostate-specific antigen; r: rule out; r’t: right; rirs: retrograde intrarenal surgery; rv: right ventricle; slnd: sentinel lymph node dissection; SNE: stochastic neighbor embedding; t colon: transverse colon; tee: transesophageal echocardiography; tep: total extraperitoneal approach; trus: transrectal ultrasound; turp: transurethral resection of the prostate; urs: ureteroscopy; vats: video-assisted thoracic surgery; vhd: valvular heart disease.</p>
        <media xlink:href="medinform_v10i5e38241_app3.png" xlink:title="PNG File , 5102 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">ASAPS</term>
          <def>
            <p>American Society of Anesthesiologist Physical Status</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">AUPRC</term>
          <def>
            <p>area under the precision-recall curve</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">AUROC</term>
          <def>
            <p>area under the receiver operator characteristic curve</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">BERT</term>
          <def>
            <p>bidirectional encoder representations from transformers</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">CPT</term>
          <def>
            <p>Current Procedural Terminology</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">DL</term>
          <def>
            <p>deep learning</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">DNN</term>
          <def>
            <p>deep neural network</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">EHR</term>
          <def>
            <p>electronic health record</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">FC</term>
          <def>
            <p>fully connected</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">ICD</term>
          <def>
            <p>International Classification of Diseases</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">ML</term>
          <def>
            <p>machine learning</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb12">XGBoost</term>
          <def>
            <p>extreme gradient boosting</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This work was supported by the Ministry of Science and Technology, Taiwan (Grant MOST 110-2634-F-002-032-), and the Far Eastern Memorial Hospital, Taiwan (Grant FEMH-2021-C-056). The sponsors had no role in the study design, data collection and analysis, publication decision, or manuscript drafting. All authors have approved the final article.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <collab>International Surgical Outcomes Study Group</collab>
          </person-group>
          <article-title>Global patient outcomes after elective surgery: prospective cohort study in 27 low-, middle- and high-income countries</article-title>
          <source>Br J Anaesth</source>
          <year>2016</year>
          <month>10</month>
          <day>31</day>
          <volume>117</volume>
          <issue>5</issue>
          <fpage>601</fpage>
          <lpage>609</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0007-0912(17)30018-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/bja/aew316</pub-id>
          <pub-id pub-id-type="medline">27799174</pub-id>
          <pub-id pub-id-type="pii">S0007-0912(17)30018-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC5091334</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sigakis</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bittner</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Wanderer</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Validation of a risk stratification index and risk quantification index for predicting patient outcomes: in-hospital mortality, 30-day mortality, 1-year mortality, and length-of-stay</article-title>
          <source>Anesthesiology</source>
          <year>2013</year>
          <month>09</month>
          <volume>119</volume>
          <issue>3</issue>
          <fpage>525</fpage>
          <lpage>40</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://pubs.asahq.org/anesthesiology/article-lookup/doi/10.1097/ALN.0b013e31829ce6e6"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/ALN.0b013e31829ce6e6</pub-id>
          <pub-id pub-id-type="medline">23770598</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Le Manach</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Collins</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Rodseth</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Le Bihan-Benjamin</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Biccard</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Riou</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Devereaux</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Landais</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Preoperative Score to Predict Postoperative Mortality (POSPOM): derivation and validation</article-title>
          <source>Anesthesiology</source>
          <year>2016</year>
          <month>03</month>
          <volume>124</volume>
          <issue>3</issue>
          <fpage>570</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://pubs.asahq.org/anesthesiology/article-lookup/doi/10.1097/ALN.0000000000000972"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/ALN.0000000000000972</pub-id>
          <pub-id pub-id-type="medline">26655494</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mayhew</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Mendonca</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Murthy</surname>
              <given-names>BVS</given-names>
            </name>
          </person-group>
          <article-title>A review of ASA physical status: historical perspectives and modern developments</article-title>
          <source>Anaesthesia</source>
          <year>2019</year>
          <month>03</month>
          <day>15</day>
          <volume>74</volume>
          <issue>3</issue>
          <fpage>373</fpage>
          <lpage>379</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1111/anae.14569"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/anae.14569</pub-id>
          <pub-id pub-id-type="medline">30648259</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bilimoria</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Paruch</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Kmiecik</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ko</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>ME</given-names>
            </name>
          </person-group>
          <article-title>Development and evaluation of the universal ACS NSQIP surgical risk calculator: a decision aid and informed consent tool for patients and surgeons</article-title>
          <source>J Am Coll Surg</source>
          <year>2013</year>
          <month>11</month>
          <volume>217</volume>
          <issue>5</issue>
          <fpage>833</fpage>
          <lpage>42.e1</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/24055383"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jamcollsurg.2013.07.385</pub-id>
          <pub-id pub-id-type="medline">24055383</pub-id>
          <pub-id pub-id-type="pii">S1072-7515(13)00894-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC3805776</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hill</surname>
              <given-names>BL</given-names>
            </name>
            <name name-style="western">
              <surname>Brown</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Gabel</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Rakocz</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Cannesson</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Baldi</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Olde Loohuis</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Jew</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Maoz</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Mahajan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sankararaman</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hofer</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Halperin</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>An automated machine learning-based model predicts postoperative mortality using readily-extractable preoperative electronic health record data</article-title>
          <source>Br J Anaesth</source>
          <year>2019</year>
          <month>12</month>
          <volume>123</volume>
          <issue>6</issue>
          <fpage>877</fpage>
          <lpage>886</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0007-0912(19)30646-4"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.bja.2019.07.030</pub-id>
          <pub-id pub-id-type="medline">31627890</pub-id>
          <pub-id pub-id-type="pii">S0007-0912(19)30646-4</pub-id>
          <pub-id pub-id-type="pmcid">PMC6883494</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>CK</given-names>
            </name>
            <name name-style="western">
              <surname>Hofer</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Gabel</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Baldi</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Cannesson</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Development and validation of a deep neural network model for prediction of postoperative in-hospital mortality</article-title>
          <source>Anesthesiology</source>
          <year>2018</year>
          <month>10</month>
          <volume>129</volume>
          <issue>4</issue>
          <fpage>649</fpage>
          <lpage>662</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://pubs.asahq.org/anesthesiology/article-lookup/doi/10.1097/ALN.0000000000002186"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/ALN.0000000000002186</pub-id>
          <pub-id pub-id-type="medline">29664888</pub-id>
          <pub-id pub-id-type="pmcid">PMC6148401</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fritz</surname>
              <given-names>BA</given-names>
            </name>
            <name name-style="western">
              <surname>Cui</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Kronzer</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ben Abdallah</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>King</surname>
              <given-names>CR</given-names>
            </name>
            <name name-style="western">
              <surname>Avidan</surname>
              <given-names>MS</given-names>
            </name>
          </person-group>
          <article-title>Deep-learning model for predicting 30-day postoperative mortality</article-title>
          <source>Br J Anaesth</source>
          <year>2019</year>
          <month>11</month>
          <volume>123</volume>
          <issue>5</issue>
          <fpage>688</fpage>
          <lpage>695</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0007-0912(19)30636-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.bja.2019.07.025</pub-id>
          <pub-id pub-id-type="medline">31558311</pub-id>
          <pub-id pub-id-type="pii">S0007-0912(19)30636-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC6993109</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yan</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Goldsmith</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Mohan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Turnbull</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Freundlich</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Billings</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Kiran</surname>
              <given-names>RP</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Impact of intraoperative data on risk prediction for mortality after intra-abdominal surgery</article-title>
          <source>Anesth Analg</source>
          <year>2022</year>
          <month>01</month>
          <day>01</day>
          <volume>134</volume>
          <issue>1</issue>
          <fpage>102</fpage>
          <lpage>113</lpage>
          <pub-id pub-id-type="doi">10.1213/ANE.0000000000005694</pub-id>
          <pub-id pub-id-type="medline">34908548</pub-id>
          <pub-id pub-id-type="pii">00000539-202201000-00016</pub-id>
          <pub-id pub-id-type="pmcid">PMC8682663</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Konishi</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Goto</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Fujiogi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Michihata</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Kumazawa</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Matsui</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Fushimi</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Tanabe</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Seto</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Yasunaga</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>New machine learning scoring system for predicting postoperative mortality in gastroduodenal ulcer perforation: a study using a Japanese nationwide inpatient database</article-title>
          <source>Surgery</source>
          <year>2022</year>
          <month>04</month>
          <volume>171</volume>
          <issue>4</issue>
          <fpage>1036</fpage>
          <lpage>1042</lpage>
          <pub-id pub-id-type="doi">10.1016/j.surg.2021.08.031</pub-id>
          <pub-id pub-id-type="medline">34538648</pub-id>
          <pub-id pub-id-type="pii">S0039-6060(21)00846-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rogers</surname>
              <given-names>MP</given-names>
            </name>
            <name name-style="western">
              <surname>Janjua</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>DeSantis</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Grimsley</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Pietrobon</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Kuo</surname>
              <given-names>PC</given-names>
            </name>
          </person-group>
          <article-title>Machine learning refinement of the NSQIP risk calculator: who survives the "Hail Mary" case?</article-title>
          <source>J Am Coll Surg</source>
          <year>2022</year>
          <month>04</month>
          <day>01</day>
          <volume>234</volume>
          <issue>4</issue>
          <fpage>652</fpage>
          <lpage>659</lpage>
          <pub-id pub-id-type="doi">10.1097/XCS.0000000000000108</pub-id>
          <pub-id pub-id-type="medline">35290285</pub-id>
          <pub-id pub-id-type="pii">00019464-202204000-00029</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dalton</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kurz</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Turan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mascha</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Sessler</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Saager</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Development and validation of a risk quantification index for 30-day postoperative mortality and morbidity in noncardiac surgical patients</article-title>
          <source>Anesthesiology</source>
          <year>2011</year>
          <month>06</month>
          <volume>114</volume>
          <issue>6</issue>
          <fpage>1336</fpage>
          <lpage>44</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://pubs.asahq.org/anesthesiology/article-lookup/doi/10.1097/ALN.0b013e318219d5f9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/ALN.0b013e318219d5f9</pub-id>
          <pub-id pub-id-type="medline">21519230</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hashimoto</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Witkowski</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Meireles</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Rosman</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Artificial intelligence in anesthesiology: current techniques, clinical applications, and limitations</article-title>
          <source>Anesthesiology</source>
          <year>2020</year>
          <month>02</month>
          <volume>132</volume>
          <issue>2</issue>
          <fpage>379</fpage>
          <lpage>394</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://pubs.asahq.org/anesthesiology/article-lookup/doi/10.1097/ALN.0000000000002960"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/ALN.0000000000002960</pub-id>
          <pub-id pub-id-type="medline">31939856</pub-id>
          <pub-id pub-id-type="pii">00000542-202002000-00027</pub-id>
          <pub-id pub-id-type="pmcid">PMC7643051</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Weissman</surname>
              <given-names>GE</given-names>
            </name>
            <name name-style="western">
              <surname>Hubbard</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>Ungar</surname>
              <given-names>LH</given-names>
            </name>
            <name name-style="western">
              <surname>Harhay</surname>
              <given-names>MO</given-names>
            </name>
            <name name-style="western">
              <surname>Greene</surname>
              <given-names>CS</given-names>
            </name>
            <name name-style="western">
              <surname>Himes</surname>
              <given-names>BE</given-names>
            </name>
            <name name-style="western">
              <surname>Halpern</surname>
              <given-names>SD</given-names>
            </name>
          </person-group>
          <article-title>Inclusion of unstructured clinical text improves early prediction of death or prolonged ICU stay</article-title>
          <source>Crit Care Med</source>
          <year>2018</year>
          <month>07</month>
          <volume>46</volume>
          <issue>7</issue>
          <fpage>1125</fpage>
          <lpage>1132</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29629986"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/CCM.0000000000003148</pub-id>
          <pub-id pub-id-type="medline">29629986</pub-id>
          <pub-id pub-id-type="pmcid">PMC6005735</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Yin</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zeng</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Yuan</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Combining structured and unstructured data for predictive models: a deep learning approach</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2020</year>
          <month>10</month>
          <day>29</day>
          <volume>20</volume>
          <issue>1</issue>
          <fpage>280</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/s12911-020-01297-6"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12911-020-01297-6</pub-id>
          <pub-id pub-id-type="medline">33121479</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12911-020-01297-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC7596962</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Marafino</surname>
              <given-names>BJ</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Davies</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Thombley</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Luft</surname>
              <given-names>HS</given-names>
            </name>
            <name name-style="western">
              <surname>Sing</surname>
              <given-names>DC</given-names>
            </name>
            <name name-style="western">
              <surname>Kazi</surname>
              <given-names>DS</given-names>
            </name>
            <name name-style="western">
              <surname>DeJong</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Boscardin</surname>
              <given-names>WJ</given-names>
            </name>
            <name name-style="western">
              <surname>Dean</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Dudley</surname>
              <given-names>RA</given-names>
            </name>
          </person-group>
          <article-title>Validation of prediction models for critical care outcomes using natural language processing of electronic health record data</article-title>
          <source>JAMA Netw Open</source>
          <year>2018</year>
          <month>12</month>
          <day>07</day>
          <volume>1</volume>
          <issue>8</issue>
          <fpage>e185097</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://jamanetwork.com/journals/jamanetworkopen/fullarticle/10.1001/jamanetworkopen.2018.5097"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jamanetworkopen.2018.5097</pub-id>
          <pub-id pub-id-type="medline">30646310</pub-id>
          <pub-id pub-id-type="pii">2719128</pub-id>
          <pub-id pub-id-type="pmcid">PMC6324323</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Devlin</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Toutanova</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Bert: Pre-training of deep bidirectional transformers for language understanding</article-title>
          <source>arXiv preprint</source>
          <year>2018</year>
          <month>10</month>
          <day>11</day>
          <pub-id pub-id-type="doi">10.48550/arXiv.1810.04805</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <collab>Arnaud</collab>
            <name name-style="western">
              <surname>Elbattah</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gignon</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Dequen</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Learning embeddings from free-text triage notes using pretrained transformer models</article-title>
          <year>2022</year>
          <conf-name>Proceedings of the 15th International Joint Conference on Biomedical Engineering Systems and Technologies - Scale-IT-up</conf-name>
          <conf-date>2022</conf-date>
          <conf-loc>Vienna</conf-loc>
          <fpage>835</fpage>
          <pub-id pub-id-type="doi">10.5220/0011012800003123</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kades</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Sellner</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Koehler</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Full</surname>
              <given-names>PM</given-names>
            </name>
            <name name-style="western">
              <surname>Lai</surname>
              <given-names>TYE</given-names>
            </name>
            <name name-style="western">
              <surname>Kleesiek</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Maier-Hein</surname>
              <given-names>KH</given-names>
            </name>
          </person-group>
          <article-title>Adapting bidirectional encoder representations from transformers (BERT) to assess clinical semantic textual similarity: algorithm development and validation study</article-title>
          <source>JMIR Med Inform</source>
          <year>2021</year>
          <month>02</month>
          <day>03</day>
          <volume>9</volume>
          <issue>2</issue>
          <fpage>e22795</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2021/2/e22795/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/22795</pub-id>
          <pub-id pub-id-type="medline">33533728</pub-id>
          <pub-id pub-id-type="pii">v9i2e22795</pub-id>
          <pub-id pub-id-type="pmcid">PMC7889424</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Loper</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Bird</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Nltk: The natural language toolkit</article-title>
          <source>arXiv</source>
          <year>2002</year>
          <month>05</month>
          <day>17</day>
          <pub-id pub-id-type="doi">10.48550/arXiv.cs/0205028</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Breiman</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Random forests</article-title>
          <source>Mach Learn</source>
          <year>2001</year>
          <month>10</month>
          <volume>45</volume>
          <issue>1</issue>
          <fpage>5</fpage>
          <lpage>32</lpage>
          <pub-id pub-id-type="doi">10.1023/A:1010933404324</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Guestrin</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Xgboost: a scalable tree boosting system</article-title>
          <year>2016</year>
          <month>08</month>
          <conf-name>Proceedings of the 22nd ACM SIGKDD international conference on knowledge discovery and data mining</conf-name>
          <conf-date>August 13-17, 2016</conf-date>
          <conf-loc>San Francisco, CA</conf-loc>
          <fpage>785</fpage>
          <lpage>794</lpage>
          <pub-id pub-id-type="doi">10.1145/2939672.2939785</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chawla</surname>
              <given-names>NV</given-names>
            </name>
            <name name-style="western">
              <surname>Bowyer</surname>
              <given-names>KW</given-names>
            </name>
            <name name-style="western">
              <surname>Hall</surname>
              <given-names>LO</given-names>
            </name>
            <name name-style="western">
              <surname>Kegelmeyer</surname>
              <given-names>WP</given-names>
            </name>
          </person-group>
          <article-title>SMOTE: Synthetic Minority Over-sampling Technique</article-title>
          <source>J Artif Intell Res</source>
          <year>2002</year>
          <month>06</month>
          <day>01</day>
          <volume>16</volume>
          <fpage>321</fpage>
          <lpage>357</lpage>
          <pub-id pub-id-type="doi">10.1613/jair.953</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Alsentzer</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Murphy</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Boag</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Jin</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Naumann</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>McDermott</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Publicly available clinical BERT embeddings</article-title>
          <source>arXiv</source>
          <year>2019</year>
          <month>04</month>
          <day>06</day>
          <pub-id pub-id-type="doi">10.18653/v1/w19-1909</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Saito</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Rehmsmeier</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>The precision-recall plot is more informative than the ROC plot when evaluating binary classifiers on imbalanced datasets</article-title>
          <source>PLoS One</source>
          <year>2015</year>
          <month>3</month>
          <day>4</day>
          <volume>10</volume>
          <issue>3</issue>
          <fpage>e0118432</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0118432"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0118432</pub-id>
          <pub-id pub-id-type="medline">25738806</pub-id>
          <pub-id pub-id-type="pii">PONE-D-14-26790</pub-id>
          <pub-id pub-id-type="pmcid">PMC4349800</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ozenne</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Subtil</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Maucort-Boulch</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>The precision-recall curve overcame the optimism of the receiver operating characteristic curve in rare diseases</article-title>
          <source>J Clin Epidemiol</source>
          <year>2015</year>
          <month>08</month>
          <volume>68</volume>
          <issue>8</issue>
          <fpage>855</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1016/j.jclinepi.2015.02.010"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jclinepi.2015.02.010</pub-id>
          <pub-id pub-id-type="medline">25881487</pub-id>
          <pub-id pub-id-type="pii">S0895-4356(15)00106-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>DeLong</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>DeLong</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Clarke-Pearson</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Comparing the areas under two or more correlated receiver operating characteristic curves: a nonparametric approach</article-title>
          <source>Biometrics</source>
          <year>1988</year>
          <month>09</month>
          <volume>44</volume>
          <issue>3</issue>
          <fpage>837</fpage>
          <pub-id pub-id-type="doi">10.2307/2531595</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Boyd</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Eng</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Page</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Blockeel</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Kersting</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Nijssen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Železný</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Area under the precision-recall curve: point estimates and confidence intervals</article-title>
          <source>Machine Learning and Knowledge Discovery in Databases</source>
          <year>2013</year>
          <publisher-loc>Berlin, Heidelberg</publisher-loc>
          <publisher-name>Springer</publisher-name>
          <fpage>451</fpage>
          <lpage>466</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Maaten</surname>
              <given-names>LVD</given-names>
            </name>
            <name name-style="western">
              <surname>Hinton</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Visualizing data using t-SNE</article-title>
          <source>J Mach Learn Res</source>
          <year>2008</year>
          <volume>9</volume>
          <fpage>2579</fpage>
          <lpage>2605</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jin</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bahadori</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Colak</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bhatia</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Celikkaya</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Bhakta</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Senthivel</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Khalilia</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Navarro</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Improving hospital mortality prediction with medical named entities and multimodal learning</article-title>
          <source>arXiv</source>
          <year>2018</year>
          <month>11</month>
          <day>29</day>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pedregosa</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Varoquaux</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Gramfort</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Michel</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Kossaifi</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Thirion</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Grisel</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Blondel</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Prettenhofer</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Weiss</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Dubourg</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Vanderplas</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Passos</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Cournapeau</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Brucher</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Perrot</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Duchesnay</surname>
              <given-names>É</given-names>
            </name>
          </person-group>
          <article-title>Scikit-learn: machine learning in Python</article-title>
          <source>J Mach Learn Res</source>
          <year>2011</year>
          <month>02</month>
          <day>01</day>
          <volume>12</volume>
          <fpage>2825</fpage>
          <lpage>2830</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Paszke</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gross</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Massa</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Lerer</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bradbury</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chanan</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Killeen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Gimelshein</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Antiga</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Pytorch: an imperative style, high-performance deep learning library</article-title>
          <year>2019</year>
          <conf-name>33rd Conference on Neural Information Processing Systems (NeurIPS)</conf-name>
          <conf-date>Dec 8-14, 2019</conf-date>
          <conf-loc>Vancouver, Canada</conf-loc>
          <fpage>A</fpage>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fritz</surname>
              <given-names>BA</given-names>
            </name>
            <name name-style="western">
              <surname>Abdelhack</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>King</surname>
              <given-names>CR</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Avidan</surname>
              <given-names>MS</given-names>
            </name>
          </person-group>
          <article-title>Update to 'Deep-learning model for predicting 30-day postoperative mortality' (Br J Anaesth 2019; 123: 688-95)</article-title>
          <source>Br J Anaesth</source>
          <year>2020</year>
          <month>08</month>
          <volume>125</volume>
          <issue>2</issue>
          <fpage>e230</fpage>
          <lpage>e231</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0007-0912(20)30222-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.bja.2020.04.010</pub-id>
          <pub-id pub-id-type="medline">32389391</pub-id>
          <pub-id pub-id-type="pii">S0007-0912(20)30222-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC7844347</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Pareek</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Seyyedi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Banerjee</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Lungren</surname>
              <given-names>MP</given-names>
            </name>
          </person-group>
          <article-title>Fusion of medical imaging and electronic health records using deep learning: a systematic review and implementation guidelines</article-title>
          <source>NPJ Digit Med</source>
          <year>2020</year>
          <month>10</month>
          <day>16</day>
          <volume>3</volume>
          <issue>1</issue>
          <fpage>136</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41746-020-00341-z"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41746-020-00341-z</pub-id>
          <pub-id pub-id-type="medline">33083571</pub-id>
          <pub-id pub-id-type="pii">341</pub-id>
          <pub-id pub-id-type="pmcid">PMC7567861</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bear Don't Walk Iv</surname>
              <given-names>OJ</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Perotte</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Elhadad</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Clinically relevant pretraining is all you need</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2021</year>
          <month>08</month>
          <day>13</day>
          <volume>28</volume>
          <issue>9</issue>
          <fpage>1970</fpage>
          <lpage>1976</lpage>
          <pub-id pub-id-type="doi">10.1093/jamia/ocab086</pub-id>
          <pub-id pub-id-type="medline">34151966</pub-id>
          <pub-id pub-id-type="pii">6307175</pub-id>
          <pub-id pub-id-type="pmcid">PMC8363791</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Khoshgoftaar</surname>
              <given-names>TM</given-names>
            </name>
          </person-group>
          <article-title>Survey on deep learning with class imbalance</article-title>
          <source>J Big Data</source>
          <year>2019</year>
          <month>3</month>
          <day>19</day>
          <volume>6</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>54</lpage>
          <pub-id pub-id-type="doi">10.1186/s40537-019-0192-5</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
