<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="review-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id><journal-id journal-id-type="publisher-id">medinform</journal-id><journal-id journal-id-type="index">7</journal-id><journal-title>JMIR Medical Informatics</journal-title><abbrev-journal-title>JMIR Med Inform</abbrev-journal-title><issn pub-type="epub">2291-9694</issn></journal-meta><article-meta><article-id pub-id-type="publisher-id">50642</article-id><article-id pub-id-type="doi">10.2196/50642</article-id><title-group><article-title>Predicting Hypoxia Using Machine Learning: Systematic Review</article-title></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Pigat</surname><given-names>Lena</given-names></name><degrees>MPH</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Geisler</surname><given-names>Benjamin P</given-names></name><degrees>MD, MPH</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Sheikhalishahi</surname><given-names>Seyedmostafa</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Sander</surname><given-names>Julia</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Kaspar</surname><given-names>Mathias</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Schmutz</surname><given-names>Maximilian</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Rohr</surname><given-names>Sven Olaf</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Wild</surname><given-names>Carl Mathis</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Goss</surname><given-names>Sebastian</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Zaghdoudi</surname><given-names>Sarra</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Hinske</surname><given-names>Ludwig Christian</given-names></name><degrees>Prof Dr</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff4">4</xref></contrib></contrib-group><aff id="aff1"><institution>Digital Medicine, University Hospital of Augsburg</institution>, <addr-line>Augsburg</addr-line>, <country>Germany</country></aff><aff id="aff2"><institution>Hematology and Oncology, University Hospital of Augsburg</institution>, <addr-line>Augsburg</addr-line>, <country>Germany</country></aff><aff id="aff3"><institution>Gynecology and Obstetrics, University Hospital of Augsburg</institution>, <addr-line>Augsburg</addr-line>, <country>Germany</country></aff><aff id="aff4"><institution>Department of Anaesthesiology, LMU University Hospital, LMU Munich</institution>, <addr-line>Munich</addr-line>, <country>Germany</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Lovis</surname><given-names>Christian</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Price</surname><given-names>Carrie</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Maharjan</surname><given-names>Jenish</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Lena Pigat, MPH<email>lena.pigat@uk-augsburg.de</email></corresp></author-notes><pub-date pub-type="collection"><year>2024</year></pub-date><pub-date pub-type="epub"><day>2</day><month>2</month><year>2024</year></pub-date><volume>12</volume><elocation-id>e50642</elocation-id><history><date date-type="received"><day>17</day><month>07</month><year>2023</year></date><date date-type="rev-recd"><day>02</day><month>11</month><year>2023</year></date><date date-type="accepted"><day>05</day><month>11</month><year>2023</year></date></history><copyright-statement>&#x00A9; Lena Pigat, Benjamin P Geisler, Seyedmostafa Sheikhalishahi, Julia Sander, Mathias Kaspar, Maximilian Schmutz, Sven Olaf Rohr, Carl Mathis Wild, Sebastian Goss, Sarra Zaghdoudi, Ludwig Christian Hinske. Originally published in JMIR Medical Informatics (<ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org">https://medinform.jmir.org</ext-link>), 2.2.2024. </copyright-statement><copyright-year>2024</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org/">https://medinform.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://medinform.jmir.org/2024/1/e50642"/><abstract><sec><title>Background</title><p>Hypoxia is an important risk factor and indicator for the declining health of inpatients. Predicting future hypoxic events using machine learning is a prospective area of study to facilitate time-critical interventions to counter patient health deterioration.</p></sec><sec><title>Objective</title><p>This systematic review aims to summarize and compare previous efforts to predict hypoxic events in the hospital setting using machine learning with respect to their methodology, predictive performance, and assessed population.</p></sec><sec sec-type="methods"><title>Methods</title><p>A systematic literature search was performed using Web of Science, Ovid with Embase and MEDLINE, and Google Scholar. Studies that investigated hypoxia or hypoxemia of hospitalized patients using machine learning models were considered. Risk of bias was assessed using the Prediction Model Risk of Bias Assessment Tool.</p></sec><sec sec-type="results"><title>Results</title><p>After screening, a total of 12 papers were eligible for analysis, from which 32 models were extracted. The included studies showed a variety of population, methodology, and outcome definition. Comparability was further limited due to unclear or high risk of bias for most studies (10/12, 83%). The overall predictive performance ranged from moderate to high. Based on classification metrics, deep learning models performed similar to or outperformed conventional machine learning models within the same studies. Models using only prior peripheral oxygen saturation as a clinical variable showed better performance than models based on multiple variables, with most of these studies (2/3, 67%) using a long short-term memory algorithm.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>Machine learning models provide the potential to accurately predict the occurrence of hypoxic events based on retrospective data. The heterogeneity of the studies and limited generalizability of their results highlight the need for further validation studies to assess their predictive performance.</p></sec><sec><title>Trial Registration</title><p>PROSPERO CRD42023381710; <ext-link ext-link-type="uri" xlink:href="https://www.crd.york.ac.uk/prospero/display_record.php?RecordID=381710">https://www.crd.york.ac.uk/prospero/display_record.php?RecordID=381710</ext-link></p></sec></abstract><kwd-group><kwd>artificial intelligence</kwd><kwd>machine learning</kwd><kwd>hypoxia</kwd><kwd>hypoxemia</kwd><kwd>anoxia</kwd><kwd>hypoxic</kwd><kwd>deterioration</kwd><kwd>oxygen</kwd><kwd>prediction</kwd><kwd>systematic review</kwd><kwd>review methods</kwd><kwd>review methodology</kwd><kwd>systematic</kwd><kwd>hospital</kwd><kwd>predict</kwd><kwd>prediction</kwd><kwd>predictive</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>A key factor in risk assessment for sequelae and mortality in hospitalized patients is hypoxia. It describes the decreased availability of oxygen in specific body regions (tissue hypoxia) or in the body as a whole (general hypoxia) [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref3">3</xref>]. To prevent general hypoxia and to detect deterioration quickly, hypoxemia monitoring is commonly performed using pulse oximetry as a continuous and noninvasive assessment, especially in the intensive care unit (ICU) and operating room (OR) [<xref ref-type="bibr" rid="ref4">4</xref>]. Hypoxemia is defined as an abnormally low level of blood oxygen. In addition to pulse oximetry, it can be assessed through an arterial blood gas analysis or imaging techniques, which can additionally serve as reliable indicators of subsequent tissue damage [<xref ref-type="bibr" rid="ref3">3</xref>]. A multinational, multicenter study including 117 ICUs found a hypoxemia prevalence of more than 50% among all ICU patients [<xref ref-type="bibr" rid="ref5">5</xref>]. The severity of hypoxemia was shown to be a direct risk factor for mortality in patients with hypoxemia. Being able to validly assess the individual risk of future hypoxemic and ultimately hypoxic events is therefore highly relevant.</p><p>To determine the risk or stage of a disease, artificial intelligence (AI) has been increasingly introduced into clinical routine in recent years to exploit underlying causal mechanisms that may not be accessible to humans. As a prime example, machine learning (ML) as a discipline of AI is being successfully used for cancer tissue classification in medical imaging [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref7">7</xref>]. ML is also already being applied for prognostic purposes, for example, in the examination of patient characteristics to identify an increased risk of deterioration tendencies such as atrial fibrillation and of developing sequelae of diabetes mellitus or hereditary diseases [<xref ref-type="bibr" rid="ref8">8</xref>-<xref ref-type="bibr" rid="ref10">10</xref>].</p><p>Efforts to date of using ML to predict hypoxic events are being conducted in a variety of settings and demonstrate diverse approaches and methodologies. Studies differ significantly in terms of the patient population assessed, definition of prediction outcome, features used to predict hypoxia, and ML algorithms used, thus increasing the difficulty to generalize the conclusions of individual studies. It is therefore challenging to compare and evaluate these studies comprehensively.</p><p>This review aimed to provide a systematic and structured overview of the existing approaches to predict hypoxic events in the hospital setting. Our specific objectives were to summarize the different populations, model details, and prediction performance to capture the current state of available models; identify gaps and limitations; highlight promising approaches and methodologies; and provide guidance for future research in this area.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Protocol</title><p>This review was reported in accordance with the PRISMA (Preferred Reporting Items for Systematic Reviews and Meta-Analyses) statement (<xref ref-type="supplementary-material" rid="app2">Checklist 1</xref>) [<xref ref-type="bibr" rid="ref11">11</xref>]. The protocol was registered in the International Prospective Register of Systematic Reviews (PROSPERO) prior to data extraction (reference CRD42023381710).</p></sec><sec id="s2-2"><title>Search Strategy</title><p>Relevant literature was searched for using Ovid with Embase and MEDLINE, Web of Science, and Google Scholar. Although the prior 2 databases were searched via their web query interface, Google Scholar was searched using the software Publish or Perish, as it allows for more complex queries [<xref ref-type="bibr" rid="ref12">12</xref>].</p><p>Publications on the topic of hypoxia prediction using ML were searched by creating 2 sets of search terms, with the first set addressing hypoxia (including hypoxemia) and the second set addressing ML. With the identified search engines, the intersection of these 2 groups was then searched for, adjusting the syntax according to the search logic of the respective search engine. If Medical Subject Headings or thesaurus entries were available, the selected terms were included in the search logic accordingly. For the searches using Ovid and Web of Science, the search results were filtered to only include studies that did not use wearables for data collection and that were published in the English and German languages. Those filters were not applicable for the search of Google Scholar using Publish or Perish.</p><p>The selection and deduplication process was performed using Covidence (Veritas Health Innovation Ltd), with undetected duplicates removed by hand [<xref ref-type="bibr" rid="ref13">13</xref>]. The search results of all databases were included, and duplicates were removed. The abstracts of the remaining results were independently screened by 2 reviewers. Results that met the selection criteria were reviewed in their entirety for the assessment of eligibility by 2 reviewers. In addition, references of the included studies were also screened for studies that meet the inclusion criteria and were subsequently included where appropriate. The search strategy was developed by 1 team member and reviewed by another with expertise in conducting systematic reviews. The detailed search strategy can be found in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p></sec><sec id="s2-3"><title>Selection Criteria</title><p>Primary outcomes were model features, definition of the prediction end point, and predictive performance. Studies developing ML models to predict hypoxia or hypoxemia in continuously monitored human inpatients were included. Both studies of patients who were mechanically ventilated and spontaneously breathing were included. Hypoxia could be a main outcome or an auxiliary goal.</p><p>Studies that assessed hypoxia only in specific tissues were excluded, as this review addresses the prediction of general hypoxia as an important indicator of critical illness for risk stratification and early detection of patients at risk of acute health deterioration. Additionally, studies focusing on a population &#x003C;18 years of age were not included, since the distinct etiologies, risk factors, and clinical presentations of hypoxia in pediatric patients may limit the generalizability of the findings to the population of adult inpatients.</p><p>The definition of the end point of hypoxia prediction (eg, specific oximetry thresholds or time frames of prediction) was left unspecified due to the expected heterogeneity in the approaches. The patient population of the included studies was not limited to a specific hospital setting or ward.</p></sec><sec id="s2-4"><title>Data Extraction and Risk of Bias</title><p>Data extracted included the data source; sample size and setting; model variables; prediction end point and time frame; type of model; and the predictive performance of each model, usually expressed as classification measures such as sensitivity, specificity, positive predictive value (PPV), negative predictive value (NPV), or area under the receiver operating characteristics (AUROC). Missing values of performance measures and summary data influenced the risk-of-bias assessment.</p><p>A qualitative synthesis of the included studies was conducted. For this purpose, an overview of all studies was provided in a narrative summary by categorizing them into subgroups based on the population, model features, model types, and setting. For each study, the model with the highest performance according to performance metrics was selected to summarize AUROC, sensitivity, specificity, PPV, and NPV as the most reported performance measures. In the case of studies that examined multiple prediction outcomes, the outcome definition that is the most similar to those of the other studies was chosen for reporting. For studies reporting 1 performance value per patient, a mean value was calculated for each measure. Because of the heterogeneous study designs and characteristics of the data used, as well as missing summary data of model performances, conducting a meta-analysis was not feasible.</p><p>To assess the risk of bias, quality, and applicability of the studies included, Prediction Model Risk of Bias Assessment Tool (PROBAST) was used [<xref ref-type="bibr" rid="ref14">14</xref>]. This tool is specifically designed to investigate the quality of prediction models and has become increasingly prevalent in systematic reviews in recent years. Assessment outcomes were evaluated based on 4 segments&#x2014;participants, predictors, outcome, and analysis&#x2014;and were determined by a comprehensive questionnaire. Risk of bias was rated as high, low, or unclear. If 1 domain suggested a high risk of bias, the overall risk of bias for that study was considered high. The assessment was conducted by a single researcher, with a second researcher reviewing the process independently.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Literature Search</title><p>The initial search retrieved a total of 3734 studies (<xref ref-type="fig" rid="figure1">Figure 1</xref>). After removing a total of 700 duplicates, title and abstract screening identified the full texts of 31 studies for the assessment of eligibility. Of these, 19 studies were excluded due to not being a full study (n=6), not assessing a hypoxia outcome (n=4), not using machine learning (n=3), inability to obtain the full text (n=2), having an outpatient setting (n=2), having a pediatric patient population (n=1), and being in the Chinese language (n=1). The remaining 12 studies were included in the review.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>PRISMA (Preferred Reporting Items for Systematic Reviews and Meta-Analyses) flow diagram.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v12i1e50642_fig01.png"/></fig></sec><sec id="s3-2"><title>Study Characteristics</title><sec id="s3-2-1"><title>Overview</title><p><xref ref-type="table" rid="table1">Table 1</xref> presents the characteristics of all included studies and gives an overview of the best-performing model in each study, divided into conventional ML and deep learning models for studies including both. The studies were conducted in the United States [<xref ref-type="bibr" rid="ref15">15</xref>-<xref ref-type="bibr" rid="ref22">22</xref>], China [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>], Germany [<xref ref-type="bibr" rid="ref25">25</xref>], and the United Arab Emirates [<xref ref-type="bibr" rid="ref26">26</xref>]. Half (6/12, 50%) of them were published after 2020 [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref26">26</xref>]. In 3 (25%) of the 12 studies, the prediction of hypoxia was a side or auxiliary goal [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref21">21</xref>], whereas it was the main study aim for the other studies.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Study characteristics of the reviewed studies (n=12). The model with the highest performance in each study is reported. For studies using both conventional machine learning and deep learning models, each best-performing model is reported. For studies examining multiple prediction outcomes, the outcome definition that is the most similar to those of other studies was chosen for reporting. For studies reporting 1 performance value per patient, a mean value was calculated.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Reference</td><td align="left" valign="bottom">Sample size n</td><td align="left" valign="bottom">Clinical variables, n</td><td align="left" valign="bottom">Prediction end point</td><td align="left" valign="bottom">Model</td><td align="left" valign="bottom">Performance</td><td align="left" valign="bottom">External validation</td></tr></thead><tbody><tr><td align="left" valign="top">Annapragada et al [<xref ref-type="bibr" rid="ref15">15</xref>] (2021)</td><td align="left" valign="top">2435</td><td align="left" valign="top">1</td><td align="left" valign="top">SpO<sub>2</sub><sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup> &#x003C;92% within the next 5 and 30 min (occurrence and magnitude of hypoxemic events)</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>LSTM<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup></p></list-item></list></td><td align="left" valign="top"><list list-type="bullet"><list-item><p>PPV<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup>: 0.94</p></list-item><list-item><p>Sensitivity: 0.80</p></list-item><list-item><p>Specificity: 0.99</p></list-item></list></td><td align="left" valign="top">Yes</td></tr><tr><td align="left" valign="top">Chen et al [<xref ref-type="bibr" rid="ref16">16</xref>] (2021)</td><td align="left" valign="top">57,171</td><td align="left" valign="top">21</td><td align="left" valign="top">SaO<sub>2</sub><sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup> &#x003C;93% within the next 5 min</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>GBT<sup><xref ref-type="table-fn" rid="table1fn5">e</xref></sup></p></list-item></list></td><td align="left" valign="top"><list list-type="bullet"><list-item><p>AUROC<sup><xref ref-type="table-fn" rid="table1fn6">f</xref></sup>: 0.89</p></list-item></list></td><td align="left" valign="top">Yes</td></tr><tr><td align="left" valign="top">ElMoaqet et al [<xref ref-type="bibr" rid="ref17">17</xref>] (2014)</td><td align="left" valign="top">119</td><td align="left" valign="top">1</td><td align="left" valign="top">SpO<sub>2</sub> &#x2264;89% within the next 20 and 60 s</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>Lin<sup><xref ref-type="table-fn" rid="table1fn7">g</xref></sup></p></list-item></list></td><td align="left" valign="top"><list list-type="bullet"><list-item><p>AUROC: 0.93</p></list-item></list></td><td align="left" valign="top">No</td></tr><tr><td align="left" valign="top">Erion et al [<xref ref-type="bibr" rid="ref18">18</xref>] (2017)</td><td align="left" valign="top">57,173</td><td align="left" valign="top">1</td><td align="left" valign="top">SpO<sub>2</sub> &#x2264;92% within the next 5 min</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>LSTM</p></list-item><list-item><p>GBT</p></list-item></list></td><td align="left" valign="top"><list list-type="bullet"><list-item><p>LSTM AUROC: 0.87</p></list-item><list-item><p>GBT AUROC: 0.86</p></list-item></list></td><td align="left" valign="top">No</td></tr><tr><td align="left" valign="top">Geng et al [<xref ref-type="bibr" rid="ref23">23</xref>] (2018)</td><td align="left" valign="top">308</td><td align="left" valign="top">3</td><td align="left" valign="top">SpO<sub>2</sub> &#x003C;90% for any duration during the endoscopic procedure</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>LR<sup><xref ref-type="table-fn" rid="table1fn8">h</xref></sup></p></list-item></list></td><td align="left" valign="top"><list list-type="bullet"><list-item><p>AUROC: 0.76</p></list-item></list></td><td align="left" valign="top">No</td></tr><tr><td align="left" valign="top">Geng et al [<xref ref-type="bibr" rid="ref24">24</xref>] (2019)</td><td align="left" valign="top">220</td><td align="left" valign="top">3</td><td align="left" valign="top">SpO<sub>2</sub> &#x003C;90% for any duration during the endoscopy procedure</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>ANN<sup><xref ref-type="table-fn" rid="table1fn9">i</xref></sup></p></list-item></list></td><td align="left" valign="top"><list list-type="bullet"><list-item><p>AUROC: 0.80</p></list-item></list></td><td align="left" valign="top">No</td></tr><tr><td align="left" valign="top">Lam et al [<xref ref-type="bibr" rid="ref19">19</xref>] (2022)</td><td align="left" valign="top">39,630</td><td align="left" valign="top">26</td><td align="left" valign="top">SpO<sub>2</sub> &#x003C;91% and &#x003C;96% after algorithm evaluation and any time during hospitalization</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>XGB<sup><xref ref-type="table-fn" rid="table1fn10">j</xref></sup></p></list-item><list-item><p>RNN<sup><xref ref-type="table-fn" rid="table1fn11">k</xref></sup></p></list-item></list></td><td align="left" valign="top"><list list-type="bullet"><list-item><p>XGB AUROC: 0.64</p></list-item><list-item><p>RNN AUROC: 0.64</p></list-item></list></td><td align="left" valign="top">Yes</td></tr><tr><td align="left" valign="top">Lundberg et al [<xref ref-type="bibr" rid="ref20">20</xref>] (2018)</td><td align="left" valign="top">36,232</td><td align="left" valign="top">&#x003E;65</td><td align="left" valign="top">SpO<sub>2</sub> &#x2264;92% initial status and within the next 5 min</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>GBM<sup><xref ref-type="table-fn" rid="table1fn12">l</xref></sup></p></list-item></list></td><td align="left" valign="top"><list list-type="bullet"><list-item><p>AUROC: 0.90</p></list-item></list></td><td align="left" valign="top">No</td></tr><tr><td align="left" valign="top">Ren et al [<xref ref-type="bibr" rid="ref21">21</xref>] (2022)</td><td align="left" valign="top">17,818</td><td align="left" valign="top">3</td><td align="left" valign="top">PaO<sub>2</sub><sup><xref ref-type="table-fn" rid="table1fn13">m</xref></sup>/FiO<sub>2</sub><sup><xref ref-type="table-fn" rid="table1fn14">n</xref></sup> &#x2264;150 at any time during ventilation</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>NN<sup><xref ref-type="table-fn" rid="table1fn15">o</xref></sup></p></list-item><list-item><p>LR</p></list-item></list></td><td align="left" valign="top"><list list-type="bullet"><list-item><p>NN AUROC: 0.83</p></list-item><list-item><p>LR AUROC: 0.81</p></list-item></list></td><td align="left" valign="top">Yes</td></tr><tr><td align="left" valign="top">Sippl et al [<xref ref-type="bibr" rid="ref25">25</xref>] (2017)</td><td align="left" valign="top">620</td><td align="left" valign="top">17, RF<sup><xref ref-type="table-fn" rid="table1fn16">p</xref></sup> and NN used subsets of 6 and 7</td><td align="left" valign="top">Presence and severity of temporary oxygen desaturation during anesthesia induction and intubation based on expert annotations</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>NN</p></list-item><list-item><p>RF</p></list-item></list></td><td align="left" valign="top"><list list-type="bullet"><list-item><p>NN sensitivity: 0.74</p></list-item><list-item><p>NN specificity: 0.93</p></list-item><list-item><p>RF sensitivity: 0.35</p></list-item><list-item><p>RF specificity: 0.99</p></list-item></list></td><td align="left" valign="top">No</td></tr><tr><td align="left" valign="top">Statsenko et al [<xref ref-type="bibr" rid="ref26">26</xref>] (2022)</td><td align="left" valign="top">605</td><td align="left" valign="top">2D and 3D diagnostic images of the chest</td><td align="left" valign="top">Markers of systemic oxygenation: functional (HR<sup><xref ref-type="table-fn" rid="table1fn17">q</xref></sup>, BR<sup><xref ref-type="table-fn" rid="table1fn18">r</xref></sup>, SBP<sup><xref ref-type="table-fn" rid="table1fn19">s</xref></sup>, and DBP<sup><xref ref-type="table-fn" rid="table1fn20">t</xref></sup>) and biochemical findings (SpO<sub>2</sub>, serum potassium level, and AG<sup><xref ref-type="table-fn" rid="table1fn21">u</xref></sup>)</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>CNN<sup><xref ref-type="table-fn" rid="table1fn22">v</xref></sup></p></list-item></list></td><td align="left" valign="top"><list list-type="bullet"><list-item><p>MAE<sup><xref ref-type="table-fn" rid="table1fn23">w</xref></sup>: mean 7.941% (SD 4.131%)</p></list-item></list></td><td align="left" valign="top">No</td></tr><tr><td align="left" valign="top">Xia et al [<xref ref-type="bibr" rid="ref22">22</xref>] (2022)</td><td align="left" valign="top">14,777</td><td align="left" valign="top">29</td><td align="left" valign="top">PaO<sub>2</sub> &#x003C;60 mm Hg after extubating</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>RF</p></list-item></list></td><td align="left" valign="top"><list list-type="bullet"><list-item><p>AUROC: 0.792</p></list-item></list></td><td align="left" valign="top">No</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>SpO<sub>2</sub>: peripheral oxygen saturation.</p></fn><fn id="table1fn2"><p><sup>b</sup>LSTM: long short-term memory.</p></fn><fn id="table1fn3"><p><sup>c</sup>PPV: positive predictive value.</p></fn><fn id="table1fn4"><p><sup>d</sup>SaO<sub>2</sub>: arterial oxygen saturation.</p></fn><fn id="table1fn5"><p><sup>e</sup>GBT: gradient boosted tree.</p></fn><fn id="table1fn6"><p><sup>f</sup>AUROC: area under the receiver operating characteristics.</p></fn><fn id="table1fn7"><p><sup>g</sup>Lin: linear regression.</p></fn><fn id="table1fn8"><p><sup>h</sup>LR: logistic regression.</p></fn><fn id="table1fn9"><p><sup>i</sup>ANN: artificial neural network.</p></fn><fn id="table1fn10"><p><sup>j</sup>XGB: extreme gradient boosting.</p></fn><fn id="table1fn11"><p><sup>k</sup>RNN: recurrent neural network.</p></fn><fn id="table1fn12"><p><sup>l</sup>GBM: gradient boosting machine.</p></fn><fn id="table1fn13"><p><sup>m</sup>PaO<sub>2</sub>: partial pressure of oxygen.</p></fn><fn id="table1fn14"><p><sup>n</sup>FiO<sub>2</sub>: fraction of inspired oxygen.</p></fn><fn id="table1fn15"><p><sup>o</sup>NN: neural network.</p></fn><fn id="table1fn16"><p><sup>p</sup>RF: random forest.</p></fn><fn id="table1fn17"><p><sup>q</sup>HR: heart rate.</p></fn><fn id="table1fn18"><p><sup>r</sup>BR: breath rate.</p></fn><fn id="table1fn19"><p><sup>s</sup>SBP: systolic blood pressure.</p></fn><fn id="table1fn20"><p><sup>t</sup>DBP: diastolic blood pressure.</p></fn><fn id="table1fn21"><p><sup>u</sup>AG: anion gap.</p></fn><fn id="table1fn22"><p><sup>v</sup>CNN: convolutional neural network.</p></fn><fn id="table1fn23"><p><sup>w</sup>MAE: mean averaged error to the range of values.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-2-2"><title>Data Sources and Population</title><p>Most studies (9/12, 75%) analyzed a large sample size of 500 or more patients [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref18">18</xref>-<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref26">26</xref>]. Data from the publicly available databases Medical Information Mart for Intensive Care and eICU Collaborative Research Database were used in 4 of the studies [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref22">22</xref>], whereas 3 studies relied on data collected via an anesthesia information management system (AIMS) [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref20">20</xref>]. AIMSs are widely adopted hardware and software solutions that are integrated into a hospital&#x2019;s electronic health record system and are used to manage and document a patient&#x2019;s perioperative measurements [<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref28">28</xref>]. The studies were set in the OR (n=5) [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>], the ICU (n=3) [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref22">22</xref>], and mixed or general care units (n=4) [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref26">26</xref>]. Of the 12 studies analyzed, 10 (83%) did not include patients with COVID-19 [<xref ref-type="bibr" rid="ref16">16</xref>-<xref ref-type="bibr" rid="ref25">25</xref>], whereas the remaining 2 (17%) studies either were performed only on patients who tested positive for COVID-19 or were externally validated on a COVID-19 cohort [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref26">26</xref>].</p></sec><sec id="s3-2-3"><title>ML Model Specifics</title><p><xref ref-type="fig" rid="figure2">Figure 2</xref> [<xref ref-type="bibr" rid="ref15">15</xref>-<xref ref-type="bibr" rid="ref26">26</xref>] gives an overview of the models and the number of variables used in each study. Exclusively conventional ML algorithms were applied in 5 of the identified studies [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref23">23</xref>], whereas 7 studies included deep learning algorithms [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref24">24</xref>-<xref ref-type="bibr" rid="ref26">26</xref>]. Models based on logistic regression were used most often (n=4) [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref21">21</xref>-<xref ref-type="bibr" rid="ref23">23</xref>], followed by artificial neural networks (n=3) [<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref25">25</xref>].</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Machine learning (ML) methods used by each study. ML methods (upper half) in gray: conventional ML; ML methods in black: deep learning. Studies are sorted by the number of clinical variables used. Studies in blue: 1 clinical variable; studies in green: 2-5 clinical variables; studies in yellow to red: &#x003E;5 clinical variables. ANN: artificial neural network; Autoreg: autoregressive model; CNN: convolutional neural network; DTW: dynamic time warping; GBM: gradient boosting machine; GBT: gradient boosted tree; kNN: k-nearest neighbor; Lin: linear regression; LR: logistic regression; LSTM: long short-term memory; RF: random forest; RNN: recurrent neural network; SVM: support vector machine; XGB: extreme gradient boosting.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v12i1e50642_fig02.png"/></fig><p>The number of clinical variables included ranged from 1 to over 65 different variables. The prediction of hypoxic events was based solely on prior peripheral oxygen saturation (SpO<sub>2</sub>) values in 3 studies [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref18">18</xref>], whereas 4 studies used 2 or 3 clinical variables as input [<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref26">26</xref>]. The remaining 5 studies relied on at least 6 variables [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref25">25</xref>]. The most frequently used variable sources were oximetry measurements (9/12, 75%) [<xref ref-type="bibr" rid="ref15">15</xref>-<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref25">25</xref>] and static patient characteristics such as age (5/12, 42%) [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref25">25</xref>]. Additionally, a single study relied on diagnostic images of the chest to make predictions [<xref ref-type="bibr" rid="ref26">26</xref>].</p><p>The prediction end point was defined by a threshold of SpO<sub>2</sub> between 89% and 92% for most of the studies (7/12, 58%) [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref17">17</xref>-<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>]. Thresholds of the partial pressure of oxygen, the arterial oxygen saturation, or the ratio of partial pressure of oxygen to the fraction of inspired oxygen were used in 3 other studies [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref22">22</xref>]. The remaining 2 studies assessed the presence and severity of hypoxia as defined by expert annotations and predicted functional markers of hypoxia, respectively [<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref26">26</xref>]. Defined time frames for prediction included the length of a certain procedure [<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref23">23</xref>-<xref ref-type="bibr" rid="ref25">25</xref>], any time after extubating [<xref ref-type="bibr" rid="ref22">22</xref>], and a set time window of 5 to 30 minutes [<xref ref-type="bibr" rid="ref15">15</xref>-<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref20">20</xref>].</p></sec><sec id="s3-2-4"><title>Performance</title><p>Most of the 12 studies reported sensitivity (n=9, 75%), specificity (n=8, 67%), or AUROC (n=9, 75%) as classification measures. Other performance indicators were PPV, NPV, area under the precision-recall curve, accuracy, and <italic>F</italic><sub>1</sub>-score. The most frequently reported performance measures of the best-performing model in each study are summarized in a heat map (<xref ref-type="fig" rid="figure3">Figure 3</xref> [<xref ref-type="bibr" rid="ref15">15</xref>-<xref ref-type="bibr" rid="ref26">26</xref>]). The reported performance measures of 1 study were based on 10 individual patients since the focus of the study was to propose a performance metric and therefore have limited informative value [<xref ref-type="bibr" rid="ref17">17</xref>]. One other study only reported the proportion of the mean averaged error to the range of values [<xref ref-type="bibr" rid="ref26">26</xref>].</p><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Heat map of performance measures, sorted by AUROC. The performance of the best-performing model in each study is presented. In the case of studies that examined multiple prediction outcomes, the outcome definition that is the most similar to the other studies was chosen for reporting. For studies stating 1 performance value per patient, the metrics represent the mean value. For 3 of the included studies, hypoxia prediction was not the main study aim [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref21">21</xref>]. The reported performance measures of 1 study were based on 10 individual patients and therefore have limited informative value. One study only reported the proportion of the mean averaged error to the range of values. AUROC: area under the receiver operating characteristics; NPV: negative predictive value; PPV: positive predictive value.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v12i1e50642_fig03.png"/></fig><p>Of the 9 studies reporting AUROC, 8 (89%) showed a value higher than 0.75 [<xref ref-type="bibr" rid="ref16">16</xref>-<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref20">20</xref>-<xref ref-type="bibr" rid="ref24">24</xref>]. This included 3 studies that showed a significant trade-off between sensitivity and specificity [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref24">24</xref>]. The overall performance was moderate or high with respect to classification metrics, both in studies performing the prediction task as the main study aim and in studies predicting hypoxia as a side or auxiliary goal. In studies drawing a comparison to anesthesiologist decisions, the prediction models alone or anesthesiologists using those models outperformed anesthesiologists without access to the model [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref20">20</xref>].</p><p>Deep learning and conventional ML are not directly comparable as they are not being applied on the same data set and the performance metrics are not consistently reported. However, in all studies comparing the 2 approaches, deep learning models showed similar or better performance than conventional ML models considering classification metrics [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref25">25</xref>]. Additionally, models only using prior SpO<sub>2</sub> data as a variable tended to outperform models using more clinical variables [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref18">18</xref>]. Two (67%) of the 3 studies only using prior SpO<sub>2</sub> data applied a long short-term memory (LSTM) algorithm, 1 of which was able to predict the detailed trend of the SpO<sub>2</sub> waveform [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref18">18</xref>]. Multitask learning for the prediction of related end points was implemented in 1 study, showing improved performance with an increasing number of tasks [<xref ref-type="bibr" rid="ref19">19</xref>]. Approaches for providing explainability of their prediction outcome were presented in 2 studies, with 1 offering a real-time prediction tool displaying the contributing factors of an individual patient&#x2019;s hypoxemia risk within the next 5 minutes [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref20">20</xref>].</p></sec></sec><sec id="s3-3"><title>Risk-of-Bias Assessment</title><p>PROBAST was used to assess the risk of bias and applicability of each study. In the case of external validation, the assessment for that validation was performed separately. An overview of the overall and segment ratings of all 12 studies analyzed are shown in <xref ref-type="fig" rid="figure4">Figure 4</xref>. The overall risk of bias was rated as high or unclear for most of the studies (10/12, 83%) [<xref ref-type="bibr" rid="ref16">16</xref>-<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref23">23</xref>-<xref ref-type="bibr" rid="ref26">26</xref>]. Unclear or high risk of bias ratings were mainly due to missing details of the procedure as well as unclear or unfitting timing of predictors or outcomes. External validation was only performed in 4 of the studies [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref21">21</xref>], whereas the other 8 studies relied on internal validation, primarily using random split samples and cross-validation [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref22">22</xref>-<xref ref-type="bibr" rid="ref26">26</xref>].</p><fig position="float" id="figure4"><label>Figure 4.</label><caption><p>Risk-of-bias assessment for all studies (n=12) based on 4 segments. The graph shows the number of studies with low, high, and unclear risk of bias by the author&#x2019;s assessment using PROBAST (Prediction Model Risk of Bias Assessment Tool).</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v12i1e50642_fig04.png"/></fig></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>In this systematic review, we identified and summarized 12 studies predicting hypoxic events or markers for hypoxia. The approaches proved to be highly diverse both in their assessment and definition of a hypoxic outcome as well as in the variables and model types used. Therefore, the comparability between studies was limited by the high variability of approaches, such as the variety of settings involving different influences on blood oxygen saturation (eg, sedation during surgery).</p><p>The data used to develop the models were primarily obtained from publicly available databases or directly from hospitals&#x2019; AIMSs or electronic health record systems. Settings for the prediction included the OR, ICU, and general care units. The implemented ML models were based on both conventional ML and deep learning methods and assessed prediction end points defined as a threshold for blood oxygen measurements for most studies. Clinical variables used included patient characteristics, vital signs, and laboratory data. Blood oxygen data were the most applied model variables for hypoxia prediction.</p><p>The overall predictive performance of the presented models was moderate or high across the various settings. Deep learning approaches showed similar or better performance than conventional ML approaches within the same studies. Models predicting hypoxia solely based on prior oximetry data tended to outperform models using more variables as inputs, with most of these studies using an LSTM algorithm.</p><p>The demonstrated trade-off between sensitivity and specificity of model performance highlights that it may be difficult to achieve both at the same time, especially when predicting medical events. This is a major caveat that holds true for a broad variety of diagnostic tests in medicine, such as D-dimers in investigating venous thromboembolism [<xref ref-type="bibr" rid="ref29">29</xref>]. High specificity but low sensitivity, as demonstrated by 2 of the models, might, for example, result from missing relevant variables or an insufficient number of outcome events due to small sample sizes. An algorithm with high specificity may help to reduce unnecessary interventions, potentially leading to cost savings and minimizing patient inconvenience. However, in practice, an algorithm with that trade-off does not reliably detect patients with hypoxia who require immediate attention and may therefore be more appropriate as a decision support tool rather than a stand-alone diagnostic tool.</p><p>High sensitivity but low specificity on the other hand can, for example, be caused by the inclusion of variables that are highly associated with the presence of hypoxia but are not specific to hypoxia alone, or by the model being too sensitive and thus detecting subtle changes in nonhypoxic cases that are incorrectly classified as hypoxic. Practically, such a model could result in overalerting, disqualifying it for clinical application.</p><p>The informational value of many of the studies presented was limited due to a lack of external validation. In addition, more precise classification performance metrics were often not provided, thus not allowing for a meta-analysis. Unclear ratings were mostly due to missing information, particularly in the analysis segment. Comparability between studies was limited by the high variability of approaches, such as the variety of settings involving different influences on blood oxygen saturation (eg, sedation during surgery).</p></sec><sec id="s4-2"><title>Applicability and Future Opportunities</title><p>The successful prediction of hypoxic events within a time frame of 5 or even 30 minutes into the future demonstrates the ability to provide sufficient lead time for crucial treatment interventions. Hence, these results suggest the potential of developing a helpful prediction tool, applicable in clinical practice, which complements the assessment of nurses and clinicians. Such a tool could be extended by a presentation and visualization of individual factors influencing the predicted outcome of hypoxia, as demonstrated by Lundberg et al [<xref ref-type="bibr" rid="ref20">20</xref>]. The approach to make the model more understandable is useful both for more nuanced therapy strategies and for the general usability and acceptance of an ML tool for the prediction of hypoxia in the clinical setting.</p><p>While models with many features might have higher accuracy and might be able to capture more detailed and complex relationships between the features and the outcome of hypoxia, they also come with a higher complexity for use and are prone to overfitting [<xref ref-type="bibr" rid="ref30">30</xref>]. Given the intended use of a predictive algorithm for making timely decisions that have immediate impact on the health status of patients, complex models with excessive features could impede their implementation in clinical practice. Additionally, utility might be reduced by patients missing 1 or more of these features. Therefore, the prediction results of LSTM models based only on previous SpO<sub>2</sub> values provide a foundation for further development and refinement of models using only a few, readily available, and noninvasive respiratory variables.</p><p>The results of Lam et al [<xref ref-type="bibr" rid="ref19">19</xref>] suggest that multitask learning may contribute to higher predictive performance on related respiratory outcomes. Therefore, an approach for parallel prediction of several relevant intensive care parameters could provide a basis for further exploration. Opportunities for combined prediction include predictive models for the necessity of changes in ventilation, in airway pressure, or for increased risk of ventilation failure [<xref ref-type="bibr" rid="ref31">31</xref>-<xref ref-type="bibr" rid="ref33">33</xref>]. The prediction of hypoxia could also be embedded in a more general early warning score for related outcomes, for which ML mechanisms are already being applied [<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref34">34</xref>-<xref ref-type="bibr" rid="ref36">36</xref>]. In addition, the development of ML prediction models in a clinical context should include consideration of recent advances for the prediction of other unrelated health parameters and outcomes to avoid a complex system of different prediction systems, thus limiting the applicability and acceptability of these efforts. Forthcoming studies in this area should strive to accurately report performance details of their models, as well as to consistently define the end point of the prediction, to allow comparison with other approaches.</p></sec><sec id="s4-3"><title>Limitations</title><p>This review focused on studies predicting hypoxic or hypoxemic events and therefore did not include studies predicting related outcomes (eg, blood oxygen saturation) without stating that aim of prediction. The comparability of predictive performance among the included studies was limited due to substantial differences in methodology, variables, and end point definition, precluding a meta-analysis from being conducted. An additional challenge arose from the fact that some studies, while including hypoxia predictions, did so as an auxiliary objective and not as their primary focus. Therefore, we focused on a qualitative summary and on demonstrating the variety of approaches taken. The generalizability of the results presented might be further restricted by the countries of origin being limited to the United States, Europe, and Asia.</p></sec><sec id="s4-4"><title>Conclusion</title><p>Despite the large methodological variance of the studies presented, this review shows promising approaches for the prediction of hypoxia status, a factor that is highly informative for changes to a patient&#x2019;s state of health. Future studies must aim to improve the external validation of the predictive performance and, thus, verify the generalizability of the results to additional data sets. The applicability of validated predictive models for hypoxia risk should be proven by prospective studies in clinical practice.</p></sec></sec></body><back><ack><p>This work was supported by the German Ministry of Education and Research (BMBF), Berlin (#01ZZ2005). The open access publication of this article was supported by the Open Access Fund of the Medical Faculty of the University of Augsburg.</p></ack><fn-group><fn fn-type="con"><p>LCH, BPG, and LP initiated the project. LP and BPG conducted the search. LP, BPG, MK, SS, SZ, MS, SOR, CMW, SG, and JS performed the screening and review. LP and MS conducted the data extraction. LP carried out the synthesis and narrative summary with MS reviewing the process. LP, MK, MS, and LCH substantially contributed to the final manuscript. MK, BPG, JS, MS, and LCH provided constructive comments and discussion on the project. All authors carefully read and commented on the manuscript.</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">AI</term><def><p>artificial intelligence</p></def></def-item><def-item><term id="abb2">AIMS</term><def><p>anesthesia information management system</p></def></def-item><def-item><term id="abb3">AUROC</term><def><p>area under the receiver operating characteristics</p></def></def-item><def-item><term id="abb4">ICU</term><def><p>intensive care unit</p></def></def-item><def-item><term id="abb5">LSTM</term><def><p>long short-term memory</p></def></def-item><def-item><term id="abb6">ML</term><def><p>machine learning</p></def></def-item><def-item><term id="abb7">NPV</term><def><p>negative predictive value</p></def></def-item><def-item><term id="abb8">OR</term><def><p>operating room</p></def></def-item><def-item><term id="abb9">PaO<sub>2</sub></term><def><p>partial pressure of oxygen</p></def></def-item><def-item><term id="abb10">PPV</term><def><p>positive predictive value</p></def></def-item><def-item><term id="abb11">PRISMA</term><def><p>Preferred Reporting Items for Systematic Reviews and Meta-Analyses</p></def></def-item><def-item><term id="abb12">PROBAST</term><def><p>Prediction Model Risk of Bias Assessment Tool</p></def></def-item><def-item><term id="abb13">PROSPERO</term><def><p>International Prospective Register of Systematic Reviews</p></def></def-item><def-item><term id="abb14">SpO<sub>2</sub></term><def><p>peripheral oxygen saturation</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Bhutta</surname><given-names>BS</given-names></name><name name-style="western"><surname>Alghoula</surname><given-names>F</given-names></name><name name-style="western"><surname>Berim</surname><given-names>I</given-names></name></person-group><article-title>Hypoxia</article-title><source>StatPearls</source><year>2023</year><publisher-name>StatPearls Publishing</publisher-name><pub-id pub-id-type="medline">29493941</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Pittman</surname><given-names>RN</given-names></name></person-group><article-title>Regulation of tissue oxygenation</article-title><source>Colloquium Series on Integrated Systems Physiology</source><year>2011</year><volume>3</volume><issue>3</issue><fpage>1</fpage><lpage>100</lpage><pub-id pub-id-type="doi">10.4199/C00029ED1V01Y201103ISP017</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="web"><person-group person-group-type="author"><name name-style="western"><surname>Sood</surname><given-names>S</given-names></name><name name-style="western"><surname>Manaker</surname><given-names>S</given-names></name><name name-style="western"><surname>Finlay</surname><given-names>G</given-names></name></person-group><article-title>Evaluation and management of the nonventilated, hospitalized adult patient with acute hypoxemia</article-title><source>UpToDate</source><year>2022</year><month>09</month><day>8</day><access-date>2023-02-22</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.uptodate.com/contents/evaluation-and-management-of-the-nonventilated-hospitalized-adult-patient-with-acute-hypoxemia">www.uptodate.com/contents/evaluation-and-management-of-the-nonventilated-hospitalized-adult-patient-with-acute-hypoxemia</ext-link></comment></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Aronson</surname><given-names>LA</given-names></name></person-group><person-group person-group-type="editor"><name name-style="western"><surname>Atlee</surname><given-names>JL</given-names></name></person-group><article-title>Hypoxemia</article-title><source>Complications in Anesthesia</source><year>2007</year><edition>2</edition><publisher-name>Saunders</publisher-name><fpage>637</fpage><lpage>640</lpage></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><collab>SRLF Trial Group</collab></person-group><article-title>Hypoxemia in the ICU: prevalence, treatment, and outcome</article-title><source>Ann Intensive Care</source><year>2018</year><month>08</month><day>13</day><volume>8</volume><issue>1</issue><fpage>82</fpage><pub-id pub-id-type="doi">10.1186/s13613-018-0424-4</pub-id><pub-id pub-id-type="medline">30105416</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Akazawa</surname><given-names>M</given-names></name><name name-style="western"><surname>Hashimoto</surname><given-names>K</given-names></name></person-group><article-title>Artificial intelligence in gynecologic cancers: current status and future challenges - a systematic review</article-title><source>Artif Intell Med</source><year>2021</year><month>10</month><volume>120</volume><fpage>102164</fpage><pub-id pub-id-type="doi">10.1016/j.artmed.2021.102164</pub-id><pub-id pub-id-type="medline">34629152</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kuntz</surname><given-names>S</given-names></name><name name-style="western"><surname>Krieghoff-Henning</surname><given-names>E</given-names></name><name name-style="western"><surname>Kather</surname><given-names>JN</given-names></name><etal/></person-group><article-title>Gastrointestinal cancer classification and prognostication from histology using deep learning: systematic review</article-title><source>Eur J Cancer</source><year>2021</year><month>09</month><volume>155</volume><fpage>200</fpage><lpage>215</lpage><pub-id pub-id-type="doi">10.1016/j.ejca.2021.07.012</pub-id><pub-id pub-id-type="medline">34391053</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hamet</surname><given-names>P</given-names></name><name name-style="western"><surname>Tremblay</surname><given-names>J</given-names></name></person-group><article-title>Artificial intelligence in medicine</article-title><source>Metabolism</source><year>2017</year><month>04</month><volume>69S</volume><fpage>S36</fpage><lpage>S40</lpage><pub-id pub-id-type="doi">10.1016/j.metabol.2017.01.011</pub-id><pub-id pub-id-type="medline">28126242</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Nadarajah</surname><given-names>R</given-names></name><name name-style="western"><surname>Wu</surname><given-names>J</given-names></name><name name-style="western"><surname>Frangi</surname><given-names>AF</given-names></name><name name-style="western"><surname>Hogg</surname><given-names>D</given-names></name><name name-style="western"><surname>Cowan</surname><given-names>C</given-names></name><name name-style="western"><surname>Gale</surname><given-names>C</given-names></name></person-group><article-title>Predicting patient-level new-onset atrial fibrillation from population-based nationwide electronic health records: protocol of FIND-AF for developing a precision medicine prediction model using artificial intelligence</article-title><source>BMJ Open</source><year>2021</year><month>11</month><day>2</day><volume>11</volume><issue>11</issue><fpage>e052887</fpage><pub-id pub-id-type="doi">10.1136/bmjopen-2021-052887</pub-id><pub-id pub-id-type="medline">34728455</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gunasekeran</surname><given-names>DV</given-names></name><name name-style="western"><surname>Ting</surname><given-names>DSW</given-names></name><name name-style="western"><surname>Tan</surname><given-names>GSW</given-names></name><name name-style="western"><surname>Wong</surname><given-names>TY</given-names></name></person-group><article-title>Artificial intelligence for diabetic retinopathy screening, prediction and management</article-title><source>Curr Opin Ophthalmol</source><year>2020</year><month>09</month><volume>31</volume><issue>5</issue><fpage>357</fpage><lpage>365</lpage><pub-id pub-id-type="doi">10.1097/ICU.0000000000000693</pub-id><pub-id pub-id-type="medline">32740069</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Page</surname><given-names>MJ</given-names></name><name name-style="western"><surname>McKenzie</surname><given-names>JE</given-names></name><name name-style="western"><surname>Bossuyt</surname><given-names>PM</given-names></name><etal/></person-group><article-title>The PRISMA 2020 statement: an updated guideline for reporting systematic reviews</article-title><source>BMJ</source><year>2021</year><month>03</month><day>29</day><volume>372</volume><fpage>n71</fpage><pub-id pub-id-type="doi">10.1136/bmj.n71</pub-id><pub-id pub-id-type="medline">33782057</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="web"><person-group person-group-type="author"><name name-style="western"><surname>Harzing</surname><given-names>AW</given-names></name></person-group><article-title>Publish or Perish</article-title><source>Harzing.com</source><year>2016</year><month>02</month><day>6</day><access-date>2022-11-08</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://harzing.com/resources/publish-or-perish">https://harzing.com/resources/publish-or-perish</ext-link></comment></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="web"><article-title>Covidence - better systematic review management</article-title><source>Covidence</source><access-date>2022-11-10</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.covidence.org">www.covidence.org</ext-link></comment></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Moons</surname><given-names>KGM</given-names></name><name name-style="western"><surname>Wolff</surname><given-names>RF</given-names></name><name name-style="western"><surname>Riley</surname><given-names>RD</given-names></name><etal/></person-group><article-title>PROBAST: a tool to assess risk of bias and applicability of prediction model studies: explanation and elaboration</article-title><source>Ann Intern Med</source><year>2019</year><month>01</month><day>1</day><volume>170</volume><issue>1</issue><fpage>W1</fpage><lpage>W33</lpage><pub-id pub-id-type="doi">10.7326/M18-1377</pub-id><pub-id pub-id-type="medline">30596876</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Annapragada</surname><given-names>AV</given-names></name><name name-style="western"><surname>Greenstein</surname><given-names>JL</given-names></name><name name-style="western"><surname>Bose</surname><given-names>SN</given-names></name><name name-style="western"><surname>Winters</surname><given-names>BD</given-names></name><name name-style="western"><surname>Sarma</surname><given-names>SV</given-names></name><name name-style="western"><surname>Winslow</surname><given-names>RL</given-names></name></person-group><article-title>SWIFT: a deep learning approach to prediction of hypoxemic events in critically-ill patients using SpO2 waveform prediction</article-title><source>PLoS Comput Biol</source><year>2021</year><month>12</month><day>21</day><volume>17</volume><issue>12</issue><fpage>e1009712</fpage><pub-id pub-id-type="doi">10.1371/journal.pcbi.1009712</pub-id><pub-id pub-id-type="medline">34932550</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chen</surname><given-names>H</given-names></name><name name-style="western"><surname>Lundberg</surname><given-names>SM</given-names></name><name name-style="western"><surname>Erion</surname><given-names>G</given-names></name><name name-style="western"><surname>Kim</surname><given-names>JH</given-names></name><name name-style="western"><surname>Lee</surname><given-names>SI</given-names></name></person-group><article-title>Forecasting adverse surgical events using self-supervised transfer learning for physiological signals</article-title><source>NPJ Digit Med</source><year>2021</year><month>12</month><day>8</day><volume>4</volume><issue>1</issue><fpage>167</fpage><pub-id pub-id-type="doi">10.1038/s41746-021-00536-y</pub-id><pub-id pub-id-type="medline">34880410</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>ElMoaqet</surname><given-names>H</given-names></name><name name-style="western"><surname>Tilbury</surname><given-names>DM</given-names></name><name name-style="western"><surname>Ramachandran</surname><given-names>SK</given-names></name></person-group><article-title>Evaluating predictions of critical oxygen desaturation events</article-title><source>Physiol Meas</source><year>2014</year><month>04</month><volume>35</volume><issue>4</issue><fpage>639</fpage><lpage>655</lpage><pub-id pub-id-type="doi">10.1088/0967-3334/35/4/639</pub-id><pub-id pub-id-type="medline">24621948</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Erion</surname><given-names>G</given-names></name><name name-style="western"><surname>Chen</surname><given-names>H</given-names></name><name name-style="western"><surname>Lundberg</surname><given-names>SM</given-names></name><name name-style="western"><surname>Lee</surname><given-names>SI</given-names></name></person-group><article-title>Anesthesiologist-level forecasting of hypoxemia with only SpO2 data using deep learning</article-title><source>arXiv</source><comment>Preprint posted online on Dec 2, 2017</comment><pub-id pub-id-type="doi">10.48550/arXiv.1712.00563</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lam</surname><given-names>C</given-names></name><name name-style="western"><surname>Thapa</surname><given-names>R</given-names></name><name name-style="western"><surname>Maharjan</surname><given-names>J</given-names></name><etal/></person-group><article-title>Multitask learning with recurrent neural networks for acute respiratory distress syndrome prediction using only electronic health record data: model development and validation study</article-title><source>JMIR Med Inform</source><year>2022</year><month>06</month><day>15</day><volume>10</volume><issue>6</issue><fpage>e36202</fpage><pub-id pub-id-type="doi">10.2196/36202</pub-id><pub-id pub-id-type="medline">35704370</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lundberg</surname><given-names>SM</given-names></name><name name-style="western"><surname>Nair</surname><given-names>B</given-names></name><name name-style="western"><surname>Vavilala</surname><given-names>MS</given-names></name><etal/></person-group><article-title>Explainable machine-learning predictions for the prevention of hypoxaemia during surgery</article-title><source>Nat Biomed Eng</source><year>2018</year><month>10</month><volume>2</volume><issue>10</issue><fpage>749</fpage><lpage>760</lpage><pub-id pub-id-type="doi">10.1038/s41551-018-0304-0</pub-id><pub-id pub-id-type="medline">31001455</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ren</surname><given-names>S</given-names></name><name name-style="western"><surname>Zupetic</surname><given-names>JA</given-names></name><name name-style="western"><surname>Tabary</surname><given-names>M</given-names></name><etal/></person-group><article-title>Machine learning based algorithms to impute PaO2 from SpO2 values and development of an online calculator</article-title><source>Sci Rep</source><year>2022</year><month>05</month><day>17</day><volume>12</volume><issue>1</issue><fpage>8235</fpage><pub-id pub-id-type="doi">10.1038/s41598-022-12419-7</pub-id><pub-id pub-id-type="medline">35581469</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Xia</surname><given-names>M</given-names></name><name name-style="western"><surname>Jin</surname><given-names>C</given-names></name><name name-style="western"><surname>Cao</surname><given-names>S</given-names></name><etal/></person-group><article-title>Development and validation of a machine-learning model for prediction of hypoxemia after extubation in intensive care units</article-title><source>Ann Transl Med</source><year>2022</year><month>05</month><volume>10</volume><issue>10</issue><fpage>577</fpage><pub-id pub-id-type="doi">10.21037/atm-22-2118</pub-id><pub-id pub-id-type="medline">35722375</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Geng</surname><given-names>W</given-names></name><name name-style="western"><surname>Jia</surname><given-names>D</given-names></name><name name-style="western"><surname>Wang</surname><given-names>Y</given-names></name><etal/></person-group><article-title>A prediction model for hypoxemia during routine sedation for gastrointestinal endoscopy</article-title><source>Clinics (Sao Paulo)</source><year>2018</year><month>11</month><day>14</day><volume>73</volume><fpage>e513</fpage><pub-id pub-id-type="doi">10.6061/clinics/2018/e513</pub-id><pub-id pub-id-type="medline">30462756</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Geng</surname><given-names>W</given-names></name><name name-style="western"><surname>Tang</surname><given-names>H</given-names></name><name name-style="western"><surname>Sharma</surname><given-names>A</given-names></name><name name-style="western"><surname>Zhao</surname><given-names>Y</given-names></name><name name-style="western"><surname>Yan</surname><given-names>Y</given-names></name><name name-style="western"><surname>Hong</surname><given-names>W</given-names></name></person-group><article-title>An artificial neural network model for prediction of hypoxemia during sedation for gastrointestinal endoscopy</article-title><source>J Int Med Res</source><year>2019</year><month>05</month><volume>47</volume><issue>5</issue><fpage>2097</fpage><lpage>2103</lpage><pub-id pub-id-type="doi">10.1177/0300060519834459</pub-id><pub-id pub-id-type="medline">30913936</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sippl</surname><given-names>P</given-names></name><name name-style="western"><surname>Ganslandt</surname><given-names>T</given-names></name><name name-style="western"><surname>Prokosch</surname><given-names>HU</given-names></name><name name-style="western"><surname>Muenster</surname><given-names>T</given-names></name><name name-style="western"><surname>Toddenroth</surname><given-names>D</given-names></name></person-group><article-title>Machine learning models of post-intubation hypoxia during general anesthesia</article-title><source>Stud Health Technol Inform</source><year>2017</year><volume>243</volume><fpage>212</fpage><lpage>216</lpage><pub-id pub-id-type="doi">10.3233/978-1-61499-808-2-212</pub-id><pub-id pub-id-type="medline">28883203</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Statsenko</surname><given-names>Y</given-names></name><name name-style="western"><surname>Habuza</surname><given-names>T</given-names></name><name name-style="western"><surname>Talako</surname><given-names>T</given-names></name><etal/></person-group><article-title>Deep learning-based automatic assessment of lung impairment in COVID-19 pneumonia: predicting markers of hypoxia with computer vision</article-title><source>Front Med (Lausanne)</source><year>2022</year><month>07</month><day>9</day><volume>9</volume><fpage>882190</fpage><pub-id pub-id-type="doi">10.3389/fmed.2022.882190</pub-id><pub-id pub-id-type="medline">35957860</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Simpao</surname><given-names>AF</given-names></name><name name-style="western"><surname>Rehman</surname><given-names>MA</given-names></name></person-group><article-title>Anesthesia information management systems</article-title><source>Anesth Analg</source><year>2018</year><month>07</month><volume>127</volume><issue>1</issue><fpage>90</fpage><lpage>94</lpage><pub-id pub-id-type="doi">10.1213/ANE.0000000000002545</pub-id><pub-id pub-id-type="medline">29049075</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shah</surname><given-names>NJ</given-names></name><name name-style="western"><surname>Tremper</surname><given-names>KK</given-names></name><name name-style="western"><surname>Kheterpal</surname><given-names>S</given-names></name></person-group><article-title>Anatomy of an anesthesia information management system</article-title><source>Anesthesiol Clin</source><year>2011</year><month>09</month><volume>29</volume><issue>3</issue><fpage>355</fpage><lpage>365</lpage><pub-id pub-id-type="doi">10.1016/j.anclin.2011.05.013</pub-id><pub-id pub-id-type="medline">21871398</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Weitz</surname><given-names>JI</given-names></name><name name-style="western"><surname>Fredenburgh</surname><given-names>JC</given-names></name><name name-style="western"><surname>Eikelboom</surname><given-names>JW</given-names></name></person-group><article-title>A test in context: D-dimer</article-title><source>J Am Coll Cardiol</source><year>2017</year><month>11</month><day>7</day><volume>70</volume><issue>19</issue><fpage>2411</fpage><lpage>2420</lpage><pub-id pub-id-type="doi">10.1016/j.jacc.2017.09.024</pub-id><pub-id pub-id-type="medline">29096812</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chen</surname><given-names>RC</given-names></name><name name-style="western"><surname>Dewi</surname><given-names>C</given-names></name><name name-style="western"><surname>Huang</surname><given-names>SW</given-names></name><name name-style="western"><surname>Caraka</surname><given-names>RE</given-names></name></person-group><article-title>Selecting critical features for data classification based on machine learning methods</article-title><source>J Big Data</source><year>2020</year><month>07</month><day>23</day><volume>7</volume><fpage>52</fpage><pub-id pub-id-type="doi">10.1186/s40537-020-00327-4</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhao</surname><given-names>QY</given-names></name><name name-style="western"><surname>Wang</surname><given-names>H</given-names></name><name name-style="western"><surname>Luo</surname><given-names>JC</given-names></name><etal/></person-group><article-title>Development and validation of a machine-learning model for prediction of extubation failure in intensive care units</article-title><source>Front Med (Lausanne)</source><year>2021</year><month>05</month><day>17</day><volume>8</volume><fpage>676343</fpage><pub-id pub-id-type="doi">10.3389/fmed.2021.676343</pub-id><pub-id pub-id-type="medline">34079812</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shashikumar</surname><given-names>SP</given-names></name><name name-style="western"><surname>Wardi</surname><given-names>G</given-names></name><name name-style="western"><surname>Paul</surname><given-names>P</given-names></name><etal/></person-group><article-title>Development and prospective validation of a deep learning algorithm for predicting need for mechanical ventilation</article-title><source>Chest</source><year>2021</year><month>06</month><volume>159</volume><issue>6</issue><fpage>2264</fpage><lpage>2273</lpage><pub-id pub-id-type="doi">10.1016/j.chest.2020.12.009</pub-id><pub-id pub-id-type="medline">33345948</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Igarashi</surname><given-names>Y</given-names></name><name name-style="western"><surname>Ogawa</surname><given-names>K</given-names></name><name name-style="western"><surname>Nishimura</surname><given-names>K</given-names></name><name name-style="western"><surname>Osawa</surname><given-names>S</given-names></name><name name-style="western"><surname>Ohwada</surname><given-names>H</given-names></name><name name-style="western"><surname>Yokobori</surname><given-names>S</given-names></name></person-group><article-title>Machine learning for predicting successful extubation in patients receiving mechanical ventilation</article-title><source>Front Med (Lausanne)</source><year>2022</year><month>08</month><day>11</day><volume>9</volume><fpage>961252</fpage><pub-id pub-id-type="doi">10.3389/fmed.2022.961252</pub-id><pub-id pub-id-type="medline">36035403</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Fang</surname><given-names>AHS</given-names></name><name name-style="western"><surname>Lim</surname><given-names>WT</given-names></name><name name-style="western"><surname>Balakrishnan</surname><given-names>T</given-names></name></person-group><article-title>Early warning score validation methodologies and performance metrics: a systematic review</article-title><source>BMC Med Inform Decis Mak</source><year>2020</year><month>06</month><day>18</day><volume>20</volume><issue>1</issue><fpage>111</fpage><pub-id pub-id-type="doi">10.1186/s12911-020-01144-8</pub-id><pub-id pub-id-type="medline">32552702</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Romero-Brufau</surname><given-names>S</given-names></name><name name-style="western"><surname>Whitford</surname><given-names>D</given-names></name><name name-style="western"><surname>Johnson</surname><given-names>MG</given-names></name><etal/></person-group><article-title>Using machine learning to improve the accuracy of patient deterioration predictions: Mayo Clinic Early Warning Score (MC-EWS)</article-title><source>J Am Med Inform Assoc</source><year>2021</year><month>06</month><day>12</day><volume>28</volume><issue>6</issue><fpage>1207</fpage><lpage>1215</lpage><pub-id pub-id-type="doi">10.1093/jamia/ocaa347</pub-id><pub-id pub-id-type="medline">33638343</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Winslow</surname><given-names>CJ</given-names></name><name name-style="western"><surname>Edelson</surname><given-names>DP</given-names></name><name name-style="western"><surname>Churpek</surname><given-names>MM</given-names></name><etal/></person-group><article-title>The impact of a machine learning early warning score on hospital mortality: a multicenter clinical intervention trial</article-title><source>Crit Care Med</source><year>2022</year><month>09</month><day>1</day><volume>50</volume><issue>9</issue><fpage>1339</fpage><lpage>1347</lpage><pub-id pub-id-type="doi">10.1097/CCM.0000000000005492</pub-id><pub-id pub-id-type="medline">35452010</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Search strategy, data sources, and clinical variables.</p><media xlink:href="medinform_v12i1e50642_app1.docx" xlink:title="DOCX File, 34 KB"/></supplementary-material><supplementary-material id="app2"><label>Checklist 1</label><p>PRISMA (Preferred Reporting Items for Systematic Reviews and Meta-Analyses) checklist.</p><media xlink:href="medinform_v12i1e50642_app2.docx" xlink:title="DOCX File, 36 KB"/></supplementary-material></app-group></back></article>