<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id><journal-id journal-id-type="publisher-id">medinform</journal-id><journal-id journal-id-type="index">7</journal-id><journal-title>JMIR Medical Informatics</journal-title><abbrev-journal-title>JMIR Med Inform</abbrev-journal-title><issn pub-type="epub">2291-9694</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v14i1e82762</article-id><article-id pub-id-type="doi">10.2196/82762</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Online Sepsis Prediction Using Vital Signs and Multiscale Temporal-Aware Contrastive Learning: Model Development and Validation Study</article-title></title-group><contrib-group><contrib contrib-type="author"><name name-style="western"><surname>Yang</surname><given-names>Xiaoqiong</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Lv</surname><given-names>Zezhong</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Lv</surname><given-names>Hanming</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Zhou</surname><given-names>Qianyi</given-names></name><degrees>MS</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Jiang</surname><given-names>Wei</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Meng</surname><given-names>Ziqun</given-names></name><degrees>MS</degrees><xref ref-type="aff" rid="aff4">4</xref></contrib><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Yang</surname><given-names>Wenjie</given-names></name><degrees>MS</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib></contrib-group><aff id="aff1"><institution>Department of Infectious Diseases, Tianjin First Central Hospital</institution><addr-line>Baoshan West Road, 2nd</addr-line><addr-line>Tianjin</addr-line><country>China</country></aff><aff id="aff2"><institution>School of Control Science and Engineering, Tiangong University</institution><addr-line>Tianjin</addr-line><country>China</country></aff><aff id="aff3"><institution>School of Textile Science and Engineering, Tiangong University</institution><addr-line>Tianjin</addr-line><country>China</country></aff><aff id="aff4"><institution>Clinical Medical College, Tianjin Medical University</institution><addr-line>Tianjin</addr-line><country>China</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Benis</surname><given-names>Arriel</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Wu</surname><given-names>Di</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Zhu</surname><given-names>Tingting</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Wenjie Yang, MS, Department of Infectious Diseases, Tianjin First Central Hospital, Baoshan West Road, 2nd, Tianjin, 300190, China, (86) 13602155376; <email>yangm8006@sina.com</email></corresp></author-notes><pub-date pub-type="collection"><year>2026</year></pub-date><pub-date pub-type="epub"><day>19</day><month>6</month><year>2026</year></pub-date><volume>14</volume><elocation-id>e82762</elocation-id><history><date date-type="received"><day>21</day><month>08</month><year>2025</year></date><date date-type="rev-recd"><day>22</day><month>04</month><year>2026</year></date><date date-type="accepted"><day>16</day><month>05</month><year>2026</year></date></history><copyright-statement>&#x00A9; Xiaoqiong Yang, Zezhong Lv, Hanming Lv, Qianyi Zhou, Wei Jiang, Ziqun Meng, Wenjie Yang. Originally published in JMIR Medical Informatics (<ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org">https://medinform.jmir.org</ext-link>), 19.6.2026. </copyright-statement><copyright-year>2026</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org/">https://medinform.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://medinform.jmir.org/2026/1/e82762"/><abstract><sec><title>Background</title><p>Real-time prediction of sepsis is a critical yet highly challenging task. Existing studies face 2 major limitations. First, they often rely on laboratory test results that are not readily available in real time, making timely diagnosis difficult. Second, the patient&#x2019;s condition evolves as a typical time series, but current methods often adopt coarse modeling strategies, with model architectures that are inefficient to train and deploy effectively.</p></sec><sec><title>Objective</title><p>This study aimed to develop a prediction model for online sepsis detection using only easily obtainable vital signs, such as heart rate and temperature, with variable-length input sequences while maintaining high predictive performance through the multiscale temporal representation learning.</p></sec><sec sec-type="methods"><title>Methods</title><p>We propose a deep learning model, Multi-Scale Temporal-aware Contrastive Learning (MSTCL), for efficient sepsis prediction based on the intensive care unit data derived from publicly available databases. We propose a multiscale temporal model to capture both short- and long-term dependencies in variable-length physiological time series. To enhance the robustness of our model, we used contrastive learning techniques that differentiate between positive and negative sepsis progression trajectories. Input features were limited to 6 vital signs, without reliance on laboratory tests or clinical notes.</p></sec><sec sec-type="results"><title>Results</title><p>The model was evaluated on more than 400 patients with and without sepsis. It achieved an area under the receiver operating characteristic curve of 88.34%, a sensitivity of 89.29%, and a specificity of 73% for predicting sepsis onset based on variable-length vital-sign histories. The normalized mean absolute error for the predicted sepsis onset was 0.11%.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>Our proposed model&#x2019;s low complexity and rapid inference make it suitable for deployment in real-time monitoring systems and low-resource environments. The ability to learn from variable-length historical data enhances the clinical applicability of our model. Furthermore, the methodology of temporal-aware contrastive learning offers a robust and efficient solution for online sepsis detection in diverse clinical settings.</p></sec></abstract><kwd-group><kwd>sepsis prediction</kwd><kwd>deep learning</kwd><kwd>vital signs monitoring</kwd><kwd>temporal modeling</kwd><kwd>contrastive learning</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Sepsis is a life-threatening clinical syndrome caused by a dysregulated host response to infection, leading to acute organ dysfunction [<xref ref-type="bibr" rid="ref1">1</xref>]. It is a major global health concern, accounting for an estimated 270,000 deaths annually, nearly 30% of all hospital deaths [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref3">3</xref>]. Timely identification and early intervention are critical for improving patient outcomes, as delays in treatment significantly increase mortality and morbidity [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref5">5</xref>]. Accordingly, the development of accurate and timely predictive models for sepsis onset remains a high-priority task in clinical informatics, with the potential to substantially reduce adverse outcomes through early clinical alerts and proactive management.</p><p>Traditional approaches to sepsis prediction, such as the Sequential Organ Failure Assessment and quick Sequential Organ Failure Assessment scores [<xref ref-type="bibr" rid="ref6">6</xref>], are widely used in clinical practice. These scoring systems rely on predefined thresholds and combinations of physiological and laboratory measurements to assess patient risk. However, their performance is limited by relatively low sensitivity, especially in the early stages of sepsis [<xref ref-type="bibr" rid="ref7">7</xref>]. Moreover, their reliance on laboratory-based values restricts their applicability in settings where such information is delayed or unavailable [<xref ref-type="bibr" rid="ref8">8</xref>]. As a result, there has been growing interest in leveraging machine learning and, more recently, deep learning approaches to improve predictive performance in sepsis detection.</p><p>Deep learning methods have shown promising results in sepsis prediction tasks [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref9">9</xref>], particularly models based on recurrent neural networks (eg, long short-term memory [LSTM] networks) and convolutional neural networks (CNNs). These models can capture temporal patterns and nonlinear dependencies in high-dimensional physiological data. For example, the Smart Sepsis Predictor [<xref ref-type="bibr" rid="ref10">10</xref>], using an LSTM-CNN-fully connected architecture trained on intensive care unit (ICU) data, achieved an area under the receiver operating characteristic curve (AUROC) of up to 0.89 using only demographic and vital sign features, and up to 0.92 when laboratory data were included. Another large-scale study [<xref ref-type="bibr" rid="ref11">11</xref>] used only 5 vital signs and patient age to predict sepsis mortality within 6 to 48 hours, reporting areas under the curve (AUCs) of 0.84 for CNN and 0.761 for LSTM for a 6-hour lead time. Though promising, many of these approaches suffer from practical limitations: they often require a large number of input features, including laboratory results, demographics, and textual data, which limits their deployment in real-time or low-resource settings. Additionally, many models assume fixed-length input sequences, which is incongruent with the inherently irregular and variable-length nature of clinical time-series data. These constraints hinder the usability and generalizability of existing methods across diverse clinical environments.</p><p>Recently, transformer-based models [<xref ref-type="bibr" rid="ref12">12</xref>] have emerged as powerful alternatives for sequence modeling tasks. Originally designed for natural language processing, transformers excel in capturing temporal dependencies through self-attention mechanisms, without relying on recurrent structures. The ability to model sequential data makes transformers particularly well-suited to clinical applications, where patient data may evolve at varying rhythms and durations. For instance, Tang et al [<xref ref-type="bibr" rid="ref13">13</xref>] proposed CNN-transformer and LSTM-transformer hybrid models for early sepsis prediction, demonstrating nearly 20% improvement over baseline recurrent neural network models for 4- to 12-hour preonset windows. Another recent study by Chang et al [<xref ref-type="bibr" rid="ref14">14</xref>] designed a transformer-based diffusion probabilistic model to forecast vital signs (heart rate, systolic blood pressure, and diastolic blood pressure) in ICU patients, achieving substantial gains in inference speed over baselines using MIMIC-III data [<xref ref-type="bibr" rid="ref15">15</xref>]. However, existing transformer-based approaches often still rely on relatively rich sets of inputs&#x2014;including laboratory measurements and demographic features&#x2014;or presume that sufficient historical data are available.</p><p>In this work, we harnessed the strengths of the transformer architecture to build a lightweight, flexible, and high-performing model for real-time sepsis prediction. Specifically, we proposed Multi-Scale Temporal-aware Contrastive Learning (MSTCL), which models the temporal dependencies in routinely monitored vital signs. Unlike conventional approaches that require a fixed window of input data, our model supports variable-length sequences and enables efficient online inference through an autoregressive encoder-decoder design. This allows real-time prediction of sepsis onset using only a short and dynamically updating history of patient monitoring data, making it suitable for real-time warning systems in intensive care and emergency settings.</p><p>To further enhance the model&#x2019;s robustness and applicability in diverse clinical conditions, we intentionally restricted the input features to 6 easily obtainable and commonly monitored vital signs: oxygen saturation, heart rate, body temperature, systolic blood pressure, diastolic blood pressure, and respiratory rate. While this focus on noninvasive data distinguishes our work from methods relying on exhaustive laboratory results, it introduces a significant technical challenge: the reduction in input features may limit the model&#x2019;s ability to capture the subtle, high-dimensional physiological precursors of sepsis. To bridge this information gap and ensure high predictive performance despite the simplified inputs, we proposed the MSTCL framework.</p><p>Specifically, in this study, we proposed a hybrid contrastive learning objective that distinguishes patient vital sign sequences from 3 perspectives: positive segments, negative segments, and full sequences, with the last serving as transitional intermediaries. By enforcing distinct distances among the representations of these 3 types of sequences, the model achieves more stable perception of complex dependencies within patient data streams.</p><p>In summary, the proposed framework enables multiscale temporal modeling and contrastive representation learning in a lightweight, autoregressive architecture, consuming only 6 vital signs as input. This enables real-time, variable-length sepsis prediction across diverse clinical environments. Our approach demonstrates that accurate online prediction of sepsis is feasible using easily obtainable physiological data while maintaining robust generalization and operational efficiency.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Dataset</title><p>The training and testing data used in this study were sampled from the publicly available PhysioNet Computing in Cardiology 2019 Challenge dataset [<xref ref-type="bibr" rid="ref16">16</xref>]. This dataset includes ICU records from patients in 3 different hospitals, of which data from 2 hospitals are openly accessible. These 2 sources provide a total of 40,336 patient records, each containing hourly time-stamped information on demographics, vital signs, and laboratory values, which is referred to in this paper as the &#x201C;original dataset.&#x201D; However, most of these records are temporally sparse. In many cases, even over dozens of recorded hours, most laboratory values and some vital signs had only a few valid entries. This sparsity highlights the difficulty of obtaining real-time laboratory values in most clinical settings, which in turn motivates our study: to enable real-time sepsis prediction using only easily monitored and frequently available vital signs. To achieve this, we applied the following data filtering procedure. First, we separated the original dataset into records of patients with sepsis (with confirmed sepsis onset) and patients without sepsis (entirely negative throughout the ICU stay). For nonseptic records, we randomly sampled sequences in which the missing rate of vital signs was no more than 50%. For septic records, we first identified the sepsis onset point and then examined a 16-hour window surrounding it. If the missing rate of the 6 selected vital signs within that window was less than 50%, the record was retained in our dataset. This selection was based on the assumption that, to train a real-time predictive model&#x2014;especially when using a limited number of input variables&#x2014;the training data must exhibit reasonably high temporal quality. Only with sufficient continuity and density in the input signals can the model effectively learn and capture the underlying temporal dependencies necessary for accurate sepsis onset prediction. <xref ref-type="table" rid="table1">Table 1</xref> summarizes the overall demographics of the data sampled from the source dataset for training and testing in this study. The number of qualified vital sign sequences from positive and negative patients was 1093 and 2673, respectively, totaling 3766 sequences&#x2014;less than one-tenth of the original dataset size of 40,336. The sex ratio and age distribution of the sampled dataset were generally consistent with those of the original dataset. For both positive and negative patients, the number of samples increased progressively with age. The age distribution of positive patients exhibited a more pronounced long-tail pattern compared with that of negative patients. Due to the temporal sparsity of the original PhysioNet Challenge data, we trained and evaluated the proposed MSTCL framework based on these processed samples, which were split into training and test sets using a 4:1 ratio.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Demographic characteristics of patients with sepsis and patients without sepsis.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Demographic variables</td><td align="left" valign="bottom">Septic (n=1093), n (%)</td><td align="left" valign="bottom">Nonseptic (n=2673), n (%)</td><td align="left" valign="bottom">Overall (n=3766), n (%)</td><td align="left" valign="bottom">Original data (n=40,336) [<xref ref-type="bibr" rid="ref16">16</xref>], n (%)</td></tr></thead><tbody><tr><td align="left" valign="top">Male</td><td align="left" valign="top">656 (60)</td><td align="left" valign="top">1823 (68.2)</td><td align="left" valign="top">2478 (65.8)</td><td align="left" valign="top">22,568 (56)</td></tr><tr><td align="left" valign="top" colspan="5">Age group (years)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>0&#x2010;24</td><td align="left" valign="top">29 (2.7)</td><td align="left" valign="top">19 (0.7)</td><td align="left" valign="top">48 (1.3)</td><td align="left" valign="top">972 (2.4)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>25&#x2010;39</td><td align="left" valign="top">76 (7)</td><td align="left" valign="top">87 (3.3)</td><td align="left" valign="top">163 (4.3)</td><td align="left" valign="top">3251 (8.1)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>40&#x2010;54</td><td align="left" valign="top">204 (18.7)</td><td align="left" valign="top">420 (15.7)</td><td align="left" valign="top">625 (16.6)</td><td align="left" valign="top">8108 (20.1)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>55&#x2010;64</td><td align="left" valign="top">232 (21.2)</td><td align="left" valign="top">671 (25.1)</td><td align="left" valign="top">904 (24)</td><td align="left" valign="top">8633 (21.4)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x2265;</named-content>65</td><td align="left" valign="top">552 (50.5)</td><td align="left" valign="top">1476 (55.2)</td><td align="left" valign="top">2026 (53.8)</td><td align="left" valign="top">19,372 (48)</td></tr></tbody></table></table-wrap></sec><sec id="s2-2"><title>Model Architecture</title><p><xref ref-type="fig" rid="figure1">Figure 1</xref> presents an overview of our proposed MSTCL model. We focus on real-time sepsis prediction using only 6 easily obtainable vital signs: oxygen saturation, heart rate, body temperature, systolic blood pressure, diastolic blood pressure, and respiratory rate. As illustrated in <xref ref-type="fig" rid="figure1">Figure 1A</xref>, we collected high-quality, continuous sequences from the original dataset to construct our training and testing datasets. The goal of this study was to design a neural network model capable of predicting the current likelihood of sepsis onset in real time, based on variable-length sequences of these vital signs. To effectively model the relationship between this limited set of vital signs and sepsis onset, we proposed a multiscale temporal dependency modeling architecture, MSTCL (<inline-formula><mml:math id="ieqn1"><mml:msub><mml:mrow><mml:mi>T</mml:mi></mml:mrow><mml:mrow><mml:mi>M</mml:mi><mml:mi>S</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula>), as presented in <xref ref-type="fig" rid="figure1">Figure 1C</xref>, which is equipped with the contrastive learning based on the vital sign sequence representations shown in <xref ref-type="fig" rid="figure1">Figure 1B</xref>.</p><p>Specifically, during training, a given vital sign sequence <inline-formula><mml:math id="ieqn2"><mml:mstyle><mml:mrow><mml:mstyle displaystyle="false"><mml:mi>S</mml:mi><mml:mo>&#x2208;</mml:mo><mml:msup><mml:mrow><mml:mrow><mml:mi mathvariant="double-struck">R</mml:mi></mml:mrow></mml:mrow><mml:mrow><mml:mi>t</mml:mi><mml:mo>&#x00D7;</mml:mo><mml:mn>6</mml:mn></mml:mrow></mml:msup></mml:mstyle></mml:mrow></mml:mstyle></mml:math></inline-formula> is first embedded into <inline-formula><mml:math id="ieqn3"><mml:mstyle><mml:mrow><mml:mstyle displaystyle="false"><mml:mi>X</mml:mi><mml:mo>&#x2208;</mml:mo><mml:msup><mml:mrow><mml:mi mathvariant="double-struck">R</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi><mml:mo>&#x00D7;</mml:mo><mml:mi>d</mml:mi></mml:mrow></mml:msup></mml:mstyle></mml:mrow></mml:mstyle></mml:math></inline-formula> via a linear layer, <inline-formula><mml:math id="ieqn4"><mml:mi>X</mml:mi><mml:mo>=</mml:mo><mml:msub><mml:mrow><mml:mi>f</mml:mi></mml:mrow><mml:mrow><mml:mi>h</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:mi>S</mml:mi></mml:mrow><mml:mo>)</mml:mo></mml:mrow></mml:math></inline-formula>, where <inline-formula><mml:math id="ieqn5"><mml:mi>t</mml:mi></mml:math></inline-formula> is the temporal length of the 6D vital signs and <italic>d</italic> is the hidden dimension of the model. Then, the projections for query, key, and value are computed to obtain <inline-formula><mml:math id="ieqn6"><mml:mstyle><mml:mrow><mml:mstyle displaystyle="false"><mml:mi>Q</mml:mi><mml:mo>,</mml:mo><mml:mtext>&#x00A0;</mml:mtext><mml:mi>K</mml:mi><mml:mo>,</mml:mo><mml:mtext>&#x00A0;</mml:mtext><mml:mi>V</mml:mi><mml:mo>&#x2208;</mml:mo><mml:msup><mml:mrow><mml:mi mathvariant="double-struck">R</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi><mml:mo>&#x00D7;</mml:mo><mml:mi>d</mml:mi></mml:mrow></mml:msup></mml:mstyle></mml:mrow></mml:mstyle></mml:math></inline-formula>, respectively. The attention map <inline-formula><mml:math id="ieqn7"><mml:mstyle><mml:mrow><mml:mstyle displaystyle="false"><mml:msub><mml:mi>M</mml:mi><mml:mrow><mml:mi>A</mml:mi></mml:mrow></mml:msub><mml:mo>&#x2208;</mml:mo><mml:msup><mml:mrow><mml:mi mathvariant="double-struck">R</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi><mml:mo>&#x00D7;</mml:mo><mml:mi>t</mml:mi></mml:mrow></mml:msup></mml:mstyle></mml:mrow></mml:mstyle></mml:math></inline-formula> is computed as the matrix product between <inline-formula><mml:math id="ieqn8"><mml:mi>Q</mml:mi></mml:math></inline-formula> and <inline-formula><mml:math id="ieqn9"><mml:mi>K</mml:mi></mml:math></inline-formula>.</p><p>To simulate sepsis prediction based solely on the historical vital signs during test time, a causal mask <inline-formula><mml:math id="ieqn10"><mml:mstyle><mml:mrow><mml:mstyle displaystyle="false"><mml:msub><mml:mi>M</mml:mi><mml:mrow><mml:mi>C</mml:mi></mml:mrow></mml:msub><mml:mo>&#x2208;</mml:mo><mml:msup><mml:mrow><mml:mi mathvariant="double-struck">R</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi><mml:mo>&#x00D7;</mml:mo><mml:mi>t</mml:mi></mml:mrow></mml:msup></mml:mstyle></mml:mrow></mml:mstyle></mml:math></inline-formula> is applied during training. This is achieved via a Hadamard product between <inline-formula><mml:math id="ieqn11"><mml:msub><mml:mrow><mml:mi>M</mml:mi></mml:mrow><mml:mrow><mml:mi>A</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula> and <inline-formula><mml:math id="ieqn12"><mml:msub><mml:mrow><mml:mi>M</mml:mi></mml:mrow><mml:mrow><mml:mi>C</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula>, ensuring that the attention mechanism is restricted to time steps prior to the current one (ranging from 1 to <italic>t</italic>), resulting in a lower-triangular matrix as illustrated in <xref ref-type="fig" rid="figure1">Figure 1C</xref>. The global autoencoded representation of the input sequence is then obtained by the following methodology with residual connections and activation functions omitted for clarity:</p><disp-formula id="E1"><label><bold>(1)</bold></label><mml:math id="eqn1"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mstyle displaystyle="true" scriptlevel="0"><mml:msub><mml:mi>X</mml:mi><mml:mrow><mml:mi>G</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:msup><mml:mi>Q</mml:mi><mml:mrow><mml:mi>T</mml:mi></mml:mrow></mml:msup><mml:mo>&#x2297;</mml:mo><mml:mi>K</mml:mi><mml:mo>&#x2299;</mml:mo><mml:msub><mml:mi>M</mml:mi><mml:mrow><mml:mi>C</mml:mi></mml:mrow></mml:msub><mml:mo>&#x2297;</mml:mo><mml:mi>V</mml:mi><mml:mo>,</mml:mo><mml:msub><mml:mi>X</mml:mi><mml:mrow><mml:mi>G</mml:mi></mml:mrow></mml:msub><mml:mo>&#x2208;</mml:mo><mml:msup><mml:mrow><mml:mi mathvariant="double-struck">R</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi><mml:mo>&#x00D7;</mml:mo><mml:mi>d</mml:mi></mml:mrow></mml:msup></mml:mstyle></mml:mrow></mml:mstyle></mml:math></disp-formula><p>While the transformer was originally proposed to model global dependencies in sequence data, sepsis onset is often correlated with local temporal patterns. Therefore, we introduce a local self-attention branch equipped with a local mask <inline-formula><mml:math id="ieqn13"><mml:mstyle><mml:mrow><mml:mstyle displaystyle="false"><mml:msub><mml:mi>M</mml:mi><mml:mrow><mml:mi>L</mml:mi></mml:mrow></mml:msub><mml:mo>&#x2208;</mml:mo><mml:msup><mml:mrow><mml:mi mathvariant="double-struck">R</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi><mml:mo>&#x00D7;</mml:mo><mml:mi>t</mml:mi></mml:mrow></mml:msup></mml:mstyle></mml:mrow></mml:mstyle></mml:math></inline-formula> to capture short-term dependencies. To implement this, earlier history beyond a predefined window is masked, such that each time step can only attend to a limited portion of the past, enabling localized temporal modeling. The local representation is obtained in a similar manner described in equation 1 as <inline-formula><mml:math id="ieqn14"><mml:mstyle><mml:mrow><mml:mstyle displaystyle="false"><mml:msub><mml:mi>X</mml:mi><mml:mrow><mml:mi>L</mml:mi></mml:mrow></mml:msub><mml:mo>&#x2208;</mml:mo><mml:msup><mml:mrow><mml:mi mathvariant="double-struck">R</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi><mml:mo>&#x00D7;</mml:mo><mml:mi>d</mml:mi></mml:mrow></mml:msup></mml:mstyle></mml:mrow></mml:mstyle></mml:math></inline-formula>. Finally, the multiscale representation of the vital sign sequence is computed as element-wise addition:</p><disp-formula id="E2"><label><bold>(2)</bold></label><mml:math id="eqn2"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mstyle displaystyle="true" scriptlevel="0"><mml:msub><mml:mi>X</mml:mi><mml:mrow><mml:mi>M</mml:mi><mml:mi>S</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:msub><mml:mi>T</mml:mi><mml:mrow><mml:mi>M</mml:mi><mml:mi>S</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo>(</mml:mo><mml:mi>S</mml:mi><mml:mo>)</mml:mo></mml:mrow><mml:mo>=</mml:mo><mml:msub><mml:mi>X</mml:mi><mml:mrow><mml:mi>G</mml:mi></mml:mrow></mml:msub><mml:mo>&#x2295;</mml:mo><mml:msub><mml:mi>X</mml:mi><mml:mrow><mml:mi>L</mml:mi></mml:mrow></mml:msub></mml:mstyle></mml:mrow></mml:mstyle></mml:math></disp-formula><p>Based on this multiscale representation, we proposed a contrastive learning framework to help the model discriminate between septic and nonseptic sequences. Specifically, as shown in <xref ref-type="fig" rid="figure1">Figure 1B</xref>, for any 2 given septic sequences <inline-formula><mml:math id="ieqn15"><mml:msub><mml:mrow><mml:mi>S</mml:mi></mml:mrow><mml:mrow><mml:mi>A</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula> and <inline-formula><mml:math id="ieqn16"><mml:msub><mml:mrow><mml:mi>S</mml:mi></mml:mrow><mml:mrow><mml:mi>B</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula>, we extract the septic and nonseptic subsequence representations <inline-formula><mml:math id="ieqn17"><mml:msubsup><mml:mrow><mml:mi>X</mml:mi></mml:mrow><mml:mrow><mml:mi>A</mml:mi></mml:mrow><mml:mrow><mml:mi>S</mml:mi><mml:mi>E</mml:mi><mml:mi>P</mml:mi></mml:mrow></mml:msubsup></mml:math></inline-formula> and <inline-formula><mml:math id="ieqn18"><mml:msubsup><mml:mrow><mml:mi>X</mml:mi></mml:mrow><mml:mrow><mml:mi>A</mml:mi></mml:mrow><mml:mrow><mml:mi>N</mml:mi><mml:mi>S</mml:mi><mml:mi>E</mml:mi><mml:mi>P</mml:mi></mml:mrow></mml:msubsup></mml:math></inline-formula> from <inline-formula><mml:math id="ieqn19"><mml:msub><mml:mrow><mml:mi>S</mml:mi></mml:mrow><mml:mrow><mml:mi>A</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula>, along with its full-sequence representation <inline-formula><mml:math id="ieqn20"><mml:msub><mml:mrow><mml:mi>X</mml:mi></mml:mrow><mml:mrow><mml:mi>A</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula>, and the septic subsequence representation<inline-formula><mml:math id="ieqn21"><mml:msubsup><mml:mrow><mml:mi>X</mml:mi></mml:mrow><mml:mrow><mml:mi>B</mml:mi></mml:mrow><mml:mrow><mml:mi>S</mml:mi><mml:mi>E</mml:mi><mml:mi>P</mml:mi></mml:mrow></mml:msubsup></mml:math></inline-formula> from <inline-formula><mml:math id="ieqn22"><mml:msub><mml:mrow><mml:mi>S</mml:mi></mml:mrow><mml:mrow><mml:mi>B</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula>. These representations are obtained by performing average pooling on the feature sequences encoded by the proposed MSTCL model (equation 2). For clarity, we omit the subscript <inline-formula><mml:math id="ieqn23"><mml:mi>M</mml:mi><mml:mi>S</mml:mi></mml:math></inline-formula> on these representations.</p><p>Intuitively, the distance between <inline-formula><mml:math id="ieqn24"><mml:msubsup><mml:mrow><mml:mi>X</mml:mi></mml:mrow><mml:mrow><mml:mi>B</mml:mi></mml:mrow><mml:mrow><mml:mi>S</mml:mi><mml:mi>E</mml:mi><mml:mi>P</mml:mi></mml:mrow></mml:msubsup></mml:math></inline-formula> and <inline-formula><mml:math id="ieqn25"><mml:msubsup><mml:mrow><mml:mi>X</mml:mi></mml:mrow><mml:mrow><mml:mi>A</mml:mi></mml:mrow><mml:mrow><mml:mi>S</mml:mi><mml:mi>E</mml:mi><mml:mi>P</mml:mi></mml:mrow></mml:msubsup></mml:math></inline-formula> should be smaller than that between <inline-formula><mml:math id="ieqn26"><mml:msubsup><mml:mrow><mml:mi>X</mml:mi></mml:mrow><mml:mrow><mml:mi>B</mml:mi></mml:mrow><mml:mrow><mml:mi>S</mml:mi><mml:mi>E</mml:mi><mml:mi>P</mml:mi></mml:mrow></mml:msubsup></mml:math></inline-formula> and <inline-formula><mml:math id="ieqn27"><mml:msubsup><mml:mrow><mml:mi>X</mml:mi></mml:mrow><mml:mrow><mml:mi>A</mml:mi></mml:mrow><mml:mrow><mml:mi>N</mml:mi><mml:mi>S</mml:mi><mml:mi>E</mml:mi><mml:mi>P</mml:mi></mml:mrow></mml:msubsup></mml:math></inline-formula>, while the distance between <inline-formula><mml:math id="ieqn28"><mml:msubsup><mml:mrow><mml:mi>X</mml:mi></mml:mrow><mml:mrow><mml:mi>B</mml:mi></mml:mrow><mml:mrow><mml:mi>S</mml:mi><mml:mi>E</mml:mi><mml:mi>P</mml:mi></mml:mrow></mml:msubsup></mml:math></inline-formula> and <inline-formula><mml:math id="ieqn29"><mml:msub><mml:mrow><mml:mi>X</mml:mi></mml:mrow><mml:mrow><mml:mi>A</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula> should lie in between. This assumption is visualized in the schematic of the representation space in <xref ref-type="fig" rid="figure1">Figure 1B</xref>. We formalize this assumption as a temporal-aware contrastive learning objective and incorporate it into the training process.</p><p>Finally, the sepsis prediction is performed using a linear layer <inline-formula><mml:math id="ieqn30"><mml:msub><mml:mrow><mml:mi>f</mml:mi></mml:mrow><mml:mrow><mml:mi>g</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula> followed by a sigmoid activation function to produce the probability of sepsis onset at each time step.</p><disp-formula id="E3"><label><bold>(3)</bold></label><mml:math id="eqn3"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mover><mml:mi>y</mml:mi><mml:mo>^</mml:mo></mml:mover></mml:mrow><mml:mo>=</mml:mo><mml:msub><mml:mi>f</mml:mi><mml:mrow><mml:mi>g</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo>(</mml:mo><mml:msub><mml:mi>X</mml:mi><mml:mrow><mml:mi>M</mml:mi><mml:mi>S</mml:mi></mml:mrow></mml:msub><mml:mo>)</mml:mo></mml:mrow><mml:mo>,</mml:mo><mml:mrow><mml:mover><mml:mi>y</mml:mi><mml:mo>^</mml:mo></mml:mover></mml:mrow><mml:mo>&#x2208;</mml:mo><mml:msup><mml:mrow><mml:mi mathvariant="double-struck">R</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi><mml:mo>&#x00D7;</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:msup></mml:mstyle></mml:mrow></mml:mstyle></mml:math></disp-formula><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Overview of the proposed method: (A) The methodology enables online sepsis prediction using only real-time, easily accessible vital signs. (B) Hybrid contrastive learning framework. (C) The autoregressive Multi-Scale Temporal-aware Contrastive Learning (MSTCL) architecture using multiscale causal masks, where darker colors represent lower values.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v14i1e82762_fig01.png"/></fig></sec><sec id="s2-3"><title>Model Training and Test</title><p>The training objective of our model consists of 2 main components: a classification loss between the step-by-step sepsis onset predictions (positive or negative) and ground truth labels <inline-formula><mml:math id="ieqn31"><mml:mstyle><mml:mrow><mml:mstyle displaystyle="false"><mml:mi>y</mml:mi><mml:mo>&#x2208;</mml:mo><mml:msup><mml:mrow><mml:mi mathvariant="double-struck">R</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi><mml:mo>&#x00D7;</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:msup></mml:mstyle></mml:mrow></mml:mstyle></mml:math></inline-formula>, simulated using a causal mask</p><disp-formula id="E4"><label><bold>(4)</bold></label><mml:math id="eqn4"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:msub><mml:mrow><mml:mi mathvariant="fraktur">L</mml:mi></mml:mrow><mml:mrow><mml:mi>p</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mo>&#x2212;</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>t</mml:mi></mml:mfrac><mml:munderover><mml:mo movablelimits="false">&#x2211;</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:munderover><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:msub><mml:mi>y</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mi>log</mml:mi><mml:mo>&#x2061;</mml:mo><mml:mrow><mml:mo>(</mml:mo><mml:msub><mml:mrow><mml:mover><mml:mi>y</mml:mi><mml:mo>^</mml:mo></mml:mover></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>)</mml:mo></mml:mrow><mml:mo>+</mml:mo><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:mn>1</mml:mn><mml:mo>&#x2212;</mml:mo><mml:msub><mml:mi>y</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo>)</mml:mo></mml:mrow><mml:mi>log</mml:mi><mml:mo>&#x2061;</mml:mo><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:mn>1</mml:mn><mml:mo>&#x2212;</mml:mo><mml:msub><mml:mrow><mml:mover><mml:mi>y</mml:mi><mml:mo>^</mml:mo></mml:mover></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo>)</mml:mo></mml:mrow></mml:mrow><mml:mo>)</mml:mo></mml:mrow><mml:mo>,</mml:mo></mml:mstyle></mml:mstyle></mml:mrow></mml:mstyle></mml:math></disp-formula><p>and a contrastive learning loss based on multiscale representations of the vital sign sequences</p><disp-formula id="E5"><label><bold>(5)</bold></label><mml:math id="eqn5"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mtable columnalign="right left right left right left right left right left right left" rowspacing="3pt" columnspacing="0em 2em 0em 2em 0em 2em 0em 2em 0em 2em 0em" displaystyle="true"><mml:mtr><mml:mtd><mml:msub><mml:mrow><mml:mi mathvariant="fraktur">L</mml:mi></mml:mrow><mml:mrow><mml:mi>c</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mtext>&#x00A0;</mml:mtext></mml:mtd><mml:mtd><mml:mi/><mml:mo movablelimits="true" form="prefix">max</mml:mo><mml:mrow><mml:mo maxsize="1.623em" minsize="1.623em">(</mml:mo></mml:mrow><mml:mn>0</mml:mn><mml:mo>,</mml:mo><mml:mtext>&#x00A0;</mml:mtext><mml:mi>d</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:msubsup><mml:mi>X</mml:mi><mml:mrow><mml:mi>B</mml:mi></mml:mrow><mml:mrow><mml:mi>S</mml:mi><mml:mi>E</mml:mi><mml:mi>P</mml:mi></mml:mrow></mml:msubsup><mml:mo>,</mml:mo><mml:msubsup><mml:mi>X</mml:mi><mml:mrow><mml:mi>A</mml:mi></mml:mrow><mml:mrow><mml:mi>N</mml:mi><mml:mi>S</mml:mi><mml:mi>E</mml:mi><mml:mi>P</mml:mi></mml:mrow></mml:msubsup></mml:mrow><mml:mo>)</mml:mo></mml:mrow><mml:mo>&#x2212;</mml:mo><mml:mi>d</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:msubsup><mml:mi>X</mml:mi><mml:mrow><mml:mi>B</mml:mi></mml:mrow><mml:mrow><mml:mi>S</mml:mi><mml:mi>E</mml:mi><mml:mi>P</mml:mi></mml:mrow></mml:msubsup><mml:mo>,</mml:mo><mml:msubsup><mml:mi>X</mml:mi><mml:mrow><mml:mi>A</mml:mi></mml:mrow><mml:mrow><mml:mi>S</mml:mi><mml:mi>E</mml:mi><mml:mi>P</mml:mi></mml:mrow></mml:msubsup></mml:mrow><mml:mo>)</mml:mo></mml:mrow><mml:mo>+</mml:mo><mml:msub><mml:mo>&#x25B3;</mml:mo><mml:mrow><mml:mi>e</mml:mi><mml:mi>a</mml:mi><mml:mi>s</mml:mi><mml:mi>y</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo maxsize="1.623em" minsize="1.623em">)</mml:mo></mml:mrow></mml:mtd></mml:mtr><mml:mtr><mml:mtd/><mml:mtd><mml:mi/><mml:mo>+</mml:mo><mml:mo movablelimits="true" form="prefix">max</mml:mo><mml:mrow><mml:mo maxsize="1.623em" minsize="1.623em">(</mml:mo></mml:mrow><mml:mn>0</mml:mn><mml:mo>,</mml:mo><mml:mtext>&#x00A0;</mml:mtext><mml:mi>d</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:msubsup><mml:mi>X</mml:mi><mml:mrow><mml:mi>B</mml:mi></mml:mrow><mml:mrow><mml:mi>S</mml:mi><mml:mi>E</mml:mi><mml:mi>P</mml:mi></mml:mrow></mml:msubsup><mml:mo>,</mml:mo><mml:msub><mml:mi>X</mml:mi><mml:mrow><mml:mi>A</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo>)</mml:mo></mml:mrow><mml:mo>&#x2212;</mml:mo><mml:mi>d</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:msubsup><mml:mi>X</mml:mi><mml:mrow><mml:mi>B</mml:mi></mml:mrow><mml:mrow><mml:mi>S</mml:mi><mml:mi>E</mml:mi><mml:mi>P</mml:mi></mml:mrow></mml:msubsup><mml:mo>,</mml:mo><mml:msubsup><mml:mi>X</mml:mi><mml:mrow><mml:mi>A</mml:mi></mml:mrow><mml:mrow><mml:mi>N</mml:mi><mml:mi>S</mml:mi><mml:mi>E</mml:mi><mml:mi>P</mml:mi></mml:mrow></mml:msubsup></mml:mrow><mml:mo>)</mml:mo></mml:mrow><mml:mo>+</mml:mo><mml:msub><mml:mo>&#x25B3;</mml:mo><mml:mrow><mml:mi>h</mml:mi><mml:mi>a</mml:mi><mml:mi>r</mml:mi><mml:mi>d</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo maxsize="1.623em" minsize="1.623em">)</mml:mo></mml:mrow><mml:mo>.</mml:mo></mml:mtd></mml:mtr></mml:mtable></mml:mstyle></mml:mrow></mml:mstyle></mml:math></disp-formula><p>where <inline-formula><mml:math id="ieqn32"><mml:msub><mml:mrow><mml:mo>&#x25B3;</mml:mo></mml:mrow><mml:mrow><mml:mi>e</mml:mi><mml:mi>a</mml:mi><mml:mi>s</mml:mi><mml:mi>y</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mn>0.25</mml:mn></mml:math></inline-formula><italic>,</italic> <inline-formula><mml:math id="ieqn33"><mml:msub><mml:mrow><mml:mo>&#x25B3;</mml:mo></mml:mrow><mml:mrow><mml:mi>h</mml:mi><mml:mi>a</mml:mi><mml:mi>r</mml:mi><mml:mi>d</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mn>0.2</mml:mn></mml:math></inline-formula> are set in this study by evaluating three configurations (0.2/0.15, 0.25/0.2, and 0.3/0.25), among which the setting of 0.25/0.2 yields the lowest mean absolute error (MAE) value of 0.113; <inline-formula><mml:math id="ieqn34"><mml:mstyle><mml:mrow><mml:mstyle displaystyle="false"><mml:mi>d</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:mo>&#x22C5;</mml:mo><mml:mo>,</mml:mo><mml:mo>&#x22C5;</mml:mo></mml:mrow><mml:mo>)</mml:mo></mml:mrow></mml:mstyle></mml:mrow></mml:mstyle></mml:math></inline-formula> denotes a distance measure, which is Euclidean distance based on L2-normalized features in this study. Our proposed MSTCL model optimized a combined loss that integrates both objectives.</p><disp-formula id="E6"><label><bold>(6)</bold></label><mml:math id="eqn6"><mml:mi mathvariant="script">L</mml:mi><mml:mo>=</mml:mo><mml:msub><mml:mrow><mml:mi mathvariant="script">L</mml:mi></mml:mrow><mml:mrow><mml:mi>P</mml:mi></mml:mrow></mml:msub><mml:mo>+</mml:mo><mml:msub><mml:mrow><mml:mi mathvariant="script">L</mml:mi></mml:mrow><mml:mrow><mml:mi>C</mml:mi></mml:mrow></mml:msub></mml:math></disp-formula><p>The model was implemented using Python (Python Software Foundation) and PyTorch (version 2.1; PyTorch Foundation) and was trained with the Adam optimizer [<xref ref-type="bibr" rid="ref17">17</xref>] with an initial learning rate of 1 &#x00D7; 10<sup>&#x2013;4</sup> for 100 epochs. The proposed MSTCL model contains approximately 0.6 million parameters. Compared with several existing deep learning&#x2013;based methods, such as temporal convolutional networks [<xref ref-type="bibr" rid="ref18">18</xref>] (approximately 0.4 million) and the method described by Li et al [<xref ref-type="bibr" rid="ref19">19</xref>] (approximately 0.45 million), our approach achieved superior performance, even in an online prediction setting, while maintaining a comparable model size. During inference, as illustrated in <xref ref-type="fig" rid="figure1">Figure 1C</xref>, neither of the 2 training losses was required. The model is capable of predicting the likelihood of sepsis onset in real-time, based solely on the newly incoming vital sign values at each time step. The inference latency of our MSTCL was 19 milliseconds with 20 MB VRAM on NVIDIA GTX 1650 Ti (4 GB).</p></sec><sec id="s2-4"><title>Evaluation Metric</title><p>In the testing phase, the model encoded the incoming vital signs sequence and performed step-by-step online prediction of <inline-formula><mml:math id="ieqn35"><mml:mover accent="true"><mml:mrow><mml:mi>y</mml:mi></mml:mrow><mml:mo>^</mml:mo></mml:mover></mml:math></inline-formula>. When the model predicted a positive case of sepsis, the current sequence is marked as septic, and the difference between the predicted onset and the ground truth is measured using MAE normalized by the input sequence length. If the model does not predict any positive outcome throughout the entire test sequence, the sequence is classified as nonseptic. Accordingly, in addition to MAE, we also used AUROC, area under the precision-recall curve (AUPRC), sensitivity, and specificity to evaluate the model&#x2019;s ability to distinguish between septic and nonseptic sequences. AUROC measures the trade-off between true positive and false positive rates across thresholds. AUPRC focuses on performance under class imbalance by evaluating precision and recall. Sensitivity (true positive rate) assesses the proportion of actual septic cases correctly identified, while specificity (true negative rate) reflects how well the model excludes nonseptic cases.</p></sec><sec id="s2-5"><title>Ethical Considerations</title><p>The publicly available, fully anonymized PhysioNet Computing in Cardiology 2019 Challenge dataset was used in this study. Our study protocol was approved by the Ethics Committee of Tianjin First Central Hospital, which waived ethical review and informed consent, and all experimental practices conformed to institutional and national human research ethics criteria and the World Medical Association Declaration of Helsinki.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><p><xref ref-type="table" rid="table2">Table 2</xref> presents the performance of the proposed method in predicting sepsis onset, measured by AUROC, AUPRC, MAE, sensitivity, and specificity. The reported MAE values are normalized by the input sequence length.</p><p>Specifically, 2 types of temporal modeling strategies were considered: local and global, corresponding to &#x201C;Loc&#x201D; and &#x201C;Glb&#x201D; in the table. For negative sampling in contrastive learning, we compared 2 types: vital sign segments from only negative patients (NegSeq in <xref ref-type="table" rid="table2">Table 2</xref>), and full-length vital sign sequences (WholeSeq in <xref ref-type="table" rid="table2">Table 2</xref>). These served as &#x201C;easy&#x201D; and &#x201C;hard&#x201D; negatives, respectively, relative to the positive sequences derived from patients with sepsis. By performing ablations on these 4 components (eg, Loc, Glb, NegSeq, and WholeSeq), we assessed the individual contributions of each design choice. From the first and second rows of <xref ref-type="table" rid="table2">Table 2</xref>, we observed that even when negative sampling was optimized for contrastive learning, the absence of either local or global temporal modeling substantially degraded performance (eg, AUROC decreased by 22.9 and 20.9 points, respectively, relative to the best-performing configuration). This finding highlights the foundational role of capturing multiscale temporal dependencies in patient vital signs for effective sepsis prediction. Rows 3, 4, and 5 further examine the impact of introducing full-length sequences as harder, transitional negatives. These helped the model learn more discriminative representations by pushing it to distinguish subtle differences in complex temporal patterns. This effect is further demonstrated through visualization analysis.</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Effect of main components on the sepsis prediction performance. The results are obtained via the average across 5-fold cross validation.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom"/><td align="left" valign="bottom">AUROC<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup>, mean (SD)</td><td align="left" valign="bottom">AUPRC<sup><xref ref-type="table-fn" rid="table2fn2">b</xref></sup>, mean (SD)</td><td align="left" valign="bottom">MAE<sup><xref ref-type="table-fn" rid="table2fn3">c</xref></sup>, mean (SD)</td><td align="left" valign="bottom">Sensitivity, mean (SD)</td><td align="left" valign="bottom">Specificity, mean (SD)</td></tr></thead><tbody><tr><td align="left" valign="top">Loc<sup><xref ref-type="table-fn" rid="table2fn4">d</xref></sup> + NegSeq<sup><xref ref-type="table-fn" rid="table2fn5">e</xref></sup> + WholeSeq<sup><xref ref-type="table-fn" rid="table2fn6">f</xref></sup></td><td align="left" valign="top">65.39 (0.22)</td><td align="left" valign="top">63.16 (0.25)</td><td align="left" valign="top">0.33 (0.01)</td><td align="left" valign="top">61.10 (0.04)</td><td align="left" valign="top">59.11 (0.04)</td></tr><tr><td align="left" valign="top">Glb<sup><xref ref-type="table-fn" rid="table2fn7">g</xref></sup> + NegSeq + WholeSeq</td><td align="left" valign="top">67.93 (0.22)</td><td align="left" valign="top">65.69 (0.25)</td><td align="left" valign="top">0.31 (0.01)</td><td align="left" valign="top">62.24 (0.04)</td><td align="left" valign="top">60.92 (0.04)</td></tr><tr><td align="left" valign="top">Loc + Glb</td><td align="left" valign="top">81.34 (0.19)</td><td align="left" valign="top">81.19 (0.22)</td><td align="left" valign="top">0.15 (0.00)</td><td align="left" valign="top">75.42 (0.02)</td><td align="left" valign="top">70.03 (0.02)</td></tr><tr><td align="left" valign="top">Loc + Glb + NegSeq</td><td align="left" valign="top">83.01 (0.18)</td><td align="left" valign="top">82.29 (0.21)</td><td align="left" valign="top">0.12 (0.00)</td><td align="left" valign="top">80.50 (0.02)</td><td align="left" valign="top">70.26 (0.02)</td></tr><tr><td align="left" valign="top">Loc + Glb + NegSeq + WholeSeq</td><td align="left" valign="top"><italic>88.34 (0.13)<sup><xref ref-type="table-fn" rid="table2fn8">h</xref></sup></italic></td><td align="left" valign="top"><italic>86.74 (0.19)</italic></td><td align="left" valign="top"><italic>0.11 (0.00)</italic></td><td align="left" valign="top"><italic>89.29 (0.01)</italic></td><td align="left" valign="top"><italic>73.02 (0.02)</italic></td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>AUROC: area under the receiver operating characteristic curve.</p></fn><fn id="table2fn2"><p><sup>b</sup>AUPRC: area under the precision-recall curve.</p></fn><fn id="table2fn3"><p><sup>c</sup>MAE: mean absolute error.</p></fn><fn id="table2fn4"><p><sup>d</sup>Loc: local temporal modeling.</p></fn><fn id="table2fn5"><p><sup>e</sup>NegSeq: vital sign segments from only negative patients.</p></fn><fn id="table2fn6"><p><sup>f</sup>WholeSeq: full-length vital sign sequences.</p></fn><fn id="table2fn7"><p><sup>g</sup>Glb: global temporal modeling.</p></fn><fn id="table2fn8"><p><sup>h</sup>The best results are italicized.</p></fn></table-wrap-foot></table-wrap><p>We applied the t-distributed stochastic neighbor embedding method to visualize the latent representations of patients&#x2019; temporal vital sign data before and after training. As shown in <xref ref-type="fig" rid="figure2">Figure 2</xref>, compared with the pretraining state (<xref ref-type="fig" rid="figure2">Figure 2A</xref>), the full-length vital sign sequences, which include both positive and negative segments, became more distinguishable from purely negative sequences after training (<xref ref-type="fig" rid="figure2">Figure 2B</xref>). This aligns with the natural assumption that full sequences are more similar to positive sequences than to negative sequences. Overall, the combination of multiscale temporal modeling and hierarchical contrastive learning yielded the best predictive performance across all metrics.</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>t-distributed stochastic neighbor embedding (t-SNE) visualization of vital sign representations before and after training. (A) Sequence representation before training and (B) sequence representation after training.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v14i1e82762_fig02.png"/></fig><p><xref ref-type="fig" rid="figure3">Figure 3</xref> illustrates the stabilization of AUROC, AUPRC, and MAE on the test dataset as the number of training epochs increased. The results cover the first 100 training epochs. All 3 metrics exhibited some fluctuation during the initial 10 epochs. After the 10th epoch, AUROC and AUPRC steadily improved, reaching their peak values, which were 88.3 and 86.7, respectively, around epoch 60, after which they plateaued. Meanwhile, the normalized MAE showed a gradual decline following the 10th epoch, with slightly more fluctuation than AUROC and AUPRC, indicating progressively more accurate predictions of sepsis onset timing. MAE also reached its lowest point around epoch 60, with greater stability in the later training stages compared with earlier ones. One possible reason for the relative instability of MAE is that it is a discrete metric, reflecting the difference between the predicted transition-to-positive point within the model&#x2019;s output sequence and the actual onset time of sepsis.</p><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Visualization of model performance metrics across the training process. AUPRC: area under the precision-recall curve; AUROC: area under the receiver operating characteristic curve; MAE: mean absolute error.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v14i1e82762_fig03.png"/></fig><p><xref ref-type="fig" rid="figure4">Figure 4</xref> shows the probability distribution of the normalized prediction error, including the probabilities of correct, early, and delayed predictions among all detected sepsis sample sequences. It can be observed that the most frequent errors occur at a lead of 0.11 and a lag of 0.11, accounting for approximately 16% and 21%, respectively. Predictions that are approximately correct (&#x00B1;0.05) each account for about 8%, indicating that more than 64% of predictions fall within a &#x00B1;0.11 error margin.</p><fig position="float" id="figure4"><label>Figure 4.</label><caption><p>Distribution of sepsis prediction errors. Negative errors indicate early predictions before sepsis onset.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v14i1e82762_fig04.png"/></fig><p><xref ref-type="table" rid="table3">Table 3</xref> compares the proposed method with existing related works across several key dimensions, including temporal modeling approach (temporal model), task type (manner), the number of training and testing samples used (samples), the number of input vital signs (input), required historical sequence length (history length), and performance metrics such as AUC and MAE. Regarding the evaluation metrics, we introduced MAE specifically to quantify the model&#x2019;s ability to precisely locate the sepsis transition point in a continuous time series. While traditional metrics like AUC evaluate classification accuracy, MAE provides insight into the &#x2018;early warning&#x2019; lead time, which is a unique focus of our MSTCL framework compared with existing single-point prediction methods. Among all methods listed, aside from our proposed approach, the kinematics approach with neural networks for early detection of sepsis (KANNEDS) [<xref ref-type="bibr" rid="ref20">20</xref>] uses the fewest types of input signals. It is based on an LSTM architecture designed for sepsis identification but lacks the capability for real-time onset prediction and requires fixed-length historical sequences. The temporal convolutional network [<xref ref-type="bibr" rid="ref18">18</xref>], on the other hand, supports variable-length input sequences for identifying patients with sepsis but relies on as many as 40 types of input signals and uses the entire original dataset. Zhao et al [<xref ref-type="bibr" rid="ref21">21</xref>] proposed a model based on light gradient boosting machine, achieving the highest AUC among identification tasks, but it still requires fixed-length historical sequences as input. Li et al [<xref ref-type="bibr" rid="ref19">19</xref>] introduced a powerful LSTM+CNN-based model capable of predicting sepsis onset, reaching an AUC of 0.96; however, it requires a large amount of training data to achieve such performance. In contrast, our proposed MSTCL achieves efficient and lightweight online sepsis prediction using only a small set of vital signs and approximately one-tenth of the data required by other methods. This demonstrates the model&#x2019;s strong performance and generalizability even under limited data conditions.</p><p>To further investigate the importance of the selected 6 vital signs, we evaluated the model&#x2019;s sensitivity by systematically masking each input signal (setting its value to zero) during the inference phase and observing the degradation in predictive performance compared with the full-feature model (ALL).</p><p>As verified by the MAE metrics obtained via leave-one-feature-out ablation over 6 vital sign inputs, excluding body temperature yielded the highest MAE (0.18) and triggered the most substantial performance decline, highlighting its critical role in identifying the systemic inflammatory response in sepsis. Removing oxygen saturation, heart rate, and systolic blood pressure separately led to moderate MAE increments of 0.14, 0.15, and 0.13, respectively, while eliminating either diastolic blood pressure or respiratory rate only caused a slight MAE elevation to 0.12; by contrast, incorporating all 6 vital signs achieved the most minimal MAE (0.11). Collectively, these results empirically support the clinical relevance of our 6-feature configuration, which strikes an effective balance between model complexity and predictive power.</p><p>The choice of margins <inline-formula><mml:math id="ieqn36"><mml:msub><mml:mrow><mml:mo>&#x25B3;</mml:mo></mml:mrow><mml:mrow><mml:mi>e</mml:mi><mml:mi>a</mml:mi><mml:mi>s</mml:mi><mml:mi>y</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula> and <inline-formula><mml:math id="ieqn37"><mml:msub><mml:mrow><mml:mo>&#x25B3;</mml:mo></mml:mrow><mml:mrow><mml:mi>h</mml:mi><mml:mi>a</mml:mi><mml:mi>r</mml:mi><mml:mi>d</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula> is crucial for hierarchical feature learning. The configuration of (0.25, 0.2) achieved the best prediction performance. However, the performance did not vary significantly with the changes in this parameter. Consequently, when applying the proposed MSTCL framework to other datasets, the setting of this parameter is unlikely to become a performance bottleneck.</p><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Comparison of the proposed model with several related approaches based on the PhysioNet Computing in Cardiology 2019 Challenge dataset.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Methods</td><td align="left" valign="bottom">Temporal model</td><td align="left" valign="bottom">Manner</td><td align="left" valign="bottom">Samples, n</td><td align="left" valign="bottom">Input data dimension</td><td align="left" valign="bottom">History length</td><td align="left" valign="bottom">AUC<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup></td><td align="left" valign="bottom">MAE<sup><xref ref-type="table-fn" rid="table3fn2">b</xref></sup></td></tr></thead><tbody><tr><td align="left" valign="top">Kinematics approach with neural networks for early detection of sepsis (KANNEDS) [<xref ref-type="bibr" rid="ref20">20</xref>]</td><td align="left" valign="top">LSTM<sup><xref ref-type="table-fn" rid="table3fn3">c</xref></sup></td><td align="left" valign="top">Detect</td><td align="left" valign="top">15,515</td><td align="left" valign="top">8</td><td align="left" valign="top">48 h</td><td align="left" valign="top">0.835</td><td align="left" valign="top">&#x2014;<sup><xref ref-type="table-fn" rid="table3fn4">d</xref></sup></td></tr><tr><td align="left" valign="top">Temporal convolutional network [<xref ref-type="bibr" rid="ref18">18</xref>]</td><td align="left" valign="top">CNN<sup><xref ref-type="table-fn" rid="table3fn5">e</xref></sup></td><td align="left" valign="top">Detect</td><td align="left" valign="top">40,336</td><td align="left" valign="top">40</td><td align="left" valign="top">Variable</td><td align="left" valign="top">0.91</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Zhao et al [<xref ref-type="bibr" rid="ref21">21</xref>]</td><td align="left" valign="top">Light gradient boosting machine</td><td align="left" valign="top">Detect</td><td align="left" valign="top">23,711</td><td align="left" valign="top">25</td><td align="left" valign="top">2,12, 24 h</td><td align="left" valign="top">0.97</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Li et al [<xref ref-type="bibr" rid="ref19">19</xref>]</td><td align="left" valign="top">LSTM + CNN</td><td align="left" valign="top">Prediction</td><td align="left" valign="top">40,336</td><td align="left" valign="top">40</td><td align="left" valign="top">11 h</td><td align="left" valign="top">0.964</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">MSTCL<sup><xref ref-type="table-fn" rid="table3fn6">f</xref></sup> (proposed model)</td><td align="left" valign="top">Multiscale transformer</td><td align="left" valign="top">Online prediction</td><td align="left" valign="top">3766</td><td align="left" valign="top">6</td><td align="left" valign="top">Variable</td><td align="left" valign="top">0.883</td><td align="left" valign="top">0.11</td></tr></tbody></table><table-wrap-foot><fn id="table3fn1"><p><sup>a</sup>AUC: area under the curve.</p></fn><fn id="table3fn2"><p><sup>b</sup>MAE: mean absolute error.</p></fn><fn id="table3fn3"><p><sup>c</sup>LSTM: long short-term memory.</p></fn><fn id="table3fn4"><p><sup>d</sup>Not reported.</p></fn><fn id="table3fn5"><p><sup>e</sup>CNN: convolutional neural network.</p></fn><fn id="table3fn6"><p><sup>f</sup>MSTCL: Multi-Scale Temporal-aware Contrastive Learning.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><p>In this study, we developed a lightweight yet effective framework for real-time sepsis prediction using only 6 commonly available vital signs. Our approach integrates a multiscale transformer-based temporal modeling architecture with a novel temporal-aware contrastive learning strategy, enabling accurate online prediction of sepsis with few input features and significantly fewer samples than most prior studies. This design is motivated by the practical challenge that high-frequency laboratory data and rich clinical notes are often unavailable in many health care settings&#x2014;particularly in low-resource environments, emergency departments, and wearable-device applications. Our findings demonstrate that sepsis prediction does not necessarily require complex or high-dimensional inputs, as long as the temporal structure of vital sign data is adequately leveraged.</p><p>The results from our experiments show that both global and local temporal dependencies play crucial roles in modeling the progression toward sepsis onset. Ablation studies indicate that removing either the global or local attention mechanism substantially degrades predictive performance, underscoring the importance of modeling multiscale dynamics in patient vital signs. This is consistent with prior findings that temporal context and resolution are key factors in accurate time-series modeling for health care applications [<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref23">23</xref>]. By combining the 2 scales through residual connections, our model captures both longer-term physiological trends and short-term fluctuations, which are often indicators of clinical deterioration.</p><p>Another significant contribution of this work is the introduction of a temporal-aware contrastive learning objective tailored for sepsis trajectory modeling. Unlike standard contrastive learning formulations, which generally rely on static sample augmentations, our framework exploits the natural progression of vital sign sequences by constructing positive, negative, and full-length sequence representations. This hybrid triplet-like structure helps the model better distinguish between subtle temporal variations, especially when labeled data are limited. Similar supervised contrastive approaches have shown promise in related health care domains, such as mortality prediction [<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref25">25</xref>] and patient state representation [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref27">27</xref>], and our work further demonstrates their applicability in the context of real-time warning tasks.</p><p>Compared with prior studies, our approach requires far fewer training samples. For example, Li et al [<xref ref-type="bibr" rid="ref19">19</xref>] developed a hybrid CNN-LSTM model that achieved a high AUC (up to 0.96) for sepsis onset prediction but required the full MIMIC dataset and numerous laboratory-based inputs. Other models, such as KANNEDS [<xref ref-type="bibr" rid="ref20">20</xref>] or light gradient boosting machine&#x2013;based architectures [<xref ref-type="bibr" rid="ref21">21</xref>], either relied on fixed-length input windows or used up to 40 types of features, limiting their generalizability and real-time applicability. In contrast, our method achieves comparable performance while being trained on fewer than 10% of the original dataset and using only 6 vital signs, significantly expanding its deployment potential.</p><p>A key clinical advantage of our approach is the reliance on only 6 noninvasive vital signs, a strategy aligned with several established models [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref29">29</xref>]. However, we emphasize that the primary innovation of this study is the MSTCL framework itself rather than the specific feature subset. By enforcing contrastive constraints across multiple temporal scales, the framework captures the fine-grained physiological shifts preceding sepsis onset more effectively. This allows our model to bridge the performance gap between limited input and comprehensive input systems, providing a robust tool for high-precision, real-time clinical monitoring.</p><p>Our contrastive visualization results further support the model&#x2019;s ability to learn meaningful representations. As shown in <xref ref-type="fig" rid="figure2">Figure 2</xref>, the latent space representations after training display clearer separability between septic and nonseptic patterns, with full-length sequences positioned between the positive and negative extremes. This aligns with clinical intuition and confirms that our contrastive learning framework facilitates more discriminative embedding learning, especially in scenarios with reduced feature sets.</p><p>Despite these promising results, there are limitations to our study. First, while the model supports variable-length sequences, extremely short sequences (eg, &#x003C;4 hours) may not provide enough temporal context for reliable prediction. Although our model is designed to be robust to input length, future work could explore adaptive mechanisms that adjust attention scope based on data sparsity. Second, our evaluation focuses on binary classification of sepsis onset. Extending the framework to estimate time-to-onset as a survival analysis task or to model continuous deterioration risk could offer additional clinical value.</p><p>Moreover, our current contrastive design relies on predefined segmentations of sequences into septic and nonseptic windows. While effective, this assumes a clear ground truth onset time in the training phase, which in practice can be noisy or inconsistently recorded across institutions. Future iterations could incorporate soft labels or probabilistic sequence labeling to handle uncertainty in sepsis onset annotations.</p><p>From a clinical deployment perspective, the simplicity and efficiency of our model offer distinct advantages. The low computational cost of inference and reliance on readily available vital signs make it suitable for edge deployment on patient monitors or wearable devices. This aligns with broader efforts in ubiquitous health monitoring and early warning systems, where predictive models must operate under resource and latency constraints [<xref ref-type="bibr" rid="ref30">30</xref>]. The interpretability of the model, particularly via attention visualization or representation clustering, is also a promising direction for integration into clinician-facing decision support tools.</p><p>In conclusion, this study presents a novel and efficient framework for online sepsis prediction using only fundamental physiological real-time signals. Through multiscale temporal modeling and contrastive learning, we demonstrate that even with limited data, accurate and timely sepsis detection is achievable. These findings underscore the potential for deploying intelligent monitoring solutions across a wide range of clinical and nonclinical settings, ultimately contributing to better patient outcomes and more efficient resource allocation in critical care.</p></sec></body><back><notes><sec><title>Funding</title><p>This work was supported by the National Key Clinical Specialties Construction Program in Tianjin Health Research Project (grant TJWJ2025ZK007), the Infectious Diseases Department (grant 8235), the Tianjin First Central Hospital Intramural Fund (grant 2025FYQN10), and the Natural Science Foundation of Tianjin (grant 25JCYBJC01350).</p></sec></notes><fn-group><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">AUC</term><def><p>area under the curve</p></def></def-item><def-item><term id="abb2">AUPRC</term><def><p>area under the precision-recall curve</p></def></def-item><def-item><term id="abb3">AUROC</term><def><p>area under the receiver operating characteristic curve</p></def></def-item><def-item><term id="abb4">CNN</term><def><p>convolutional neural network</p></def></def-item><def-item><term id="abb5">ICU</term><def><p>intensive care unit</p></def></def-item><def-item><term id="abb6">KANNEDS</term><def><p>kinematics approach with neural networks for early detection of sepsis</p></def></def-item><def-item><term id="abb7">LSTM</term><def><p>long short-term memory</p></def></def-item><def-item><term id="abb8">MAE</term><def><p>mean absolute error</p></def></def-item><def-item><term id="abb9">MSTCL</term><def><p>Multi-Scale Temporal-aware Contrastive Learning</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Singer</surname><given-names>M</given-names> </name><name name-style="western"><surname>Deutschman</surname><given-names>CS</given-names> </name><name name-style="western"><surname>Seymour</surname><given-names>CW</given-names> </name><etal/></person-group><article-title>The third international consensus definitions for sepsis and septic shock (sepsis-3)</article-title><source>JAMA</source><year>2016</year><month>02</month><day>23</day><volume>315</volume><issue>8</issue><fpage>801</fpage><lpage>810</lpage><pub-id pub-id-type="doi">10.1001/jama.2016.0287</pub-id><pub-id pub-id-type="medline">26903338</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rhee</surname><given-names>C</given-names> </name><name name-style="western"><surname>Dantes</surname><given-names>R</given-names> </name><name name-style="western"><surname>Epstein</surname><given-names>L</given-names> </name><etal/></person-group><article-title>Incidence and trends of sepsis in US hospitals using clinical vs claims data, 2009-2014</article-title><source>JAMA</source><year>2017</year><month>10</month><day>3</day><volume>318</volume><issue>13</issue><fpage>1241</fpage><lpage>1249</lpage><pub-id pub-id-type="doi">10.1001/jama.2017.13836</pub-id><pub-id pub-id-type="medline">28903154</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Villar</surname><given-names>J</given-names> </name><name name-style="western"><surname>Clement</surname><given-names>JP</given-names> </name><name name-style="western"><surname>Stotts</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Many emergency department patients with severe sepsis and septic shock do not meet diagnostic criteria within 3 hours of arrival</article-title><source>Ann Emerg Med</source><year>2014</year><month>07</month><volume>64</volume><issue>1</issue><fpage>48</fpage><lpage>54</lpage><pub-id pub-id-type="doi">10.1016/j.annemergmed.2014.02.023</pub-id><pub-id pub-id-type="medline">24680548</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Alexandropoulou</surname><given-names>CA</given-names> </name><name name-style="western"><surname>Panagiotopoulos</surname><given-names>I</given-names> </name><name name-style="western"><surname>Kleanthous</surname><given-names>S</given-names> </name><etal/></person-group><article-title>AI-enabled solutions, explainability and ethical concerns for predicting sepsis in ICUs: a systematic review</article-title><conf-name>2023 IEEE 19th International Conference on e-Science (e-Science)</conf-name><conf-date>Oct 9-13, 2023</conf-date><pub-id pub-id-type="doi">10.1109/e-Science58273.2023.10254863</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Stylianides</surname><given-names>C</given-names> </name><name name-style="western"><surname>Nicolaou</surname><given-names>A</given-names> </name><name name-style="western"><surname>Sulaiman</surname><given-names>WA</given-names> </name><etal/></person-group><article-title>AI advances in ICU with an emphasis on sepsis prediction: an overview</article-title><source>Mach Learn Knowl Extr</source><year>2025</year><volume>7</volume><issue>1</issue><fpage>6</fpage><pub-id pub-id-type="doi">10.3390/make7010006</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Seymour</surname><given-names>CW</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>VX</given-names> </name><name name-style="western"><surname>Iwashyna</surname><given-names>TJ</given-names> </name><etal/></person-group><article-title>Assessment of clinical criteria for sepsis: for the third international consensus definitions for sepsis and septic shock (sepsis-3)</article-title><source>JAMA</source><year>2016</year><month>02</month><day>23</day><volume>315</volume><issue>8</issue><fpage>762</fpage><lpage>774</lpage><pub-id pub-id-type="doi">10.1001/jama.2016.0288</pub-id><pub-id pub-id-type="medline">26903335</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Dorsett</surname><given-names>M</given-names> </name><name name-style="western"><surname>Kroll</surname><given-names>M</given-names> </name><name name-style="western"><surname>Smith</surname><given-names>CS</given-names> </name><name name-style="western"><surname>Asaro</surname><given-names>P</given-names> </name><name name-style="western"><surname>Liang</surname><given-names>SY</given-names> </name><name name-style="western"><surname>Moy</surname><given-names>HP</given-names> </name></person-group><article-title>qSOFA has poor sensitivity for prehospital identification of severe sepsis and septic shock</article-title><source>Prehosp Emerg Care</source><year>2017</year><volume>21</volume><issue>4</issue><fpage>489</fpage><lpage>497</lpage><pub-id pub-id-type="doi">10.1080/10903127.2016.1274348</pub-id><pub-id pub-id-type="medline">28121217</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Usman</surname><given-names>OA</given-names> </name><name name-style="western"><surname>Usman</surname><given-names>AA</given-names> </name><name name-style="western"><surname>Ward</surname><given-names>MA</given-names> </name></person-group><article-title>Comparison of SIRS, qSOFA, and NEWS for the early identification of sepsis in the emergency department</article-title><source>Am J Emerg Med</source><year>2019</year><month>08</month><volume>37</volume><issue>8</issue><fpage>1490</fpage><lpage>1497</lpage><pub-id pub-id-type="doi">10.1016/j.ajem.2018.10.058</pub-id><pub-id pub-id-type="medline">30470600</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Nemati</surname><given-names>S</given-names> </name><name name-style="western"><surname>Holder</surname><given-names>A</given-names> </name><name name-style="western"><surname>Razmi</surname><given-names>F</given-names> </name><name name-style="western"><surname>Stanley</surname><given-names>MD</given-names> </name><name name-style="western"><surname>Clifford</surname><given-names>GD</given-names> </name><name name-style="western"><surname>Buchman</surname><given-names>TG</given-names> </name></person-group><article-title>An interpretable machine learning model for accurate prediction of sepsis in the ICU</article-title><source>Crit Care Med</source><year>2018</year><month>04</month><volume>46</volume><issue>4</issue><fpage>547</fpage><lpage>553</lpage><pub-id pub-id-type="doi">10.1097/CCM.0000000000002936</pub-id><pub-id pub-id-type="medline">29286945</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rafiei</surname><given-names>A</given-names> </name><name name-style="western"><surname>Rezaee</surname><given-names>A</given-names> </name><name name-style="western"><surname>Hajati</surname><given-names>F</given-names> </name><name name-style="western"><surname>Gheisari</surname><given-names>S</given-names> </name><name name-style="western"><surname>Golzan</surname><given-names>M</given-names> </name></person-group><article-title>SSP: early prediction of sepsis using fully connected LSTM-CNN model</article-title><source>Comput Biol Med</source><year>2021</year><month>01</month><volume>128</volume><fpage>104110</fpage><pub-id pub-id-type="doi">10.1016/j.compbiomed.2020.104110</pub-id><pub-id pub-id-type="medline">33227577</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cheng</surname><given-names>CY</given-names> </name><name name-style="western"><surname>Kung</surname><given-names>CT</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>FC</given-names> </name><etal/></person-group><article-title>Machine learning models for predicting in-hospital mortality in patient with sepsis: analysis of vital sign dynamics</article-title><source>Front Med (Lausanne)</source><year>2022</year><volume>9</volume><fpage>964667</fpage><pub-id pub-id-type="doi">10.3389/fmed.2022.964667</pub-id><pub-id pub-id-type="medline">36341257</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Vaswani</surname><given-names>A</given-names> </name><name name-style="western"><surname>Shazeer</surname><given-names>N</given-names> </name><name name-style="western"><surname>Parmar</surname><given-names>N</given-names> </name><etal/></person-group><person-group person-group-type="editor"><name name-style="western"><surname>von Luxburg</surname><given-names>U</given-names> </name><name name-style="western"><surname>Guyon</surname><given-names>I</given-names> </name><name name-style="western"><surname>Bengio</surname><given-names>S</given-names> </name><name name-style="western"><surname>Wallach</surname><given-names>H</given-names> </name><name name-style="western"><surname>Fergus</surname><given-names>R</given-names> </name></person-group><article-title>Attention is all you need</article-title><source>NIPS&#x2019;17: Proceedings of the 31st International Conference on Neural Information Processing Systems</source><year>2017</year><publisher-name>Curran Associates Inc</publisher-name><pub-id pub-id-type="other">9781510860964</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Li</surname><given-names>J</given-names> </name></person-group><article-title>A time series driven model for early sepsis prediction based on transformer module</article-title><source>BMC Med Res Methodol</source><year>2024</year><month>01</month><day>25</day><volume>24</volume><issue>1</issue><fpage>23</fpage><pub-id pub-id-type="doi">10.1186/s12874-023-02138-6</pub-id><pub-id pub-id-type="medline">38273257</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chang</surname><given-names>P</given-names> </name><name name-style="western"><surname>Li</surname><given-names>H</given-names> </name><name name-style="western"><surname>Quan</surname><given-names>SF</given-names> </name><etal/></person-group><article-title>A transformer-based diffusion probabilistic model for heart rate and blood pressure forecasting in intensive care unit</article-title><source>Comput Methods Programs Biomed</source><year>2024</year><month>04</month><volume>246</volume><fpage>108060</fpage><pub-id pub-id-type="doi">10.1016/j.cmpb.2024.108060</pub-id><pub-id pub-id-type="medline">38350189</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Johnson</surname><given-names>AE</given-names> </name><name name-style="western"><surname>Pollard</surname><given-names>TJ</given-names> </name><name name-style="western"><surname>Shen</surname><given-names>L</given-names> </name><etal/></person-group><article-title>MIMIC-III, a freely accessible critical care database</article-title><source>Sci Data</source><year>2016</year><month>05</month><day>24</day><volume>3</volume><fpage>160035</fpage><pub-id pub-id-type="doi">10.1038/sdata.2016.35</pub-id><pub-id pub-id-type="medline">27219127</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Reyna</surname><given-names>MA</given-names> </name><name name-style="western"><surname>Josef</surname><given-names>CS</given-names> </name><name name-style="western"><surname>Jeter</surname><given-names>R</given-names> </name><etal/></person-group><article-title>Early prediction of sepsis from clinical data: the PhysioNet/Computing in Cardiology Challenge 2019</article-title><source>Crit Care Med</source><year>2020</year><month>02</month><volume>48</volume><issue>2</issue><fpage>210</fpage><lpage>217</lpage><pub-id pub-id-type="doi">10.1097/CCM.0000000000004145</pub-id><pub-id pub-id-type="medline">31939789</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Kingma</surname><given-names>DP</given-names> </name><name name-style="western"><surname>Ba</surname><given-names>J</given-names> </name></person-group><article-title>Adam: a method for stochastic optimization</article-title><source>arXiv</source><comment>Preprint posted online on  Dec 22, 2014</comment><pub-id pub-id-type="doi">10.48550/arXiv.1412.6980</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kok</surname><given-names>C</given-names> </name><name name-style="western"><surname>Jahmunah</surname><given-names>V</given-names> </name><name name-style="western"><surname>Oh</surname><given-names>SL</given-names> </name><etal/></person-group><article-title>Automated prediction of sepsis using temporal convolutional network</article-title><source>Comput Biol Med</source><year>2020</year><month>12</month><volume>127</volume><fpage>103957</fpage><pub-id pub-id-type="doi">10.1016/j.compbiomed.2020.103957</pub-id><pub-id pub-id-type="medline">32938540</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Li</surname><given-names>X</given-names> </name><name name-style="western"><surname>Andr&#x00E9; Ng</surname><given-names>G</given-names> </name><name name-style="western"><surname>Schlindwein</surname><given-names>F</given-names> </name></person-group><article-title>Convolutional and recurrent neural networks for early detection of sepsis using hourly physiological data from patients in intensive care unit</article-title><conf-name>2019 Computing in Cardiology Conference</conf-name><conf-date>Sep 8-11, 2019</conf-date><pub-id pub-id-type="doi">10.22489/CinC.2019.054</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cruz</surname><given-names>MF</given-names> </name><name name-style="western"><surname>Ono</surname><given-names>N</given-names> </name><name name-style="western"><surname>Huang</surname><given-names>M</given-names> </name><name name-style="western"><surname>Altaf-Ul-Amin</surname><given-names>M</given-names> </name><name name-style="western"><surname>Kanaya</surname><given-names>S</given-names> </name><name name-style="western"><surname>Cavalcante</surname><given-names>C</given-names> </name></person-group><article-title>Kinematics approach with neural networks for early detection of sepsis (KANNEDS)</article-title><source>BMC Med Inform Decis Mak</source><year>2021</year><month>05</month><day>20</day><volume>21</volume><issue>1</issue><fpage>163</fpage><pub-id pub-id-type="doi">10.1186/s12911-021-01529-3</pub-id><pub-id pub-id-type="medline">34016115</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhao</surname><given-names>X</given-names> </name><name name-style="western"><surname>Shen</surname><given-names>W</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>G</given-names> </name></person-group><article-title>Early prediction of sepsis based on machine learning algorithm</article-title><source>Comput Intell Neurosci</source><year>2021</year><volume>2021</volume><fpage>6522633</fpage><pub-id pub-id-type="doi">10.1155/2021/6522633</pub-id><pub-id pub-id-type="medline">34675971</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Patharkar</surname><given-names>A</given-names> </name><name name-style="western"><surname>Cai</surname><given-names>F</given-names> </name><name name-style="western"><surname>Al-Hindawi</surname><given-names>F</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>T</given-names> </name></person-group><article-title>Predictive modeling of biomedical temporal data in healthcare applications: review and future directions</article-title><source>Front Physiol</source><year>2024</year><volume>15</volume><fpage>1386760</fpage><pub-id pub-id-type="doi">10.3389/fphys.2024.1386760</pub-id><pub-id pub-id-type="medline">39473609</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Manashty</surname><given-names>A</given-names> </name><name name-style="western"><surname>Light</surname><given-names>J</given-names> </name></person-group><article-title>Life model: a novel representation of life-long temporal sequences in health predictive analytics</article-title><source>Future Gener Comput Syst</source><year>2019</year><month>03</month><volume>92</volume><fpage>141</fpage><lpage>156</lpage><pub-id pub-id-type="doi">10.1016/j.future.2018.09.033</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Liu</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Qin</surname><given-names>S</given-names> </name><name name-style="western"><surname>Salim</surname><given-names>FD</given-names> </name><name name-style="western"><surname>Yepes</surname><given-names>AJ</given-names> </name></person-group><article-title>Contrastive learning-based imputation-prediction networks for in-hospital mortality risk modeling using EHRs</article-title><source>Machine Learning and Knowledge Discovery in Databases: Applied Data Science and Demo Track</source><year>2023</year><publisher-name>Springer Nature</publisher-name></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wanyan</surname><given-names>T</given-names> </name><name name-style="western"><surname>Honarvar</surname><given-names>H</given-names> </name><name name-style="western"><surname>Jaladanki</surname><given-names>SK</given-names> </name><etal/></person-group><article-title>Contrastive learning improves critical event prediction in COVID-19 patients</article-title><source>Patterns (N Y)</source><year>2021</year><month>12</month><day>10</day><volume>2</volume><issue>12</issue><fpage>100389</fpage><pub-id pub-id-type="doi">10.1016/j.patter.2021.100389</pub-id><pub-id pub-id-type="medline">34723227</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Liu</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Alavi</surname><given-names>A</given-names> </name><name name-style="western"><surname>Li</surname><given-names>M</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>X</given-names> </name></person-group><article-title>Self-supervised contrastive learning for medical time series: a systematic review</article-title><source>Sensors (Basel)</source><year>2023</year><volume>23</volume><issue>9</issue><fpage>4221</fpage><pub-id pub-id-type="doi">10.3390/s23094221</pub-id><pub-id pub-id-type="medline">37177423</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Y&#x00E8;che</surname><given-names>H</given-names> </name><name name-style="western"><surname>Dresdner</surname><given-names>G</given-names> </name><name name-style="western"><surname>Locatello</surname><given-names>F</given-names> </name><name name-style="western"><surname>H&#x00FC;ser</surname><given-names>M</given-names> </name><name name-style="western"><surname>R&#x00E4;tsch</surname><given-names>G</given-names> </name></person-group><article-title>Neighborhood contrastive learning applied to online patient monitoring</article-title><source>Proc Mach Learn Res</source><year>2021</year><access-date>2026-06-03</access-date><volume>139</volume><fpage>11964</fpage><lpage>11974</lpage><comment><ext-link ext-link-type="uri" xlink:href="https://proceedings.mlr.press/v139/yeche21a.html">https://proceedings.mlr.press/v139/yeche21a.html</ext-link></comment></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mao</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Jay</surname><given-names>M</given-names> </name><name name-style="western"><surname>Hoffman</surname><given-names>JL</given-names> </name><etal/></person-group><article-title>Multicentre validation of a sepsis prediction algorithm using only vital sign data in the emergency department, general ward and ICU</article-title><source>BMJ Open</source><year>2018</year><month>01</month><day>26</day><volume>8</volume><issue>1</issue><fpage>e017833</fpage><pub-id pub-id-type="doi">10.1136/bmjopen-2017-017833</pub-id><pub-id pub-id-type="medline">29374661</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Giordano</surname><given-names>M</given-names> </name><name name-style="western"><surname>Dheman</surname><given-names>K</given-names> </name><name name-style="western"><surname>Magno</surname><given-names>M</given-names> </name></person-group><article-title>SepAl: sepsis alerts on low-power wearables with digital biomarkers and on-device tiny machine learning</article-title><source>IEEE Sensors J</source><year>2025</year><volume>25</volume><issue>5</issue><fpage>7858</fpage><lpage>7866</lpage><pub-id pub-id-type="doi">10.1109/JSEN.2024.3424655</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shaik</surname><given-names>T</given-names> </name><name name-style="western"><surname>Tao</surname><given-names>X</given-names> </name><name name-style="western"><surname>Higgins</surname><given-names>N</given-names> </name><etal/></person-group><article-title>Remote patient monitoring using artificial intelligence: current state, applications, and challenges</article-title><source>WIREs Data Mining Knowl Discov</source><year>2023</year><month>03</month><fpage>e1485</fpage><pub-id pub-id-type="doi">10.1002/widm.1485</pub-id></nlm-citation></ref></ref-list></back></article>