<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id><journal-id journal-id-type="publisher-id">medinform</journal-id><journal-id journal-id-type="index">7</journal-id><journal-title>JMIR Medical Informatics</journal-title><abbrev-journal-title>JMIR Med Inform</abbrev-journal-title><issn pub-type="epub">2291-9694</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v14i1e79929</article-id><article-id pub-id-type="doi">10.2196/79929</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Development Process of a Clinical Decision Support System for Empiric Antibiotic Therapies in Patients With Sepsis: Case Study</article-title></title-group><contrib-group><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Schmiegel</surname><given-names>Sophie</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Marchi</surname><given-names>Hannah</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Hege</surname><given-names>Philipp</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Elkenkamp</surname><given-names>Svenja</given-names></name><degrees>MEd, MSc</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Duevel</surname><given-names>Juliane</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>D&#x00FC;sing</surname><given-names>Christoph</given-names></name><degrees>Dr rer nat</degrees><xref ref-type="aff" rid="aff4">4</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Greiner</surname><given-names>Wolfgang</given-names></name><degrees>Prof Dr</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Scholz</surname><given-names>Sean Selim</given-names></name><degrees>Priv-Doz, Dr med, MHBA</degrees><xref ref-type="aff" rid="aff5">5</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Witzke</surname><given-names>Dominic</given-names></name><xref ref-type="aff" rid="aff5">5</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Tebbe</surname><given-names>Johannes J</given-names></name><degrees>Prof Dr med</degrees><xref ref-type="aff" rid="aff6">6</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Wehmeier</surname><given-names>Michael</given-names></name><degrees>Dr med Dipl-Biochem</degrees><xref ref-type="aff" rid="aff7">7</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Kaup</surname><given-names>Olaf</given-names></name><degrees>Dr rer nat Dipl-Biochem</degrees><xref ref-type="aff" rid="aff7">7</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Borgstedt</surname><given-names>Rainer</given-names></name><degrees>Dr med</degrees><xref ref-type="aff" rid="aff5">5</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Rehberg</surname><given-names>Sebastian</given-names></name><degrees>Prof Dr med</degrees><xref ref-type="aff" rid="aff5">5</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Cimiano</surname><given-names>Philipp</given-names></name><degrees>Prof Dr</degrees><xref ref-type="aff" rid="aff4">4</xref></contrib><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Fuchs</surname><given-names>Christiane</given-names></name><degrees>Prof Dr</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff8">8</xref></contrib></contrib-group><aff id="aff1"><institution>Data Science Group, Faculty of Business Administration and Economics, Bielefeld University</institution><addr-line>Universit&#x00E4;tsstra&#x00DF;e 25, North Rhine-Westphalia</addr-line><addr-line>Bielefeld</addr-line><country>Germany</country></aff><aff id="aff2"><institution>AG 5 - Health Economics and Health Care Management, School of Public Health, Bielefeld University</institution><addr-line>Bielefeld</addr-line><country>Germany</country></aff><aff id="aff3"><institution>Centre for electronic Public Health Research (CePHR),, School of Public Health, Bielefeld University</institution><addr-line>Bielefeld</addr-line><country>Germany</country></aff><aff id="aff4"><institution>Center for Cognitive Interaction Technology (CITEC), Faculty of Technology, Bielefeld University</institution><addr-line>Bielefeld</addr-line><country>Germany</country></aff><aff id="aff5"><institution>Department of Anaesthesiology, Intensive Care, Emergency Medicine, Transfusion Medicine and Pain Therapy, Medical School and University Medical Center OWL, Bielefeld University, Protestant Hospital of the Bethel Foundation</institution><addr-line>Bielefeld</addr-line><country>Germany</country></aff><aff id="aff6"><institution>Division of Internal Medicine, Department of Gastroenterology and Infectiology, Medical School and University Medical Center OWL, Bielefeld University, Klinikum Lippe</institution><addr-line>Detmold</addr-line><country>Germany</country></aff><aff id="aff7"><institution>Institute of Laboratory Medicine, Microbiology and Transfusion Medicine, Klinikum Bielefeld</institution><addr-line>Bielefeld</addr-line><country>Germany</country></aff><aff id="aff8"><institution>Institute of Computational Biology, Computational Health Center, Helmholtz Munich</institution><addr-line>Oberschlei&#x00DF;heim</addr-line><country>Germany</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Coristine</surname><given-names>Andrew</given-names></name></contrib><contrib contrib-type="editor"><name name-style="western"><surname>Benis</surname><given-names>Arriel</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Nowak</surname><given-names>Hartmuth</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Schwermer</surname><given-names>Heinzpeter</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Okunbor</surname><given-names>Opeyemi</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Christiane Fuchs, Prof Dr, Data Science Group, Faculty of Business Administration and Economics, Bielefeld University, Universit&#x00E4;tsstra&#x00DF;e 25, North Rhine-Westphalia, Bielefeld, 33615, Germany, 49 521 106 2576; <email>christiane.fuchs@uni-bielefeld.de</email></corresp><fn fn-type="equal" id="equal-contrib1"><label>*</label><p>these authors contributed equally</p></fn></author-notes><pub-date pub-type="collection"><year>2026</year></pub-date><pub-date pub-type="epub"><day>13</day><month>5</month><year>2026</year></pub-date><volume>14</volume><elocation-id>e79929</elocation-id><history><date date-type="received"><day>08</day><month>07</month><year>2025</year></date><date date-type="rev-recd"><day>06</day><month>03</month><year>2026</year></date><date date-type="accepted"><day>06</day><month>03</month><year>2026</year></date></history><copyright-statement>&#x00A9; Sophie Schmiegel, Hannah Marchi, Philipp Hege, Svenja Elkenkamp, Juliane Duevel, Christoph D&#x00FC;sing, Wolfgang Greiner, Sean Selim Scholz, Dominic Witzke, Johannes J Tebbe, Michael Wehmeier, Olaf Kaup, Rainer Borgstedt, Sebastian Rehberg, Philipp Cimiano, Christiane Fuchs. Originally published in JMIR Medical Informatics (<ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org">https://medinform.jmir.org</ext-link>), 13.5.2026. </copyright-statement><copyright-year>2026</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org/">https://medinform.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://medinform.jmir.org/2026/1/e79929"/><abstract><sec><title>Background</title><p>Antibiotic therapies are the main treatment for bacterial infections, but growing antibiotic resistance is a major global health threat, severely impacting patients with sepsis. Rapid selection of the most effective antibiotic therapy is critical for survival and for preventing further resistance. Physicians must consider numerous factors for proper empiric treatment selection. A clinical decision support system (CDSS) aims to support physicians in this process, facilitating rapid and targeted therapy.</p></sec><sec><title>Objective</title><p>The purpose of this work is to explore the extent to which the realization of a CDSS is possible based on the data available to us and to document insights gained during the development of a foundational model designed to assist physicians in determining empiric treatment options for patients with sepsis. In this regard, rather than aiming to develop a CDSS for clinical application, we highlight the importance of close interprofessional collaboration between scientists from various disciplines and analyze the effects of data quality and quantity on the performance of our statistical models.</p></sec><sec sec-type="methods"><title>Methods</title><p>Empirical scientists conducted interviews with medical practitioners to acquire the medical knowledge required to develop sound statistical models. We developed and applied 2-step cross-sectional, as well as time-series classification models, to carefully preprocessed data of patients with sepsis admitted to the intensive care unit of a German hospital.</p></sec><sec sec-type="results"><title>Results</title><p>We identified several factors as crucial information for valid decisions on empiric therapy for treating patients with sepsis. These include the patients&#x2019; core data, especially the infection focus. To prevent further resistance, individual risk factors such as travel history and professional background should be considered. The evaluation of a therapy&#x2019;s effectiveness is mainly based on the patient&#x2019;s general condition and blood values such as procalcitonin and interleukin 6. One key factor in the acceptance of a CDSS is the explainability of the results produced by the applied methods. Our models demonstrated mainly weak predictive ability for all considered empiric antibiotic therapies. However, they are not yet suitable for use in clinical practice, especially as they are based on prescribing habits rather than on optimal treatment decisions.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>This work highlights the importance of interprofessional collaboration between medical experts and model developers, ensuring that data quality and clinical relevance are central to the process. It emphasizes the urgent need for high-quality, comprehensive data to overcome challenges such as data discontinuity and improve model performance, particularly through enhanced digitization in health care. This feasibility study will facilitate future efforts to develop a CDSS for treating patients with sepsis and to translate it into clinical use.</p></sec></abstract><kwd-group><kwd>antibiotic prescription</kwd><kwd>antibiotic resistances</kwd><kwd>clinical decision support system</kwd><kwd>multiclass classification</kwd><kwd>sepsis</kwd><kwd>time series classification</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><sec id="s1-1"><title>Motivation</title><p>Antibiotic therapies represent a milestone within pharmacological and clinical research and are commonly used in the treatment of bacterial infections ranging from mild cystitis to life-threatening sepsis. Sepsis is a severe and rapidly progressing course of a bacterial infection that needs to be treated within the first 3 hours after diagnosis to increase the chances of patient survival [<xref ref-type="bibr" rid="ref1">1</xref>]. The chance of treatment success rises with increased coverage of pathogens; thus, the Surviving Sepsis Campaign Guidelines for Management of Sepsis and Septic Shock 2021 [<xref ref-type="bibr" rid="ref1">1</xref>] recommend a broad-spectrum antibiotic as empiric (ie, the initial) therapy. Accordingly, German hospital guidelines recommend the use of a broad-spectrum antibiotic, in particular if the focus of infection is unknown. While broad-spectrum antibiotics are likely to be effective, they come with a variety of side effects, such as gastrointestinal complaints and drug fever [<xref ref-type="bibr" rid="ref2">2</xref>], and harbor the risk of developing antibiotic resistance [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref4">4</xref>]. Such resistance poses a global threat to health care systems [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref6">6</xref>]. Thus, an important goal is to minimize the use of broad-spectrum antibiotics. A direct point of action for this is inappropriate prescriptions, for example, in the case of viral infections [<xref ref-type="bibr" rid="ref7">7</xref>], and still common self-prescriptions due to low-threshold access to antibiotics [<xref ref-type="bibr" rid="ref8">8</xref>]. Overall, preventing the development of further resistance requires consistent antibiotic stewardship and support in selecting targeted antibiotic therapies. The latter is particularly difficult in the case of severe disorders such as sepsis, which are the focus of this work. Even for experienced physicians, the diagnosis and treatment of sepsis are challenging tasks [<xref ref-type="bibr" rid="ref9">9</xref>].</p></sec><sec id="s1-2"><title>Background</title><sec id="s1-2-1"><title>Project Background</title><p>This work has emerged from and shows an excerpt of the research in the interprofessional project &#x201C;KINBIOTICS&#x201D; [<xref ref-type="bibr" rid="ref10">10</xref>], funded by the German Federal Ministry of Health from 2020 to 2024. An overarching objective of the &#x201C;KINBIOTICS&#x201D; consortium project was to develop an artificial intelligence (AI)&#x2013;based clinical decision support system (CDSS) for the individualized prediction of targeted, effective antibiotic therapies with low side effects for patients with sepsis. Such a CDSS would help clinicians make rapid and targeted treatment decisions and thus save lives and reduce the progressive occurrence of antimicrobial resistance. Additionally, the process of developing a data-driven CDSS has the potential to reveal previously unconsidered patterns in the data, thereby providing substantial benefits to the current prescription process.</p><p>Research in the &#x201C;KINBIOTICS&#x201D; project was conducted by medical practitioners and empirical scientists from various disciplines, including information technology, data science, biotechnology, health sciences, and medicine. The scientists were affiliated with 5 institutions, namely Bielefeld University, University of Siegen, Evangelisches Klinikum Bethel, Klinikum Bielefeld, and Klinikum Lippe. The project was organized in work packages addressing a range of topics, including the prediction of the pathogen and resistance spectrum by nanopore sequencing [<xref ref-type="bibr" rid="ref11">11</xref>], the setup of a data warehouse including the creation of preconditions for federated learning [<xref ref-type="bibr" rid="ref12">12</xref>], the development of a resistance observatory [<xref ref-type="bibr" rid="ref13">13</xref>], evaluation of a pilot CDSS [<xref ref-type="bibr" rid="ref14">14</xref>], statistical model building as a basis for the CDSS, and the support system&#x2019;s integration into clinical routine [<xref ref-type="bibr" rid="ref15">15</xref>].</p><p>To achieve the project goals, model constructors and medical professionals were in close dialogue with each other, and this turned out to be particularly helpful for the process of data selection, data preprocessing, and statistical model fitting. In the following, we focus on this process and the steps we found essential to be taken before the development of an AI-based CDSS.</p></sec><sec id="s1-2-2"><title>Sepsis</title><p>Sepsis is one of the main causes of illness and death all over the world. In 2017, an estimated 48.9 million incident cases of sepsis were recorded worldwide, and 11.0 million sepsis-related deaths were reported, representing 19.7% of all global deaths [<xref ref-type="bibr" rid="ref16">16</xref>]. Therefore, the World Health Organization (WHO) urged its members through a resolution to include prevention, diagnosis, and treatment of sepsis in national health care systems and to develop and implement standard and optimal care for diagnosing and managing sepsis in health emergencies [<xref ref-type="bibr" rid="ref17">17</xref>].</p><p>Sepsis has been defined as a life-threatening organ dysfunction caused by a dysregulated host response to infection (Sepsis-3 definition) [<xref ref-type="bibr" rid="ref18">18</xref>]. The infection can be caused by most types of microorganisms, including bacteria, fungi, viruses, and parasites [<xref ref-type="bibr" rid="ref19">19</xref>]. Organ dysfunction is characterized using the sequential organ failure assessment (SOFA) score [<xref ref-type="bibr" rid="ref20">20</xref>], including 6 organ systems (respiratory, coagulation, liver, cardiovascular, central nervous system, and renal) with a rise of at least 2 points following the infection. The most severe state of sepsis is defined as septic shock with persistent hypotension requiring vasopressor therapy and a serum lactate level of more than 2 mmol/L despite adequate volume resuscitation. This status is characterized by circulatory, cellular, and metabolic abnormalities leading to an increased mortality of up to 40% [<xref ref-type="bibr" rid="ref18">18</xref>].</p><p>According to the resolution of the WHO, international scientific organizations started the Surviving Sepsis Campaign in 2002, developing guidelines for the treatment of sepsis and septic shock [<xref ref-type="bibr" rid="ref1">1</xref>]. According to these guidelines, sepsis and septic shock are medical emergencies requiring rapid diagnosis and immediate treatment. Consequently, the following measures should be carried out as quickly as possible: measurement of the lactate level, antibiotic susceptibility testing, administration of broad-spectrum antibiotics, initiation of appropriate fluid administration and vasopressors if necessary, and remeasurement of the lactate level. In particular, the administration of antibiotics should not be delayed or fail to target the pathogen. The rationale behind these measures is that the time until effective antimicrobial therapy is a crucial determinant of survival in septic shock [<xref ref-type="bibr" rid="ref21">21</xref>]: a delay in the initiation of effective antimicrobial therapy is associated with a mean decrease in survival of 7.6% per hour.</p><p>In clinical practice, the microbiological proof of the pathogen causing sepsis or septic shock is most often missing at the time of diagnosis. Therefore, the initial administration of antibiotics is empiric and generally follows the Tarragona strategy first described by Sandiumenge et al [<xref ref-type="bibr" rid="ref22">22</xref>]. The principles of this therapy involve assessing patients and their risk factors to &#x201C;hit hard and early&#x201D;, aiming at an immediate administration of an effective dose of antibiotics while considering the local antimicrobial situation. It also includes accurately identifying the site of infection and understanding the pharmacodynamics and pharmacokinetics of the antibiotics. Furthermore, it is essential to remain focused by continually reevaluating the effectiveness of administered antibiotics. Finally, the treatment should be de-escalated accordingly after identifying the pathogen.</p></sec></sec><sec id="s1-3"><title>Focus of This Work</title><p>Many disciplines aim to improve antibiotic therapies, including microbiology, pharmacology, chemistry, and clinical research. Research and knowledge transfer can be significantly more effective when they operate across disciplinary boundaries and connect fundamental research with clinical practice. In our work, we specifically focus on the interprofessional work between scientists from various disciplines with empirical and clinical backgrounds on the way to a CDSS for antibiotic treatment, which is an information system designed to assist (but not replace) physicians in making empiric treatment decisions for patients with sepsis. The particular value of our contribution arises from the close collaboration between disciplines and the integration of guidelines, constraints, and clinical experience into data analysis. We refrain from pursuing the development of a CDSS for widespread use in clinical practice. Instead, the paper constitutes a feasibility study and consolidates insights obtained during the development process to provide guidance for projects with comparable objectives. We describe preparatory steps required before the construction of statistical models used for a CDSS and model physicians&#x2019; decisions regarding empiric antibiotic therapy. In this regard, we highlight the relevance of high data quality and close exchange between medical experts and model constructors.</p></sec><sec id="s1-4"><title>State of Research</title><p>The causes, diagnosis, treatment, and consequences of sepsis are highly relevant in various fields of research. In line with the focus of our work, machine learning and deep learning have commonly been applied to analyze data of patients with sepsis. In particular, numerous studies cover the early and accurate prediction of the onset of sepsis, for example [<xref ref-type="bibr" rid="ref23">23</xref>-<xref ref-type="bibr" rid="ref27">27</xref>], and Moor et al [<xref ref-type="bibr" rid="ref28">28</xref>] provide a systematic literature review for early prediction of sepsis in intensive care units (ICUs). Further, many studies pursue the goal of predicting antimicrobial resistance. The literature review by [<xref ref-type="bibr" rid="ref29">29</xref>] identified 12 studies that use machine learning in the context of antibiotic susceptibility pattern prediction (eg, [<xref ref-type="bibr" rid="ref30">30</xref>-<xref ref-type="bibr" rid="ref32">32</xref>]). Additionally, Sakagianni et al [<xref ref-type="bibr" rid="ref29">29</xref>] selected 8 studies on machine learning&#x2013;assisted antibiotic resistance prediction (eg, [<xref ref-type="bibr" rid="ref33">33</xref>-<xref ref-type="bibr" rid="ref35">35</xref>]). Paul et al [<xref ref-type="bibr" rid="ref36">36</xref>] developed a computerized decision support system to predict appropriate antibiotic therapies to avoid the use of broad-spectrum antibiotics for treatment of infectious diseases. This study also considered the benefits of antibiotics (eg, reduction in the length of hospital stay) as well as costs (eg, adverse events). Such CDSS may also be beneficial for patients with sepsis, in particular in assisting physicians in selecting a proper empiric antibiotic therapy.</p></sec></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Data Acquisition and Preprocessing</title><sec id="s2-1-1"><title>Medical Knowledge Compilation</title><p>As described in the Focus of This Work subheading, we attributed great importance to interprofessional collaboration to appropriately meet the challenges of adequate treatment of sepsis, a multifaceted complication of an infection. Consequently, medical practitioners and empirical scientists maintained continuous dialogue to ensure a deep and comprehensive understanding of both the medical processes and the methodological requirements. This knowledge exchange aimed to guarantee that decisions made during data preprocessing and statistical model construction were congruent with the clinical procedure.</p><p>On the operational level, the empirical scientists conducted a series of interviews with predefined questions with representatives of the 3 participating hospitals, including physicians working at the bedside of patients with sepsis. In this way, nonclinicians were given a comprehensive overview of treatment options and guidelines, and relevant stakeholders were engaged at all stages of the CDSS development process.</p><p>In an initial interview series, 2 aspects were of primary interest: first, the nature and use of broad-spectrum antibiotics, along with aspects of combination therapies; second, the evaluation process for the effectiveness of administered therapies and the critical factors that influenced this evaluation. In 2 further series of interviews, we focused on relevant determinants of successful implementation of a CDSS in clinical routine settings by assessing the clinicians&#x2019; general acceptance of such a system and identifying necessary information to be provided to make it as trustworthy as possible. In addition to the interviews, we conducted biweekly meetings between representatives from the hospitals and data scientists. Further, all 3 hospitals provided their internal guidelines for antibiotic administration and dosage depending on diagnosis and identified pathogens. This facilitated the data scientists&#x2019; understanding of the specific procedures and decision-making processes. <xref ref-type="fig" rid="figure1">Figure 1</xref> illustrates the overall project process, with a focus on statistical model development.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Schematic representation of the process within the &#x201C;KINBIOTICS&#x201D; project aimed at modeling physicians&#x2019; decision-making for empiric antibiotic therapy in patients with sepsis. CDSS: clinical decision support system.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v14i1e79929_fig01.png"/></fig></sec><sec id="s2-1-2"><title>Data</title><p>We use retrospective health records from patients admitted to the ICU of the German hospital Evangelisches Klinikum Bethel between 2012 and 2023. All patients in this dataset were admitted to an intensive or intermediate care unit and diagnosed with sepsis or septic shock (in particular, they were diagnosed with one of the <italic>ICD-10</italic> (<italic>International Statistical Classification of Diseases, Tenth Revision</italic>) [<xref ref-type="bibr" rid="ref37">37</xref>] codes: A40.0, A40.1, A40.2, A40.3, A40.8, A40.9, A41.0, A41.1, A41.2, A41.3, A41.4, A41.51, A41.52, A41.58, A41.8, A41.9, R57.2, or R65.1. The data were derived from 3 sources: first, the clinical information system included time-constant core data and diagnoses, as well as blood values and vital signs measured over the period of hospitalization. Second, the patient data management system contained the administration of catecholamines and antibiotics over time. Third, information about microbiology analyses was available from the hospital&#x2019;s laboratory, representing results of antibiotic susceptibility testing based on patient samples such as blood, urine, or smear. However, data on administered catecholamines and microbiological analyses were not included in the analyses, as microbiology data, in particular, were not available at the time of diagnosis.</p><p>Before data analysis, we carefully preprocessed the data. As a first step, we excluded patients who did not receive any antibiotic therapy or who had not yet reached the age of 18 years at the time of admission. In collaboration with medical experts, erroneous values in variables such as age, height, and weight were either adjusted or removed, and thresholds for blood values and vital signs were included in accordance with medical recommendations. The suspected focus of infection was not documented in the available data. However, given its potential importance for addressing the research question, we derived the suspected infection focus from patients&#x2019; <italic>ICD-10</italic> codes. To this end, a medical expert categorized all sepsis-related <italic>ICD-10</italic> codes from the clinical information system database according to their infection focus. This procedure resulted in many patients having more than one suspected infection focus. Consequently, we split the foci per patient into several variables, taking into account the order of occurrence. For further analysis, however, we exclusively used the first focus and refer to it as the suspected infection focus on the remainder of this text.</p><p>A complication occurred because the time point of diagnosis was only insufficiently documented in the patients&#x2019; records. Consequently, we assumed that the time of sepsis diagnosis corresponded to the time of the initial antibiotic administration; this serves as an approximation that appears to be adequate to fulfill the objective of this work. Additionally, some patients were represented several times in the dataset. They were either repeatedly admitted to the hospital or had multiple infections during one hospital stay. In particular, there were 2482 individual patients with a total of 2986 infections, resulting from up to 6 infections per patient. We divided one hospital stay into 2 separate stays when no antibiotic was administered for at least 5 days, and there was a change in the infection focus during that time. Henceforth, for simplicity, we use the term &#x201C;patients&#x201D; in place of &#x201C;infections&#x201D;, even in cases where a single patient is represented by multiple infections in the dataset.</p><p>The obtained dataset is presented as follows: core data were available for 2986 patients and contained 26 variables. The age of the patients ranged from 18 to 99 years, with an average age of 67.56 years; approximately 36% (n=1067) of patients were female. A total of 1257 (42%) of all patients died during the hospital stay. The aforementioned categorization to derive the suspected infection focus ultimately yielded the following 16 categories (with the number of occurrences in brackets): lungs (n=1074); urogenital tract (n=498); gastrointestinal tract (n=353); prosthesis inflammation (n=175); skin or muscle (n=118); bile (n=101); brain (n=82); bones, joints, tendons, or intervertebral discs (n=60); heart (n=34); vessels (n=14); liver (n=11); ear, nose, or throat (n=10); esophagus (n=8); oral cavity (n=3); spleen (n=1); and eye (n=1). For all patients, time series of vital signs and blood values (31 variables) were available from a maximum of 88 days before and up to 1610 days after the date of diagnosis. However, the measurement and documentation of time series variables were carried out with varying quantities and frequencies. <xref ref-type="table" rid="table1">Table 1</xref> lists all available variables. Diagnoses were documented for 2945 patients with 3319 unique <italic>ICD-10</italic> codes in total; 24 of these were connected to sepsis or septic shock. In addition to these <italic>ICD-10</italic> codes, we had information about whether a patient had diabetes or required dialysis; further information about possible comorbidities was not available. Further, the data included information about administered antibiotics, including drug names as well as therapy start and end dates, for all patients. A total of 35 distinct antibiotics were administered at least once. We define the first antibiotic administered to a patient (during diagnosis or afterwards) as empiric. An overview of all antibiotics and their frequencies is provided in <xref ref-type="fig" rid="figure2">Figure 2</xref>.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Description of the variables contained in the preprocessed dataset.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Source and variable</td><td align="left" valign="bottom">Unit</td><td align="left" valign="bottom">Description</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="3">Core data</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Infection ID</td><td align="char" char="." valign="top">&#x2014;<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup></td><td align="left" valign="top">Unique identifier per infection and patient</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Admission date</td><td align="left" valign="top">Date</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Discharge date</td><td align="left" valign="top">Date</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Suspected time of diagnosis</td><td align="left" valign="top">Date</td><td align="left" valign="top">Documented date or time point of first administration of antibiotic treatment</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Age</td><td align="left" valign="top">Years</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Sex</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Male or female</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Diabetes</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Patient has diabetes (&#x201C;yes&#x201D; or &#x201C;no&#x201D;)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Death</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Patient died during hospital stay (&#x201C;yes&#x201D; or &#x201C;no&#x201D;)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Weight</td><td align="left" valign="top">kg</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Height</td><td align="left" valign="top">cm</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>BMI</td><td align="left" valign="top">kg/m<sup>2</sup></td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Suspected infection focus</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Suspected source of the infection (16 different categories)</td></tr><tr><td align="left" valign="top" colspan="3">Time series data</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Infection ID</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Unique identifier per infection and patient</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Date of record</td><td align="left" valign="top">Date</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Minutes after diagnosis</td><td align="left" valign="top">Minutes</td><td align="left" valign="top">Difference between the time of diagnosis and the time of record</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>SOFA<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup> score</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">SOFA score (containing FiO<sub>2</sub><sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup>/pO<sub>2</sub><sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup>, thrombocytes, bilirubin, mean arterial pressure, GCS<sup><xref ref-type="table-fn" rid="table1fn5">e</xref></sup> score, and creatinine), ranging from 0 to 24</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>GCS</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">GCS score ranging from 3 to 15</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>RASS<sup><xref ref-type="table-fn" rid="table1fn6">f</xref></sup></td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">RASS score ranging from &#x2013;5 to 4</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Dialysis</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Patient on dialysis (&#x201C;yes&#x201D; or &#x201C;no&#x201D;)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Ventilation</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Patient is ventilated (&#x201C;yes&#x201D; or &#x201C;no&#x201D;)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Heart rate</td><td align="left" valign="top">bpm</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Body temperature</td><td align="left" valign="top">&#x00B0;C</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Respiratory rate</td><td align="left" valign="top">breaths/min</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Urine</td><td align="left" valign="top">mL/h</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Diastolic Ibp</td><td align="left" valign="top">mm Hg</td><td align="left" valign="top">Invasive diastolic blood pressure</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>mIbp</td><td align="left" valign="top">mm Hg</td><td align="left" valign="top">Invasive mean blood pressure</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Systolic Ibp</td><td align="left" valign="top">mm Hg</td><td align="left" valign="top">Invasive systolic blood pressure</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Diastolic NIbp</td><td align="left" valign="top">mm Hg</td><td align="left" valign="top">Noninvasive diastolic blood pressure</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>mNIbp</td><td align="left" valign="top">mm Hg</td><td align="left" valign="top">Noninvasive mean blood pressure</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Systolic NIbp</td><td align="left" valign="top">mm Hg</td><td align="left" valign="top">Noninvasive systolic blood pressure</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>CAM-ICU</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Confusion Assessment Method for the Intensive Care<break/>Unit (delirium &#x201C;yes&#x201D; or &#x201C;no&#x201D;)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Bilirubin</td><td align="left" valign="top">mg/dL</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FiO<sub>2</sub></td><td align="char" char="." valign="top">%</td><td align="left" valign="top">Fraction of inspired oxygen</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>pO<sub>2</sub></td><td align="left" valign="top">mm Hg</td><td align="left" valign="top">Partial pressure of oxygen</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Leukocytes</td><td align="char" char="." valign="top">/nL</td><td align="left" valign="top">Number of white blood cells in the blood</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Leukocytes in the liquor</td><td align="left" valign="top">/&#x00B5;L</td><td align="left" valign="top">Number of white blood cells in the cerebrospinal fluid</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Thrombocytes</td><td align="char" char="." valign="top">10<sup>3</sup><italic>/</italic>mm<sup>3</sup></td><td align="left" valign="top">Number of thrombocytes in the blood</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>CRP</td><td align="left" valign="top">mg/L</td><td align="left" valign="top">C-reactive protein</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>PCT</td><td align="left" valign="top">ng/mL</td><td align="left" valign="top">Procalcitonin</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>GFR</td><td align="left" valign="top">mL/min</td><td align="left" valign="top">Glomerular filtration rate</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Creatinine</td><td align="left" valign="top">mg/dL</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>IL-6</td><td align="left" valign="top">pg/mL</td><td align="left" valign="top">Interleukin 6</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Lactate</td><td align="left" valign="top">mmol/L</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Blood sugar</td><td align="left" valign="top">mg/dL</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Oxygenation index</td><td align="left" valign="top">mm Hg</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Antibiotic</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Name of administered antibiotic therapy</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Diagnosis</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top"><italic>ICD-10<sup><xref ref-type="table-fn" rid="table1fn7">g</xref></sup></italic> codes of diagnosis</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>Not available.</p></fn><fn id="table1fn2"><p><sup>b</sup>SOFA: Sequential Organ Failure Assessment.</p></fn><fn id="table1fn3"><p><sup>c</sup>FiO<sub>2</sub>: fraction of inspired oxygen.</p></fn><fn id="table1fn4"><p><sup>d</sup>pO<sub>2</sub>: partial pressure of oxygen.</p></fn><fn id="table1fn5"><p><sup>e</sup>GCS: Glasgow Coma Scale.</p></fn><fn id="table1fn6"><p><sup>f</sup>RASS: Richmond Agitation-Sedation Scale.</p></fn><fn id="table1fn7"><p><sup>g</sup><italic>ICD-10</italic>: <italic>International Statistical Classification of Diseases, Tenth Revision</italic>.</p></fn></table-wrap-foot></table-wrap><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Number of patients who received the respective antibiotics between 2012 and 2023. The light blue bars represent all empiric antibiotic prescriptions (simultaneously administered therapies, ie, combined therapies, are shown separately), while the dark blue bars additionally include all subsequent administered antibiotics. If antibiotics were administered more than once to one patient, they are counted only once. Printed numbers refer to the dark blue bars.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v14i1e79929_fig02.png"/></fig><p>A review of the core data reveals that the variables weight, height, and BMI each contain 57% missing values. In addition, 15% (n=443) of patients have no suspected infection focus. However, all other information from the core data are completely available for all patients.</p><p>For a more effective comparison between patients, we extend the time series data containing laboratory values and vital signs to include the variable &#x201C;minutes after diagnosis.&#x201D; This is calculated as the difference between the suspected time of diagnosis and the time of record. Importantly, not all variables are measured constantly or at equidistant intervals; certain values, such as heart rate, however, are frequently measured. Conversely, blood values, including lactate and C-reactive protein (CRP), are typically assessed no more than once per day.</p><p>In summary, when considering the average availability of measurements per patient (excluding those with no recorded measurements for a specific value), the values with the lowest frequency of measurement are leukocytes in the liquor, with an average of 0.87 measurements per patient, and procalcitonin, with an average of 4.10 measurements per patient. In contrast, along with dialysis and ventilation, heart rate (mean of 177.31 measurements per patient) and invasive blood pressure (mean of 160.87 systolic measurements per patient) are the values with the highest availability. An overview of the frequency and availability of all time series values is shown in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p></sec></sec><sec id="s2-2"><title>Statistical Analysis</title><sec id="s2-2-1"><title>Overview</title><p>On our way to a CDSS applicable in situations where patients have just been diagnosed with sepsis, we aimed, as an intermediate step, at statistical models that are able to predict an empiric antibiotic therapy. Consequently, we intend to predict the prescribed empiric antibiotic therapy based on patients&#x2019; core data and health records. We address this goal through statistical classification, where each distinct therapy defines one class, and we train a classifier that assigns class memberships to patients. This is possible since the dataset used for training contains the relevant information about the administered initial antibiotic therapy, that is, the true class membership.</p><p>To start with, we assume a maximum of one measurement per variable for newly diagnosed patients. This mimics the constraints for a rapid decision after sepsis onset. Accordingly, in the Cross-Sectional Classification subheading, we reduce our dataset to cross-sectional data and apply a cross-sectional classification model (CCM).</p><p>In addition, we ask the question of how recommendations could have been improved when based on time series data. To that end, we consider time series classification models (TSCMs) in the Time Series Classification subheading.</p></sec><sec id="s2-2-2"><title>Cross-Sectional Classification</title><p>Classification is a statistical method for supervised learning, where the true class memberships of training samples are known and can be used during model training to learn a mapping of covariates to classes. After model training, this learned mapping is applied to new data to make predictions for each sample. In our work, we rely on the following classifiers, which are robust to multicollinearity: random forests (RFs), gradient boosting classifiers (GBCs), support vector classifiers (SVCs), and multilayer perceptrons (MLPs).</p><p>To train the CCMs, we further prepare the data additionally to the general preprocessing. In particular, we generate covariates that contain cross-sectional instead of time series information as required: for each time-resolved variable, we obtain the relevant values for all patients by selecting the first value measured within the first hour after diagnosis, motivated by the clinical practice to obtain key measurements immediately after diagnosis to capture the current status of a patient. We assume this information to be available at the time of treatment decision. If no measurement is available within this time interval, we use the most recent value within 24 hours before the sepsis diagnosis. Further, we summarize categories of the suspected infection focus occurring less than 50 times as &#x201C;others.&#x201D;</p><p>Many variables in the data have a high proportion of missing values. We refrain from data imputation, for example, multiple imputation [<xref ref-type="bibr" rid="ref38">38</xref>] or filling missing values by the mean across all samples, as we want to avoid introducing additional uncertainty into the data. Instead, we discard those variables that have 30% or more missing values. Accordingly, we keep the following variables: age, sex, heart rate, average arterial blood pressure, body temperature, fraction of inspired oxygen, pressure of oxygen, leukocytes, thrombocytes, CRP, creatinine, lactate, blood sugar, bilirubin, requiring dialysis, requiring ventilation, and suspected infection focus. These serve as covariates for the CCMs. We do not include systolic and diastolic blood pressure, SOFA, oxygenation index, or glomerular filtration rate as this information is already contained in other variables. After variable selection, we filter for complete cases (ie, patients without any missing values) and end up with 1194 patients for model estimation.</p><p>As the target variable (ie, the variable that determines a patient&#x2019;s class membership), we consider the first administered antibiotic therapy (or a combination of several simultaneously administered therapies) for a patient, that is, the antibiotic treatment within the first hour after the diagnosis.</p><p>In the resulting dataset, we are faced with highly imbalanced class sizes. We mitigate this imbalance by merging antibiotic therapies with fewer than 20 occurrences as &#x201C;others.&#x201D; This avoids the CCMs being trained on too few samples for some antibiotics, but even subsequent to this step, imbalanced classes in the target variable remain evident (<xref ref-type="table" rid="table2">Table 2</xref>): while the largest class, &#x201C;Piperacillin/tazobactam,&#x201D; contains 550 patients, the smallest class, namely a combined therapy of &#x201C;Piperacillin/tazobactam&#x201D; and &#x201C;Levofloxacin,&#x201D; consists of only 21 patients.</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Numbers of antibiotic therapies in the German hospital cohort used for the 2-step models.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Antibiotic therapy</td><td align="left" valign="bottom">Count</td></tr></thead><tbody><tr><td align="left" valign="top">Piperacillin/Tazobactam</td><td align="left" valign="top">550</td></tr><tr><td align="left" valign="top">Other therapies</td><td align="left" valign="top">174</td></tr><tr><td align="left" valign="top">Cefotaxime</td><td align="left" valign="top">104</td></tr><tr><td align="left" valign="top">Meropenem</td><td align="left" valign="top">77</td></tr><tr><td align="left" valign="top">Ampicillin/sulbactam</td><td align="left" valign="top">75</td></tr><tr><td align="left" valign="top">Levofloxacin</td><td align="left" valign="top">54</td></tr><tr><td align="left" valign="top">Ceftriaxone</td><td align="left" valign="top">44</td></tr><tr><td align="left" valign="top">Cefuroxime</td><td align="left" valign="top">33</td></tr><tr><td align="left" valign="top">Vancomycin</td><td align="left" valign="top">33</td></tr><tr><td align="left" valign="top">Ciprofloxacin</td><td align="left" valign="top">29</td></tr><tr><td align="left" valign="top">Piperacillin/tazobactam&#x2013;levofloxacin</td><td align="left" valign="top">21</td></tr></tbody></table></table-wrap><p>Common rebalancing techniques, such as downsampling, would lead to a substantial decrease in the sample size. Thus, instead, we divide the original classification task into 2 consecutive tasks: in a first step, we perform binary classification to predict the majority class &#x201C;Piperacillin/tazobactam&#x201D; vs all others; in a second step, we perform multiclass classification to further distinguish between the remaining antibiotic therapies. As described in this section, we apply RF, GBC, SVC, and MLP as classifiers at both steps.</p><p>To account for the fairly small amount of data and to avoid model overfitting, we use nested cross-validation (CV) with an inner and an outer loop [<xref ref-type="bibr" rid="ref39">39</xref>]. The outer loop consists of 10 folds and splits the whole dataset into 10 disjunct sets. The inner loop consists of 5 folds, allowing for a grid search to optimize the models&#x2019; hyperparameters. For RF, we tune the splitting criterion, the total number of fitted trees, the maximum depth of the trees, and the minimum number of samples to perform a subsequent split. For GBC, in addition to the latter 2 parameters, we optimize the learning rate as well as the number of boosting stages. For SVC, the regularization parameter <italic>C</italic>, the kernel type, and the degree in case of a polynomial kernel are tuned during the grid search. For MLP, we optimize the number of hidden layers assuming each layer consists of 100 neurons, the activation function, the solver, the <italic>L2</italic> regularization term, and the initial learning rate. To measure the models&#x2019; performance, we use the <italic>F</italic><sub>1</sub>-score, which is the harmonic mean of precision and sensitivity.</p><p>Estimating the binary model does not require any rebalancing. The dataset (before applying CV) contains 550 patients receiving &#x201C;Piperacillin/tazobactam&#x201D; (<xref ref-type="table" rid="table2">Table 2</xref>) and 644 patients receiving a different therapy. This is, however, different for the multiclass classification in the second step. The model is trained on those patients from the training set who received an antibiotic therapy other than &#x201C;Piperacillin/tazobactam.&#x201D; As shown in <xref ref-type="table" rid="table2">Table 2</xref>, there are still large differences between the remaining 10 class sizes. At this point, after excluding the most dominant class &#x201C;Piperacillin/tazobactam,&#x201D; we opt for rebalancing to prevent the model from ignoring the minority classes. As the difference between the largest and smallest class sizes is substantial, we downsample the classes whose sizes exceed the average frequency in the training data for the second step and upsample the other classes accordingly. This procedure prevents the dataset from becoming too small, which at the same time avoids excessive duplication of samples.</p></sec><sec id="s2-2-3"><title>Time Series Classification</title><p>We apply a TSCM to investigate whether more information is beneficial to correctly predict an empiric antibiotic therapy for patients with sepsis. In contrast to the models described in the Cross-Sectional Classification subheading, TSCMs consider a time series of a sample instead of using just one measurement per variable. In the medical context, this poses a particular challenge, given that patients&#x2019; health records are typically measured at different time points rather than at uniform intervals. Consequently, the individual time series often vary in length. This requires techniques that can deal with unequal sequences, such as the <italic>k</italic>-nearest neighbor (<italic>k</italic>-NN) algorithm using dynamic time warping (DTW) to measure distances.</p><p>To apply <italic>k</italic>-NN with DTW to our data, we consider the patients&#x2019; time series starting at 24 hours before sepsis diagnosis and up to 1 hour afterwards. Our approach is based on the fact that no later measurements are available for new patients due to the need for fast antibiotic treatment. We use the same covariates and target variable as for the CCMs described in the Cross-Sectional Classification subheading. In contrast to these models, we cannot exclusively use complete cases for the TSCM, as the data basis would become far too small. Therefore, we use forward or, if no previous value is available, backward propagation to fill the missing values in the time series. This procedure is consistent with clinical practice: measurements are considered valid for 24 hours as long as the treating physicians have not seen a need for new values, for example, in case of a deterioration in a patient&#x2019;s health condition. The procedure to estimate the models is the same as for the CCMs: in a first step, we perform binary classification to derive a probability for &#x201C;Piperacillin/tazobactam,&#x201D; and in a second step, we aim at classifying those antibiotic therapies that are different from &#x201C;Piperacillin/tazobactam.&#x201D; Again, we use a nested CV and a combined procedure of upsampling and downsampling for class rebalancing in the second step.</p></sec></sec><sec id="s2-3"><title>Ethical Considerations</title><p>Ethical approval was obtained from the Ethics Committee of the Westphalia-Lippe Medical Association and the University of M&#x00FC;nster (Ethik-Kommission der &#x00C4;rztekammer Westfalen-Lippe und der Westf&#x00E4;lischen Wilhelms-Universit&#x00E4;t M&#x00FC;nster; case no 2021&#x2010;699-f-S).</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Requirements and Insights From Clinical Knowledge</title><sec id="s3-1-1"><title>Overview</title><p>To enhance the reliability of the CDSS and to acknowledge its limitations, we investigated before the data analysis which kinds of information were regarded as relevant from a clinical perspective. A purely data-driven approach, in contrast, would have searched the wide variety of variables for patterns in an unrestricted manner. However, this approach carries the risk of inducing spurious correlations or therapies that may turn out impractical. Through the interviews and discussions described in the Medical Knowledge Compilation subheading, the following facts and requirements were compiled and subsequently served as a knowledge base for the nonclinical scientists in this project. The Challenges From Data Availability subheading describes to what extent the requirements were met by our data, including which variables were unavailable.</p></sec><sec id="s3-1-2"><title>Including Relevant Factors for Treatment Decision</title><p>Following a diagnosis of sepsis, there are multiple factors that the treating physician takes into consideration when selecting an appropriate antibiotic. These include, among others, core data, measured vital signs and blood values, patient allergies, known comorbidities, adverse effects, and image data (eg, x-ray images or computer tomography scans). Further, the identification of the infection focus is of utmost importance as it allows for the identification of potential pathogens once the affected organ is confirmed. However, in some cases, the focus is not provided as it is not directly recognizable.</p></sec><sec id="s3-1-3"><title>Considering Risk Factors for Antibiotic Resistances</title><p>To take potential resistances into account, whether on a global or patient-specific basis, it is necessary to consider additional kinds of information: the patient&#x2019;s origin and professional background, as well as their travel history, previous hospitalization or stay in nursing homes, and antibiotic intake within the last 3 to 6 months. This information may offer insights into the present pathogens and suspected resistances for specific patients.</p></sec><sec id="s3-1-4"><title>Evaluation of Antibiotic Effectiveness</title><p>With regard to the evaluation of antibiotic effectiveness (ie, the assessment of whether the administration of a specific antibiotic was successful in treating a particular case of sepsis), the most important information is the SOFA score, oxygenation index, procalcitonin, CRP, interleukin 6 (IL-6), body temperature, and circulatory parameters such as blood pressure, heart rate, and respiratory rate. From these, especially procalcitonin and IL-6 are also identified in the literature [<xref ref-type="bibr" rid="ref40">40</xref>]. Furthermore, leukocytes, thrombocytes, bilirubin, creatinine, lactate, the Confusion Assessment Method for the Intensive Care Unit, and urine output are considered as potential covariates. Generally, for an effective therapy, laboratory values should show a clear improvement. However, the clinical experts emphasized that the identification of relevant factors depends on the infected organ. Furthermore, they highlighted that the general health condition of a patient is more important than laboratory values. If a patient&#x2019;s well-being improves, irrespective of laboratory values, and they demonstrate, for example, increased responsiveness and alertness, it can be assumed that the administered therapy was effective.</p></sec><sec id="s3-1-5"><title>Expectations and Acceptance of CDSS</title><p>One of the conducted interview series addressed the physicians&#x2019; opinion on the practical implementation of a CDSS and revealed high interest in and need for support from such a system. This is because clinicians must process the available information within a short time frame, often facing incomplete data when the critical health status of a patient necessitates a rapid therapeutic decision. Furthermore, increasing antimicrobial resistance demands careful consideration of the numerous alternative therapies available. The establishment of a support system, therefore, is of great added value for physicians with limited practical experience, thereby helping them to make well-informed treatment decisions. However, it was also noted that there are still many operational hurdles to overcome, such as the lack of digitization in clinics or the availability of reliable and reasonable retrospective data, which hinder its use in practical hospital settings. A detailed analysis of the interviews is provided by D&#x00FC;vel et al [<xref ref-type="bibr" rid="ref14">14</xref>]. Another important requirement for a CDSS, highlighted by the medical professionals, concerned the interpretability of the underlying statistical models. Since we use interpretable classification methods rather than AI tools here, this constraint is met, but must be given careful consideration in general.</p></sec></sec><sec id="s3-2"><title>Challenges From Data Availability</title><p>A goal of this study was to determine the extent to which the ideal and theoretically formulated requirements for a CDSS align with the reality of clinical practice. The result of the investigation was that we encountered a number of challenges regarding data quality and availability, which partially led to questions not being answered to the extent we had originally envisioned. These challenges do not solely exist at our site but arise generally from the common level of data documentation in everyday clinical practice and the prospective collection of data for research purposes, influenced by the degree of digitization of clinical data in German hospitals. We provide a detailed account of the 8 most impactful difficulties here to highlight the necessities, and we describe how we overcame some of them by identifying alternative solutions.</p><p>The first major limitation was the amount of data. While we had originally planned to export data from all 3 consortium hospitals, this was made impossible due to technical limitations as well as differing processes across the hospitals. As a consequence, this study is constrained to data from a single hospital. This resulted in a rather small sample size of 2986 patients, and this in turn excluded AI-based models that require much larger amounts of data [<xref ref-type="bibr" rid="ref41">41</xref>]. Using data from several clinics would have increased the size of the dataset and provided a more representative sample of patients. It would also have enabled us to investigate how much the results differ between clinics. However, obtaining data from multiple clinics would have posed additional challenges due to expected heterogeneity in terms of patient population, prescribing practices, data quality, and other factors. An approach to jointly train generative models on data from multiple hospitals by using federated learning is described by D&#x00FC;sing et al [<xref ref-type="bibr" rid="ref12">12</xref>].</p><p>A second substantial restriction resulted from the fact that several variables, which had been identified as highly important, were not present in the dataset. These included patient history information from which one could have derived the risk of individual resistance against certain antibiotics, such as origin, profession, travel history, and previous antibiotic prescriptions. Moreover, we lacked information on the occurrence of adverse effects, which was not even provided for severe cases. Consequently, our investigation could not address the identification of antibiotic therapies with minimal adverse effects.</p><p>Third, the suspected infection focus, which was highlighted by the doctors as one of the most relevant factors in the decision-making process for an antibiotic therapy, was not routinely documented. To still obtain a realistic prediction, patient diagnoses associated with the infection foci were used to infer the suspected infection focus for individual patients (refer to the preprocessing steps outlined in the Data subheading).</p><p>Fourth, the exact time of diagnosis was unknown in the sense that its temporal alignment was partially shifted when the documentation started after the first treatment. Hence, there is uncertainty regarding the patient&#x2019;s condition at the time of diagnosis.</p><p>Fifth, regarding the effectiveness of an antibiotic therapy, the medical experts asserted that the clinical impression of a patient was given primacy over laboratory values. Still, no such data were documented. Thus, no direct quantitative measure was available to validate the effectiveness of the given therapies.</p><p>Sixth, even for those variables that were theoretically included in the dataset, there were many missing values. Thus, despite the ongoing digitization in hospitals and the consideration of retrospective data from more than 10 years, the final sample size of complete patient data was relatively small. Our decision not to impute missing values and to consider only complete cases further contributed to the small sample size and thus limited the feasibility assessment.</p><p>Seventh, particularly in the context of time series analyses, the longitudinal measurements are obtained at varying time intervals per patient and with differing frequencies among the measured values. The generation of the variable &#x201C;minutes after diagnosis&#x201D; (refer to the Data subheading) resulted in a data matrix for longitudinal values that was extremely sparse. This issue was addressed as described in the Statistical Analysis subheading.</p><p>Eighth, concerning the primary target variable, the empiric antibiotic therapy, we encountered high class imbalance (<xref ref-type="fig" rid="figure2">Figure 2</xref>). The 10 most frequently prescribed antibiotics accounted for more than 89% of all empiric antibiotics, with &#x201C;Piperacillin/tazobactam&#x201D; being the most frequently administered therapy, accounting for 54% (n=1765) of all prescriptions. This imbalance in prescriptions posed a major challenge in predicting outcomes for underrepresented classes and may have led to biased classification results [<xref ref-type="bibr" rid="ref42">42</xref>]. We addressed this issue with a 2-step modeling approach as outlined in the Statistical Analysis subheading.</p><p>To evaluate our classification approach beyond the previously described dataset and to gain insights into the generalizability of our method, we sought to incorporate an additional dataset. The most suitable source for this purpose was the Medical Information Mart for Intensive Care, Fourth Version database [<xref ref-type="bibr" rid="ref43">43</xref>], which contained health-related data from patients admitted to the ICU of the Beth Israel Deaconess Medical Center between 2008 and 2019. However, important information, such as the infection focus or procalcitonin measurements, were missing in the database. Further, we detected notable discrepancies between Germany and the United States of America with regard to the fundamental hospital procedures and guidelines for the management of sepsis, as well as the related data basis (eg, [<xref ref-type="bibr" rid="ref44">44</xref>]), which disqualified the Medical Information Mart for Intensive Care, Fourth Version database as a solid basis for comparison within the presented feasibility study. Thus, to develop a targeted approach for common practice in Germany, we exclusively relied on the data described and emphasized the need for more and better data about the diagnosis and treatment of patients with sepsis.</p></sec><sec id="s3-3"><title>Learnings From Statistical Modeling</title><sec id="s3-3-1"><title>Cross-Sectional Classification</title><p>Despite the aforementioned challenges, we used various approaches to statistically model the physicians&#x2019; decisions for empiric antibiotic therapy. <xref ref-type="table" rid="table3">Table 3</xref> shows the results of the CCMs (RF, GBC, SVC, and MLP) for the 3 exemplary antibiotics &#x201C;Piperacillin/tazobactam,&#x201D; &#x201C;Ciprofloxacin,&#x201D; and &#x201C;Vancomycin.&#x201D; The results of the remaining antibiotics are provided in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendices 2</xref> and <xref ref-type="supplementary-material" rid="app3">3</xref>. Due to the outer loop of the nested CV, we obtain 10 predictions for different test sets; the tables present their averages.</p><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Average performance of the cross-sectional classification models (CCMs) across 10 folds of nested cross-validation (CV) for 3 selected antibiotics. Measures are calculated across both classification steps and thus represent cumulative performance.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Model and metric</td><td align="left" valign="bottom">Piperacillin/tazobactam</td><td align="left" valign="bottom">Ciprofloxacin</td><td align="left" valign="bottom">Vancomycin</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="4">RF<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup></td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Sensitivity</td><td align="left" valign="top">0.506</td><td align="left" valign="top">0.117</td><td align="left" valign="top">0.125</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Specificity</td><td align="left" valign="top">0.728</td><td align="left" valign="top">0.955</td><td align="left" valign="top">0.962</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Precision</td><td align="left" valign="top">0.613</td><td align="left" valign="top">0.108</td><td align="left" valign="top">0.051</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><italic>F</italic><sub>1</sub>-score</td><td align="left" valign="top">0.552</td><td align="left" valign="top">0.110</td><td align="left" valign="top">0.069</td></tr><tr><td align="left" valign="top" colspan="4">GBC<sup><xref ref-type="table-fn" rid="table3fn2">b</xref></sup></td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Sensitivity</td><td align="left" valign="top">0.508</td><td align="left" valign="top">0.092</td><td align="left" valign="top">0.050</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Specificity</td><td align="left" valign="top">0.642</td><td align="left" valign="top">0.985</td><td align="left" valign="top">0.969</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Precision</td><td align="left" valign="top">0.546</td><td align="left" valign="top">0.117</td><td align="left" valign="top">0.050</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><italic>F</italic><sub>1</sub>-score</td><td align="left" valign="top">0.524</td><td align="left" valign="top">0.102</td><td align="left" valign="top">0.050</td></tr><tr><td align="left" valign="top" colspan="4">SVC<sup><xref ref-type="table-fn" rid="table3fn3">c</xref></sup></td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Sensitivity</td><td align="left" valign="top">0.524</td><td align="left" valign="top">0.095</td><td align="left" valign="top">0.120</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Specificity</td><td align="left" valign="top">0.721</td><td align="left" valign="top">0.973</td><td align="left" valign="top">0.964</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Precision</td><td align="left" valign="top">0.621</td><td align="left" valign="top">0.095</td><td align="left" valign="top">0.064</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><italic>F</italic><sub>1</sub>-score</td><td align="left" valign="top">0.564</td><td align="left" valign="top">0.095</td><td align="left" valign="top">0.072</td></tr><tr><td align="left" valign="top" colspan="4">MLP<sup><xref ref-type="table-fn" rid="table3fn4">d</xref></sup></td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Sensitivity</td><td align="left" valign="top">0.533</td><td align="left" valign="top">0.078</td><td align="left" valign="top">0.145</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Specificity</td><td align="left" valign="top">0.677</td><td align="left" valign="top">0.973</td><td align="left" valign="top">0.949</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Precision</td><td align="left" valign="top">0.594</td><td align="left" valign="top">0.108</td><td align="left" valign="top">0.052</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><italic>F</italic><sub>1</sub>-score</td><td align="left" valign="top">0.556</td><td align="left" valign="top">0.090</td><td align="left" valign="top">0.069</td></tr></tbody></table><table-wrap-foot><fn id="table3fn1"><p><sup>a</sup>RF: random forest.</p></fn><fn id="table3fn2"><p><sup>b</sup>GBC: gradient boosting classifier.</p></fn><fn id="table3fn3"><p><sup>c</sup>SVC: support vector classifier.</p></fn><fn id="table3fn4"><p><sup>d</sup>MLP: multilayer perceptron.</p></fn></table-wrap-foot></table-wrap><p>It becomes immediately apparent that none of the models achieved high sensitivity, precision, or <italic>F</italic><sub>1</sub>-score; consequently, the models are not reliable enough for use in clinical practice. For most antibiotics, the sensitivity is lower than 22%, and in many cases it is even lower than 10%. This low sensitivity comes along with a high specificity. The only exception is &#x201C;Piperacillin/tazobactam,&#x201D; for which all 4 classification models result in a sensitivity above 50% and a specificity above 60%. MLP achieved the highest sensitivity of 53.3%; this is accompanied by a medium-high specificity of 67.7%. Compared to all other antibiotic therapies, the performance of the 4 models for predicting &#x201C;Piperacillin/tazobactam&#x201D; is satisfactory: both sensitivity and specificity, and thus precision and <italic>F</italic><sub>1</sub>-score, are moderately high. However, this performance is still insufficient for clinical implementation. Even worse results are obtained for &#x201C;Ciprofloxacin&#x201D; and &#x201C;Vancomycin&#x201D;: the highest sensitivity of 11.7% and 14.5% is achieved by RF and MLP, respectively.</p></sec><sec id="s3-3-2"><title>Time Series Classification</title><p>The averaged results from time series classification across the 10 folds of the CV for the 3 antibiotics &#x201C;Piperacillin/tazobactam,&#x201C; &#x201C;Ciprofloxacin,&#x201D; and &#x201C;Vancomycin&#x201D; are shown in <xref ref-type="table" rid="table4">Table 4</xref>. The results for the remaining antibiotics are provided in <xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>. No improvement over CCM results could be achieved using time series data. <italic>k</italic>-NN with DTW performed worse than the CCMs as measured by <italic>F</italic><sub>1</sub>-score. Even for &#x201C;Piperacillin/tazobactam,&#x201D; the <italic>F</italic><sub>1</sub>-score was on average 12.3% points lower when using the TSCM instead of CCMs. The poor performance for &#x201C;Ciprofloxacin&#x201D; and &#x201C;Vancomycin&#x201D; is conspicuous. In the case of &#x201C;Ciprofloxacin,&#x201D; the sensitivity is low (2%), and the same holds for &#x201C;Vancomycin&#x201D;: not a single sample belonging to this class was correctly classified.</p><table-wrap id="t4" position="float"><label>Table 4.</label><caption><p>Average performance of time series classification models (TSCMs).</p></caption><table id="table4" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Metric</td><td align="left" valign="bottom">Piperacillin/tazobactam</td><td align="left" valign="bottom">Ciprofloxacin</td><td align="left" valign="bottom">Vancomycin</td></tr></thead><tbody><tr><td align="left" valign="top">Sensitivity</td><td align="left" valign="top">0.416</td><td align="left" valign="top">0.020</td><td align="left" valign="top">0.000</td></tr><tr><td align="left" valign="top">Specificity</td><td align="left" valign="top">0.572</td><td align="left" valign="top">0.991</td><td align="left" valign="top">0.952</td></tr><tr><td align="left" valign="top">Precision</td><td align="left" valign="top">0.457</td><td align="left" valign="top">0.125</td><td align="left" valign="top">0.000</td></tr><tr><td align="left" valign="top"><italic>F</italic><sub>1</sub>-score</td><td align="left" valign="top">0.426</td><td align="left" valign="top">0.029</td><td align="left" valign="top">0.000</td></tr></tbody></table></table-wrap></sec><sec id="s3-3-3"><title>Baseline Model</title><p>To compare the results of the described CCM and TSCM against a simple baseline model, we predict the antibiotic therapy for all patients to be &#x201C;Piperacillin/tazobactam&#x201D; without further training of a statistical model. Naturally, for all antibiotics other than &#x201C;Piperacillin/tazobactam,&#x201D; the sensitivity, precision, and <italic>F</italic><sub>1</sub>-score are zero, while the specificity is equal to one. The performance results for &#x201C;Piperacillin/tazobactam&#x201D; are shown in <xref ref-type="table" rid="table5">Table 5</xref>. As expected, the sensitivity equals one, while the specificity is zero. The <italic>F</italic><sub>1</sub>-score for &#x201C;Piperacillin/tazobactam&#x201D; equals <italic>2m / n + m</italic>, where <italic>n</italic> is the total number of patients and <italic>m</italic> is the number of those belonging to this majority class. The value of 0.629 directly results from the imbalance of class sizes and is higher for the baseline model than when applying the CCM and TSCM. However, the <italic>F</italic><sub>1</sub>-score for &#x201C;no Piperacillin/tazobactam&#x201D; equals zero. Precision is lower for the baseline model than for the CCM and similar to the TSCM. Consequently, when considering only the majority therapy, the complex modeling approaches are outperformed by a simple heuristic in terms of the <italic>F</italic><sub>1</sub>-score. This is hardly surprising since the CCM and TSCM are trained to differentiate between a number of therapies rather than putting all emphasis on the majority class. The (moderate) success is reflected in the performance metrics of the other therapies.</p><table-wrap id="t5" position="float"><label>Table 5.</label><caption><p>Performance of the baseline model for all antibiotics.</p></caption><table id="table5" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Metric</td><td align="left" valign="bottom">Piperacillin/tazobactam</td><td align="left" valign="bottom">Any other antibiotics</td></tr></thead><tbody><tr><td align="left" valign="top">Sensitivity</td><td align="left" valign="top">1.000</td><td align="left" valign="top">0.000</td></tr><tr><td align="left" valign="top">Specificity</td><td align="left" valign="top">0.000</td><td align="left" valign="top">1.000</td></tr><tr><td align="left" valign="top">Precision</td><td align="left" valign="top">0.461</td><td align="left" valign="top">0.000</td></tr><tr><td align="left" valign="top"><italic>F</italic><sub>1</sub>-score</td><td align="left" valign="top">0.629</td><td align="left" valign="top">0.000</td></tr></tbody></table></table-wrap></sec></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Summary</title><p>We embarked on an ambitious project to develop a CDSS aimed at recommending an appropriate initial antibiotic therapy for patients with sepsis. This CDSS was intended to be applicable immediately upon diagnosis and to provide recommendations regarding potential resistance and side effects. The system was to be developed using data science methods, drawing from data collected at 3 local hospitals.</p><p>However, the situation within the clinics revealed that various factors contributed to a relatively small dataset, comprising only 1194 complete cases, along with a substantial amount of unavailable information. Contemporary AI approaches typically require large datasets; therefore, a swift implementation using large language models, which may seem straightforward to an outsider, was not feasible in this context. Instead, we took on the challenge by combining meticulous information and data preparation with the adaptation of statistical learning methods. In fact, we achieved a satisfactory classification for one of the subquestions. Nonetheless, our project uncovered several limitations, and in this paper, we outline the key insights regarding the process.</p><p>To summarize, the process included the initial stages of knowledge acquisition, data preprocessing, overcoming data-related challenges, and constructing predictive models to classify the physician&#x2019;s choice of empiric therapies. We have described each relevant step, examined the challenges involved, and presented potential models together with the results derived from the available data.</p></sec><sec id="s4-2"><title>Principal Findings: Exploration of Model Performance</title><p>Despite careful data preparation, modeling, and incorporation of clinical knowledge, the statistical models achieved only poor to moderate performance in predicting the physicians&#x2019; decision for empiric antibiotic therapy. Only the first step of the 2-step approach (ie, the classification of &#x201C;Piperacillin/tazobactam&#x201D; against all other therapies) succeeded to some extent. We identify several reasons that we suspect are contributing to this issue.</p><sec id="s4-2-1"><title>Sample Size</title><p>Good predictions require sufficient sample sizes. Our final dataset contained only 1194 samples in total. Of those, 550 belonged to the class &#x201C;Piperacillin/tazobactam,&#x201D; while all other class sizes ranged from 21 to 174. The comparably good performance in the first step of the classification procedure indicates that, all in all, our statistical models are appropriate as long as enough data are available. To put it another way, we suspect that the main reason for the poor overall predictive ability is the small sample and class sizes. Sepsis manifests in very different ways; to find similarities in patients&#x2019; health records, many more samples may be needed for analysis. To develop a reliable CDSS for clinical usage, future projects should be based on a large dataset containing several thousand patients, with particular consideration of class balance and complete data collection.</p></sec><sec id="s4-2-2"><title>Broad-Spectrum Antibiotics</title><p>Notably, the most commonly prescribed therapy, &#x201C;Piperacillin/tazobactam&#x201D; (roughly 50%), along with several other documented treatments, are broad-spectrum antibiotics. This reflects how often this type of antibiotic is prescribed in clinical practice. In some cases, this antibiotic therapy is recommended by the guidelines; however, the high frequency of prescriptions also suggests a paucity of relevant information for a more targeted treatment decision. A retrospective evaluation of administered antibiotics by medical experts, under consideration of a patient&#x2019;s disease course, could be valuable to identify a targeted and effective antibiotic therapy. In doing so, a CDSS could learn to predict the best antibiotic therapy, and its predictive performance would not be affected by erroneous data.</p></sec><sec id="s4-2-3"><title>Class Imbalance</title><p>Not only was the sample size small, but the classes were also substantially different in size. The overrepresentation of &#x201C;Piperacillin/tazobactam&#x201D; led to a notable class imbalance. To deal with this, we decided to split the classification task into 2 steps. For the first step, the prediction of &#x201C;Piperacillin/tazobactam,&#x201D; no class rebalancing was needed, and we achieved comparably good results using CCMs. Still, these results are not yet suitable for clinical practice, highlighting the need for large, high-quality datasets, in particular for AI-based classifiers. In the second step, in contrast, we had to rebalance the classes as these were still unequally represented. Depending on the method used for rebalancing, useful information was removed (eg, when using random undersampling of the majority class [<xref ref-type="bibr" rid="ref45">45</xref>]), samples were duplicated (eg, when using random oversampling of the minority class [<xref ref-type="bibr" rid="ref45">45</xref>]), or synthetic data were added, potentially containing unrealistic or even wrong information (eg, when using the synthetic minority oversampling technique [<xref ref-type="bibr" rid="ref46">46</xref>]). Consequently, the application of methods for class rebalancing comes with uncertainty. In particular, random oversampling of small classes might lead to model overfitting, resulting in a model&#x2019;s inability to learn generalizable patterns in the data. This, in conjunction with the small sample size, is a possible explanation for the poor predictive ability of the models. As already mentioned, future projects should therefore attach great importance to reliable and balanced data collection. This is one of the most relevant conditions for success in achieving good model performance.</p></sec><sec id="s4-2-4"><title>Observed Initial Treatments</title><p>To model a physician&#x2019;s decision for an empiric antibiotic therapy, we used the first administered antibiotic contained in the dataset, regardless of whether the therapy was effective, because the dataset does not contain quantified information about the effectiveness (refer to Challenges from Data Availability subheading). However, there are indications that the first antibiotic was not necessarily the most effective one and could thus lead to inappropriate predictions: the data show that, due to constant reevaluation, the administered therapy was modified several times during one infection for many patients. As a consequence, our models describe prescribing habits rather than optimal treatment decisions. If appropriate information on effectiveness becomes available, the target variable could, however, be easily adapted.</p></sec><sec id="s4-2-5"><title>Missing Information</title><p>As outlined in the Challenges from Data Availability subheading, relevant variables for an informed decision in favor of an antibiotic therapy were not included in the data. In particular, there were no variables that provided information needed to assess a patient&#x2019;s risk of infection with resistant bacteria, such as origin, travel history, profession, and previous antibiotic prescriptions. In addition, a predictive model could benefit from information about hospital-specific antibiotic resistance patterns, especially if patient-specific risk factors are not available, to limit the eligible antibiotic therapies. This information is not included in our data; however, the development of a resistance observatory was a concurrent task of the &#x201C;KINBIOTICS&#x201D; consortium [<xref ref-type="bibr" rid="ref13">13</xref>]. Without any of this information, the model may not be able to predict an antibiotic therapy that is consistent with the empiric therapy chosen by the physician. A detailed discussion with medical experts about risk factors, necessary information, and the medical process for deciding on an antibiotic therapy before data collection is crucial. Ideally, a CDSS is based on prospective data so that all necessary information can be documented and subsequently extracted. According to literature, the infection focus, information about previous hospitalizations or stays in nursing homes, travel history, and origin of a patient, comorbidities, and hospital-specific antibiotic resistance patterns are of utmost importance for choosing an adequate antibiotic therapy for ICU patients [<xref ref-type="bibr" rid="ref47">47</xref>].</p></sec><sec id="s4-2-6"><title>Uncertain Infection Focus and Time of Diagnosis</title><p>Medical experts regarded the infection focus as of high importance within the decision-making process for antibiotic therapy (refer to Requirements and Insights From Clinical Knowledge subheading). In the Data subheading, we explained how we derived the suspected focus. The alignment of confirmed and suspected focus, however, comes with uncertainty, and we consider possible errors to further affect the models&#x2019; performance. The use of retrospective discharge data to predict a hospitalization decision poses a limitation of our study, as it artificially inflates the feasibility of such a CDSS. A similar statement holds for the time point of sepsis diagnosis as derived by us. Our assumption that the time of sepsis diagnosis corresponds to the time of first administered antibiotic therapy will affect our models&#x2019; performance, as we use data for prediction that likely do not match the prescription. More precisely, our models might include values that were measured close to the time of administration of empiric antibiotics or even afterwards. This renders the models unsuitable for clinical application. This issue should be addressed in future studies by using prospective data that contains the exact time of diagnosis, as well as information on crucial variables between this time and the time of antibiotic administration.</p></sec><sec id="s4-2-7"><title>Missing Data</title><p>Many classifiers are unable to deal with missing values. Thus, we reduced the dataset to complete cases by removing certain covariates and patients. This further limits the classification models&#x2019; interpretability and increases prediction uncertainty. Further, by removing laboratory values of high clinical importance, in particular procalcitonin, our models lack inflammatory markers.</p><p>In light of all the aforementioned limitations, the poor classification performance, especially in the second step of our approach, becomes comprehensible. The shortcomings highlight the need for large, high-quality data as a basis for a reliable CDSS for the individualized prediction of a targeted, effective antibiotic therapy for patients with sepsis. Future initiatives should place the highest priority on ensuring thorough and accurate data collection.</p></sec></sec><sec id="s4-3"><title>Conclusions</title><sec id="s4-3-1"><title>Overview</title><p>Our work yields 2 principal take-home messages: first, the importance of interprofessional collaboration, and second, the need for high-quality data and improvements in data acquisition processes.</p><p>Regarding the first, interprofessional collaboration and the continuous exchange between medical experts and model constructors turned out to be crucial both in the preliminary stages of the project and during its entire progress. Such collaboration increases the chance of obtaining meaningful results as all stakeholders are aware of the requirements for data availability and quality. Many medical relationships require detailed discussion before they can be integrated into the data and modeling processes. Simultaneously, critical questions&#x2014;often stemming from one party&#x2019;s lack of expertise&#x2014;can lead to new insights and perspectives.</p><p>Regarding the second, the results of the models highlight the critical need for comprehensive and large, high-quality data. In accordance with literature (eg, [<xref ref-type="bibr" rid="ref47">47</xref>]), we particularly recommend the complete and correct collection of the following variables: time of diagnosis, administered antibiotics and their effectiveness, suspected infection focus at the time of antibiotic prescription, retrospectively confirmed infection focus, risk factors (eg, origin, profession, and travel history), and laboratory values (eg, procalcitonin, lactate, leukocytes, CRP, and IL-6). The performance of the model could be further enhanced by the incorporation of comorbidities, antibiotic allergies, and image data. At best, these values are available in electronic form, and a plausibility check is performed during data entry with the option for immediate clarification. The data should contain information on several thousand patients. We assume that an appropriate number of samples depends on the data quality.</p></sec><sec id="s4-3-2"><title>Limitations and Recommendations: Data Documentation</title><p>Our dataset contains information on patients admitted to the ICU, where they are constantly monitored. Here, certain parameters are measured in an automated way, while the measurement of many other values has to be actively initiated and is carried out manually. The latter may lead to a lack of continuity in health records, and it is expected that data from less controlled units (such as non-ICU) are of even lower quality. This is a nationwide issue, beyond the study location of Bielefeld, partially caused by strict data protection regulations, including a rigorous interpretation of the European Union&#x2019;s General Data Protection Regulation. While these rules ensure a high standard of privacy, they also contribute to comparatively slow progress in digital transformation, as reflected in the European Union&#x2019;s Digital Economy and Society Index, where Germany is positioned in the middle range in digital public services and e-government readiness [<xref ref-type="bibr" rid="ref48">48</xref>].</p><p>To improve the general documentation of health data, the optimization and expansion of digitization in German hospitals are of the highest importance. The implementation of the electronic patient record system (elektronische Patientenakte [ePA] [<xref ref-type="bibr" rid="ref49">49</xref>]), which is currently being introduced in Germany, has the potential to offer great benefits for scientific analyses. Specifically, information regarding patients&#x2019; origin, travel history, professional background, and time of diagnosis could be made more readily accessible. Even information from previous inpatient or outpatient stays can potentially provide relevant information that would be available through the ePA. The benefit of the ePA for research purposes is only provided if access to the data is granted. The draft of the German &#x201C;Forschungsdatengesetz&#x201D; [<xref ref-type="bibr" rid="ref50">50</xref>] aims at improving access to and use of data for research purposes, consequently contributing to an improvement in data availability. Moreover, a health data usage act (&#x201C;Gesundheitsdatennutzungsgesetz&#x201C; [<xref ref-type="bibr" rid="ref51">51</xref>]) was passed in March 2024 in Germany, with the objective of regulating the use of health data for research purposes in the public interest and for the data-based further development of the health care system. A further desirable future development would be the continued growth of extensive, high-quality datasets, such as those from the NFDI4Health initiative (Nationale Forschungsdateninfrastruktur f&#x00FC;r personenbezogene Gesundheitsdaten [<xref ref-type="bibr" rid="ref52">52</xref>]), making small-scale, project-specific data collections unnecessary and/or serving as external data validation resources.</p></sec><sec id="s4-3-3"><title>Limitations and Recommendations: Model Architecture</title><p>The context considered in the study led to the definition of 2 architectural elements that should be evaluated with caution and adapted to the specific context of application. These concern the 2-step approach and the choice of the performance measure for parameter optimization.</p><p>Regarding the presented 2-step approach, we observe that errors arising from misclassifications of samples in the first step are propagated to the second step. The low sensitivity and moderate specificity for &#x201C;Piperacillin/tazobactam&#x201D; indicate that a substantial number of patients are irretrievably misclassified in the first step: samples truly belonging to the class &#x201C;Piperacillin/tazobactam&#x201D; but classified as &#x201C;no Piperacillin/tazobactam&#x201D; can no longer be correctly identified in the second step, and vice versa for samples belonging to &#x201C;no Piperacillin/tazobactam&#x201D; that are predicted as &#x201C;Piperacillin/tazobactam.&#x201D; In this case, the 2-step procedure was motivated by the severe imbalance between class sizes, where upsampling or downsampling of all classes, including &#x201C;Piperacillin/tazobactam,&#x201D; would have been the less favorable option. In this sense, the model choice was meaningful. Nevertheless, the architecture should be tested for robustness when the approach is transferred to another dataset with different class distributions or potentially clearer class boundaries.</p><p>Regarding the performance measure, we aimed to simultaneously account for both false-positive and false-negative predictions, in line with our study consortium&#x2019;s objective of predicting a targeted antibiotic with minimal side effects. Therefore, we placed particular emphasis on the <italic>F</italic><sub>1</sub>-score. For the translation of this approach to other projects, we recommend close coordination with the practicing physicians and clinics and, if necessary, adaptation of the statistical optimization objective.</p></sec><sec id="s4-3-4"><title>Future Directions</title><p>The logical next steps that arise from our project are to move beyond mere classification of therapies that were prescribed in practice to providing recommendations for therapies that are expected to have high effectiveness. To overcome the lack of a quantitative measure for administered antibiotic therapies, this may involve a data-driven assessment of the health status of patients with sepsis from time series of laboratory values and vital signs. This may provide a basis for the development of methods that can learn from retrospective data to predict the best possible therapy outcome for an individual patient with sepsis. The steps achieved and presented here will contribute to the development of an effective CDSS for antibiotic prescription in sepsis, ultimately improving the survival of patients with sepsis and helping to reduce antibiotic resistance.</p></sec></sec></sec></body><back><ack><p>We thank all members of the "KINBIOTICS" project, especially the medical experts who took part in the interviews and meetings and thus made an important contribution to the model development. During the writing of this manuscript, the authors used ChatGPT (version 4.0; OpenAI) to improve language and readability. After using ChatGPT, the authors reviewed and edited the content as needed and take full responsibility for the content of the published paper. The data preprocessing was performed using R (version 4.4.2; R Core Team) [<xref ref-type="bibr" rid="ref53">53</xref>], and the models were fitted using Python (version 3.11.9; Python Software Foundation) [<xref ref-type="bibr" rid="ref54">54</xref>]. The code used for model fitting is available on GitHub [<xref ref-type="bibr" rid="ref55">55</xref>].</p></ack><notes><sec><title>Funding</title><p>This study was supported by a grant from the German Federal Ministry of Health (Bundesministerium f&#x00FC;r Gesundheit; grant no ZMVI1-2520DAT930; "KINBIOTICS").</p></sec><sec><title>Data Availability</title><p>Due to data protection and privacy regulations, we are not allowed to share the data from the German hospital used in this work.</p></sec></notes><fn-group><fn fn-type="con"><p>Conceptualization was conducted by CF, HM, and SS. Data curation was performed by CF, PH, HM, and SS. Formal analysis was carried out by PH, HM, and SS. Funding acquisition was secured by PC, CF, WG, OK, SR, JT, and MW. Methodology was developed by PH, HM, and SS. Project administration was managed by PC. Resources were provided by RB, PC, CD, OK, SR, SSS, JJT, MW, and DW. Supervision was conducted by PC, CF, and SR. Validation was performed by JD and SE. Visualization was performed by HM and SS. The original draft was prepared by RB, CF, HM, and SS.</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">AI</term><def><p>artificial intelligence</p></def></def-item><def-item><term id="abb2">CCM</term><def><p>cross-sectional classification model</p></def></def-item><def-item><term id="abb3">CDSS</term><def><p>clinical decision support system</p></def></def-item><def-item><term id="abb4">CRP</term><def><p>C-reactive protein</p></def></def-item><def-item><term id="abb5">CV</term><def><p>cross-validation</p></def></def-item><def-item><term id="abb6">DTW</term><def><p>dynamic time warping</p></def></def-item><def-item><term id="abb7">ePA</term><def><p>elektronische Patientenakte</p></def></def-item><def-item><term id="abb8">GBC</term><def><p>gradient boosting classifier</p></def></def-item><def-item><term id="abb9"><italic>ICD-10</italic></term><def><p><italic>International Statistical Classification of Diseases, Tenth Revision</italic></p></def></def-item><def-item><term id="abb10">ICU</term><def><p>intensive care unit</p></def></def-item><def-item><term id="abb11">IL-6</term><def><p>interleukin 6</p></def></def-item><def-item><term id="abb12"><italic>k</italic>-NN</term><def><p><italic>k</italic>-nearest neighbor</p></def></def-item><def-item><term id="abb13">MLP</term><def><p>multilayer perceptron</p></def></def-item><def-item><term id="abb14">RF</term><def><p>random forest</p></def></def-item><def-item><term id="abb15">SOFA</term><def><p>sequential organ failure assessment</p></def></def-item><def-item><term id="abb16">SVC</term><def><p>support vector classifier</p></def></def-item><def-item><term id="abb17">TSCM</term><def><p>time series classification model</p></def></def-item><def-item><term id="abb18">WHO</term><def><p>World Health Organization</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Evans</surname><given-names>L</given-names> </name><name name-style="western"><surname>Rhodes</surname><given-names>A</given-names> </name><name name-style="western"><surname>Alhazzani</surname><given-names>W</given-names> </name><etal/></person-group><article-title>Surviving sepsis campaign: international guidelines for management of sepsis and septic shock 2021</article-title><source>Intensive Care Med</source><year>2021</year><month>11</month><volume>47</volume><issue>11</issue><fpage>1181</fpage><lpage>1247</lpage><pub-id pub-id-type="doi">10.1007/s00134-021-06506-y</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cunha</surname><given-names>BA</given-names> </name></person-group><article-title>Antibiotic side effects</article-title><source>Med Clin North Am</source><year>2001</year><month>01</month><volume>85</volume><issue>1</issue><fpage>149</fpage><lpage>185</lpage><pub-id pub-id-type="doi">10.1016/s0025-7125(05)70309-6</pub-id><pub-id pub-id-type="medline">11190350</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ventola</surname><given-names>CL</given-names> </name></person-group><article-title>The antibiotic resistance crisis: part 1: causes and threats</article-title><source>P T</source><year>2015</year><month>04</month><volume>40</volume><issue>4</issue><fpage>277</fpage><lpage>283</lpage><pub-id pub-id-type="medline">25859123</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Melander</surname><given-names>RJ</given-names> </name><name name-style="western"><surname>Zurawski</surname><given-names>DV</given-names> </name><name name-style="western"><surname>Melander</surname><given-names>C</given-names> </name></person-group><article-title>Narrow-spectrum antibacterial agents</article-title><source>Medchemcomm</source><year>2018</year><volume>9</volume><issue>1</issue><fpage>12</fpage><lpage>21</lpage><pub-id pub-id-type="doi">10.1039/C7MD00528H</pub-id><pub-id pub-id-type="medline">29527285</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Murray</surname><given-names>CJL</given-names> </name><name name-style="western"><surname>Ikuta</surname><given-names>KS</given-names> </name><name name-style="western"><surname>Sharara</surname><given-names>F</given-names> </name><etal/></person-group><article-title>Global burden of bacterial antimicrobial resistance in 2019: a systematic analysis</article-title><source>The Lancet</source><year>2022</year><month>02</month><volume>399</volume><issue>10325</issue><fpage>629</fpage><lpage>655</lpage><pub-id pub-id-type="doi">10.1016/S0140-6736(21)02724-0</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Levy</surname><given-names>SB</given-names> </name><name name-style="western"><surname>Marshall</surname><given-names>B</given-names> </name></person-group><article-title>Antibacterial resistance worldwide: causes, challenges and responses</article-title><source>Nat Med</source><year>2004</year><month>12</month><volume>10</volume><issue>12 Suppl</issue><fpage>S122</fpage><lpage>9</lpage><pub-id pub-id-type="doi">10.1038/nm1145</pub-id><pub-id pub-id-type="medline">15577930</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ebell</surname><given-names>MH</given-names> </name><name name-style="western"><surname>Radke</surname><given-names>T</given-names> </name></person-group><article-title>Antibiotic use for viral acute respiratory tract infections remains common</article-title><source>Am J Manag Care</source><year>2015</year><month>10</month><day>1</day><volume>21</volume><issue>10</issue><fpage>e567</fpage><lpage>75</lpage><pub-id pub-id-type="medline">26619058</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chokshi</surname><given-names>A</given-names> </name><name name-style="western"><surname>Sifri</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Cennimo</surname><given-names>D</given-names> </name><name name-style="western"><surname>Horng</surname><given-names>H</given-names> </name></person-group><article-title>Global contributors to antibiotic resistance</article-title><source>J Glob Infect Dis</source><year>2019</year><volume>11</volume><issue>1</issue><fpage>36</fpage><lpage>42</lpage><pub-id pub-id-type="doi">10.4103/jgid.jgid_110_18</pub-id><pub-id pub-id-type="medline">30814834</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Draeger</surname><given-names>L</given-names> </name><name name-style="western"><surname>Fleischmann-Struzek</surname><given-names>C</given-names> </name><name name-style="western"><surname>Gehrke-Beck</surname><given-names>S</given-names> </name><name name-style="western"><surname>Heintze</surname><given-names>C</given-names> </name><name name-style="western"><surname>Thomas-Rueddel</surname><given-names>DO</given-names> </name><name name-style="western"><surname>Schmidt</surname><given-names>K</given-names> </name></person-group><article-title>Barriers and facilitators to optimal sepsis care - a systematized review of healthcare professionals&#x2019; perspectives</article-title><source>BMC Health Serv Res</source><year>2025</year><month>04</month><day>24</day><volume>25</volume><issue>1</issue><fpage>591</fpage><pub-id pub-id-type="doi">10.1186/s12913-025-12777-8</pub-id><pub-id pub-id-type="medline">40275226</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="web"><article-title>KI-basierte Entscheidungsunterst&#x00FC;tzung zur antibiotika-therapie</article-title><source>KINBIOTICS</source><access-date>2025-03-11</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://kinbiotics.de">https://kinbiotics.de</ext-link></comment></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Radukic</surname><given-names>MT</given-names> </name><name name-style="western"><surname>Brandt</surname><given-names>D</given-names> </name><name name-style="western"><surname>Haak</surname><given-names>M</given-names> </name><name name-style="western"><surname>M&#x00FC;ller</surname><given-names>KM</given-names> </name><name name-style="western"><surname>Kalinowski</surname><given-names>J</given-names> </name></person-group><article-title>Nanopore sequencing of native adeno-associated virus (AAV) single-stranded DNA using a transposase-based rapid protocol</article-title><source>NAR Genom Bioinform</source><year>2020</year><month>12</month><volume>2</volume><issue>4</issue><fpage>lqaa074</fpage><pub-id pub-id-type="doi">10.1093/nargab/lqaa074</pub-id><pub-id pub-id-type="medline">33575623</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>D&#x00FC;sing</surname><given-names>C</given-names> </name><name name-style="western"><surname>Cimiano</surname><given-names>P</given-names> </name><name name-style="western"><surname>Rehberg</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Integrating federated learning for improved counterfactual explanations in clinical decision support systems for sepsis therapy</article-title><source>Artif Intell Med</source><year>2024</year><month>11</month><volume>157</volume><fpage>102982</fpage><pub-id pub-id-type="doi">10.1016/j.artmed.2024.102982</pub-id><pub-id pub-id-type="medline">39277983</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Scherer</surname><given-names>C</given-names> </name><name name-style="western"><surname>D&#x00FC;sing</surname><given-names>C</given-names> </name><name name-style="western"><surname>Cimiano</surname><given-names>P</given-names> </name><etal/></person-group><article-title>Modellprojekt zur Antibiotikaresistenz-Surveillance in Ostwestfalen-Lippe</article-title><source>Epidemiologisches Bulletin</source><year>2025</year><issue>8</issue><fpage>10</fpage><lpage>22</lpage><pub-id pub-id-type="doi">10.25646/12983</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>D&#x00FC;vel</surname><given-names>JA</given-names> </name><name name-style="western"><surname>Lampe</surname><given-names>D</given-names> </name><name name-style="western"><surname>Kirchner</surname><given-names>M</given-names> </name><etal/></person-group><article-title>An AI-based clinical decision support system for antibiotic therapy in sepsis (KINBIOTICS): use case analysis</article-title><source>JMIR Hum Factors</source><year>2025</year><month>03</month><day>4</day><volume>12</volume><fpage>e66699</fpage><pub-id pub-id-type="doi">10.2196/66699</pub-id><pub-id pub-id-type="medline">40036494</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tokg&#x00F6;z</surname><given-names>P</given-names> </name><name name-style="western"><surname>Krayter</surname><given-names>S</given-names> </name><name name-style="western"><surname>Hafner</surname><given-names>J</given-names> </name><name name-style="western"><surname>Dockweiler</surname><given-names>C</given-names> </name></person-group><article-title>Decision support systems for antibiotic prescription in hospitals: a survey with hospital managers on factors for implementation</article-title><source>BMC Med Inform Decis Mak</source><year>2024</year><month>04</month><day>15</day><volume>24</volume><issue>1</issue><fpage>96</fpage><pub-id pub-id-type="doi">10.1186/s12911-024-02490-7</pub-id><pub-id pub-id-type="medline">38622595</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rudd</surname><given-names>KE</given-names> </name><name name-style="western"><surname>Johnson</surname><given-names>SC</given-names> </name><name name-style="western"><surname>Agesa</surname><given-names>KM</given-names> </name><etal/></person-group><article-title>Global, regional, and national sepsis incidence and mortality, 1990&#x2013;2017: analysis for the Global Burden of Disease Study</article-title><source>The Lancet</source><year>2020</year><month>01</month><volume>395</volume><issue>10219</issue><fpage>200</fpage><lpage>211</lpage><pub-id pub-id-type="doi">10.1016/S0140-6736(19)32989-7</pub-id><pub-id pub-id-type="medline">31911147</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="report"><article-title>Improving the prevention, diagnosis and clinical management of sepsis</article-title><year>2017</year><access-date>2026-05-01</access-date><publisher-name>World Health Assembly (WHA70)</publisher-name><comment><ext-link ext-link-type="uri" xlink:href="https://apps.who.int/gb/ebwha/pdf_files/WHA70/A70_R7-en.pdf">https://apps.who.int/gb/ebwha/pdf_files/WHA70/A70_R7-en.pdf</ext-link></comment></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Singer</surname><given-names>M</given-names> </name><name name-style="western"><surname>Deutschman</surname><given-names>CS</given-names> </name><name name-style="western"><surname>Seymour</surname><given-names>CW</given-names> </name><etal/></person-group><article-title>The third international consensus definitions for sepsis and septic shock (Sepsis-3)</article-title><source>JAMA</source><year>2016</year><month>02</month><day>23</day><volume>315</volume><issue>8</issue><fpage>801</fpage><lpage>810</lpage><pub-id pub-id-type="doi">10.1001/jama.2016.0287</pub-id><pub-id pub-id-type="medline">26903338</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="report"><article-title>World health organization (WHO) executive board</article-title><source>Improving the prevention, diagnosis and clinical management of sepsis</source><year>2017</year><comment><ext-link ext-link-type="uri" xlink:href="https://apps.who.int/iris/bitstream/handle/10665/273181/B140_12-en.pdf?sequence=1&#x0026;isAllowed=y">https://apps.who.int/iris/bitstream/handle/10665/273181/B140_12-en.pdf?sequence=1&#x0026;isAllowed=y</ext-link></comment></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Vincent</surname><given-names>JL</given-names> </name><name name-style="western"><surname>Moreno</surname><given-names>R</given-names> </name><name name-style="western"><surname>Takala</surname><given-names>J</given-names> </name><etal/></person-group><article-title>The SOFA (sepsis-related organ failure assessment) score to describe organ dysfunction/failure. On behalf of the working group on sepsis-related problems of the European Society of Intensive Care Medicine</article-title><source>Intensive Care Med</source><year>1996</year><month>07</month><volume>22</volume><issue>7</issue><fpage>707</fpage><lpage>710</lpage><pub-id pub-id-type="doi">10.1007/BF01709751</pub-id><pub-id pub-id-type="medline">8844239</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kumar</surname><given-names>A</given-names> </name><name name-style="western"><surname>Roberts</surname><given-names>D</given-names> </name><name name-style="western"><surname>Wood</surname><given-names>KE</given-names> </name><etal/></person-group><article-title>Duration of hypotension before initiation of effective antimicrobial therapy is the critical determinant of survival in human septic shock</article-title><source>Crit Care Med</source><year>2006</year><month>06</month><volume>34</volume><issue>6</issue><fpage>1589</fpage><lpage>1596</lpage><pub-id pub-id-type="doi">10.1097/01.CCM.0000217961.75225.E9</pub-id><pub-id pub-id-type="medline">16625125</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sandiumenge</surname><given-names>A</given-names> </name><name name-style="western"><surname>Diaz</surname><given-names>E</given-names> </name><name name-style="western"><surname>Bod&#x00ED;</surname><given-names>M</given-names> </name><name name-style="western"><surname>Rello</surname><given-names>J</given-names> </name></person-group><article-title>Therapy of ventilator-associated pneumonia. A patient-based approach based on the ten rules of &#x201C;The Tarragona Strategy&#x201D;</article-title><source>Intensive Care Med</source><year>2003</year><month>06</month><volume>29</volume><issue>6</issue><fpage>876</fpage><lpage>883</lpage><pub-id pub-id-type="doi">10.1007/s00134-003-1715-1</pub-id><pub-id pub-id-type="medline">12677369</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Nemati</surname><given-names>S</given-names> </name><name name-style="western"><surname>Holder</surname><given-names>A</given-names> </name><name name-style="western"><surname>Razmi</surname><given-names>F</given-names> </name><name name-style="western"><surname>Stanley</surname><given-names>MD</given-names> </name><name name-style="western"><surname>Clifford</surname><given-names>GD</given-names> </name><name name-style="western"><surname>Buchman</surname><given-names>TG</given-names> </name></person-group><article-title>An interpretable machine learning model for accurate prediction of sepsis in the ICU</article-title><source>Crit Care Med</source><year>2018</year><month>04</month><volume>46</volume><issue>4</issue><fpage>547</fpage><lpage>553</lpage><pub-id pub-id-type="doi">10.1097/CCM.0000000000002936</pub-id><pub-id pub-id-type="medline">29286945</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wang</surname><given-names>D</given-names> </name><name name-style="western"><surname>Li</surname><given-names>J</given-names> </name><name name-style="western"><surname>Sun</surname><given-names>Y</given-names> </name><etal/></person-group><article-title>A machine learning model for accurate prediction of sepsis in ICU patients</article-title><source>Front Public Health</source><year>2021</year><volume>9</volume><fpage>754348</fpage><pub-id pub-id-type="doi">10.3389/fpubh.2021.754348</pub-id><pub-id pub-id-type="medline">34722452</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Moor</surname><given-names>M</given-names> </name><name name-style="western"><surname>Horn</surname><given-names>M</given-names> </name><name name-style="western"><surname>Rieck</surname><given-names>B</given-names> </name><name name-style="western"><surname>Roqueiro</surname><given-names>D</given-names> </name><name name-style="western"><surname>Borgwardt</surname><given-names>K</given-names> </name></person-group><article-title>Early recognition of sepsis with Gaussian process temporal convolutional networks and dynamic time warping</article-title><year>2019</year><access-date>2026-05-01</access-date><conf-name>Proceedings of the 4th Machine Learning for Healthcare Conference</conf-name><conf-date>Aug 8-10, 2019</conf-date><comment><ext-link ext-link-type="uri" xlink:href="https://proceedings.mlr.press/v106/moor19a.html">https://proceedings.mlr.press/v106/moor19a.html</ext-link></comment></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Abromavi&#x010D;ius</surname><given-names>V</given-names> </name><name name-style="western"><surname>Plonis</surname><given-names>D</given-names> </name><name name-style="western"><surname>Tarasevi&#x010D;ius</surname><given-names>D</given-names> </name><name name-style="western"><surname>Serackis</surname><given-names>A</given-names> </name></person-group><article-title>Two-stage monitoring of patients in intensive care unit for sepsis prediction using non-overfitted machine learning models</article-title><source>Electronics (Basel)</source><year>2020</year><volume>9</volume><issue>7</issue><fpage>1133</fpage><pub-id pub-id-type="doi">10.3390/electronics9071133</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Parente</surname><given-names>JD</given-names> </name><name name-style="western"><surname>M&#x00F6;ller</surname><given-names>K</given-names> </name><name name-style="western"><surname>Shaw</surname><given-names>GM</given-names> </name><name name-style="western"><surname>Chase</surname><given-names>JG</given-names> </name></person-group><article-title>Hidden Markov models for sepsis classification</article-title><source>IFAC-PapersOnLine</source><year>2018</year><volume>51</volume><issue>27</issue><fpage>110</fpage><lpage>115</lpage><pub-id pub-id-type="doi">10.1016/j.ifacol.2018.11.658</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Moor</surname><given-names>M</given-names> </name><name name-style="western"><surname>Rieck</surname><given-names>B</given-names> </name><name name-style="western"><surname>Horn</surname><given-names>M</given-names> </name><name name-style="western"><surname>Jutzeler</surname><given-names>CR</given-names> </name><name name-style="western"><surname>Borgwardt</surname><given-names>K</given-names> </name></person-group><article-title>Early prediction of sepsis in the ICU using machine learning: a systematic review</article-title><source>Front Med (Lausanne)</source><year>2021</year><volume>8</volume><fpage>607952</fpage><pub-id pub-id-type="doi">10.3389/fmed.2021.607952</pub-id><pub-id pub-id-type="medline">34124082</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sakagianni</surname><given-names>A</given-names> </name><name name-style="western"><surname>Koufopoulou</surname><given-names>C</given-names> </name><name name-style="western"><surname>Feretzakis</surname><given-names>G</given-names> </name><etal/></person-group><article-title>Using machine learning to predict antimicrobial resistance-a literature review</article-title><source>Antibiotics (Basel)</source><year>2023</year><month>02</month><day>24</day><volume>12</volume><issue>3</issue><fpage>452</fpage><pub-id pub-id-type="doi">10.3390/antibiotics12030452</pub-id><pub-id pub-id-type="medline">36978319</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Garcia-Vidal</surname><given-names>C</given-names> </name><name name-style="western"><surname>Puerta-Alcalde</surname><given-names>P</given-names> </name><name name-style="western"><surname>Cardozo</surname><given-names>C</given-names> </name><etal/></person-group><article-title>Machine learning to assess the risk of multidrug-resistant gram-negative bacilli infections in febrile neutropenic hematological patients</article-title><source>Infect Dis Ther</source><year>2021</year><month>06</month><volume>10</volume><issue>2</issue><fpage>971</fpage><lpage>983</lpage><pub-id pub-id-type="doi">10.1007/s40121-021-00438-2</pub-id><pub-id pub-id-type="medline">33860912</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Henderson</surname><given-names>HI</given-names> </name><name name-style="western"><surname>Napravnik</surname><given-names>S</given-names> </name><name name-style="western"><surname>Kosorok</surname><given-names>MR</given-names> </name><etal/></person-group><article-title>Predicting risk of multidrug-resistant enterobacterales infections among people with HIV</article-title><source>Open Forum Infect Dis</source><year>2022</year><month>10</month><volume>9</volume><issue>10</issue><fpage>ofac487</fpage><pub-id pub-id-type="doi">10.1093/ofid/ofac487</pub-id><pub-id pub-id-type="medline">36225740</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Feretzakis</surname><given-names>G</given-names> </name><name name-style="western"><surname>Loupelis</surname><given-names>E</given-names> </name><name name-style="western"><surname>Sakagianni</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Using machine learning techniques to aid empirical antibiotic therapy decisions in the intensive care unit of a general hospital in Greece</article-title><source>Antibiotics (Basel)</source><year>2020</year><month>01</month><day>31</day><volume>9</volume><issue>2</issue><fpage>50</fpage><pub-id pub-id-type="doi">10.3390/antibiotics9020050</pub-id><pub-id pub-id-type="medline">32023854</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lewin-Epstein</surname><given-names>O</given-names> </name><name name-style="western"><surname>Baruch</surname><given-names>S</given-names> </name><name name-style="western"><surname>Hadany</surname><given-names>L</given-names> </name><name name-style="western"><surname>Stein</surname><given-names>GY</given-names> </name><name name-style="western"><surname>Obolski</surname><given-names>U</given-names> </name></person-group><article-title>Predicting antibiotic resistance in hospitalized patients by applying machine learning to electronic medical records</article-title><source>Clin Infect Dis</source><year>2021</year><month>06</month><day>1</day><volume>72</volume><issue>11</issue><fpage>e848</fpage><lpage>e855</lpage><pub-id pub-id-type="doi">10.1093/cid/ciaa1576</pub-id><pub-id pub-id-type="medline">33070171</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tzelves</surname><given-names>L</given-names> </name><name name-style="western"><surname>Lazarou</surname><given-names>L</given-names> </name><name name-style="western"><surname>Feretzakis</surname><given-names>G</given-names> </name><etal/></person-group><article-title>Using machine learning techniques to predict antimicrobial resistance in stone disease patients</article-title><source>World J Urol</source><year>2022</year><month>07</month><volume>40</volume><issue>7</issue><fpage>1731</fpage><lpage>1736</lpage><pub-id pub-id-type="doi">10.1007/s00345-022-04043-x</pub-id><pub-id pub-id-type="medline">35616713</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rich</surname><given-names>SN</given-names> </name><name name-style="western"><surname>Jun</surname><given-names>I</given-names> </name><name name-style="western"><surname>Bian</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Development of a prediction model for antibiotic-resistant urinary tract infections using integrated electronic health records from multiple clinics in North-Central Florida</article-title><source>Infect Dis Ther</source><year>2022</year><month>10</month><volume>11</volume><issue>5</issue><fpage>1869</fpage><lpage>1882</lpage><pub-id pub-id-type="doi">10.1007/s40121-022-00677-x</pub-id><pub-id pub-id-type="medline">35908268</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Paul</surname><given-names>M</given-names> </name><name name-style="western"><surname>Andreassen</surname><given-names>S</given-names> </name><name name-style="western"><surname>Tacconelli</surname><given-names>E</given-names> </name><etal/></person-group><article-title>Improving empirical antibiotic treatment using TREAT, a computerized decision support system: cluster randomized trial</article-title><source>J Antimicrob Chemother</source><year>2006</year><month>12</month><volume>58</volume><issue>6</issue><fpage>1238</fpage><lpage>1245</lpage><pub-id pub-id-type="doi">10.1093/jac/dkl372</pub-id><pub-id pub-id-type="medline">16998208</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="web"><article-title>International Statistical Classification of Diseases and Related Health Problems (ICD)</article-title><source>World Health Organization (WHO)</source><year>2025</year><access-date>2025-04-08</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.who.int/standards/classifications/classification-of-diseases">https://www.who.int/standards/classifications/classification-of-diseases</ext-link></comment></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>van Buuren</surname><given-names>S</given-names> </name></person-group><source>Flexible Imputation of Missing Data</source><year>2018</year><edition>2</edition><publisher-name>Chapman and Hall/CRC</publisher-name><pub-id pub-id-type="doi">10.1201/9780429492259</pub-id><pub-id pub-id-type="other">9780429492259</pub-id></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Parvandeh</surname><given-names>S</given-names> </name><name name-style="western"><surname>Yeh</surname><given-names>HW</given-names> </name><name name-style="western"><surname>Paulus</surname><given-names>MP</given-names> </name><name name-style="western"><surname>McKinney</surname><given-names>BA</given-names> </name></person-group><article-title>Consensus features nested cross-validation</article-title><source>Bioinformatics</source><year>2020</year><month>05</month><day>1</day><volume>36</volume><issue>10</issue><fpage>3093</fpage><lpage>3098</lpage><pub-id pub-id-type="doi">10.1093/bioinformatics/btaa046</pub-id><pub-id pub-id-type="medline">31985777</pub-id></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tschaikowsky</surname><given-names>K</given-names> </name><name name-style="western"><surname>Hedwig-Geissing</surname><given-names>M</given-names> </name><name name-style="western"><surname>Braun</surname><given-names>GG</given-names> </name><name name-style="western"><surname>Radespiel-Troeger</surname><given-names>M</given-names> </name></person-group><article-title>Predictive value of procalcitonin, interleukin-6, and C-reactive protein for survival in postoperative patients with severe sepsis</article-title><source>J Crit Care</source><year>2011</year><month>02</month><volume>26</volume><issue>1</issue><fpage>54</fpage><lpage>64</lpage><pub-id pub-id-type="doi">10.1016/j.jcrc.2010.04.011</pub-id><pub-id pub-id-type="medline">20646905</pub-id></nlm-citation></ref><ref id="ref41"><label>41</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Alzubaidi</surname><given-names>L</given-names> </name><name name-style="western"><surname>Al-Sabaawi</surname><given-names>A</given-names> </name><name name-style="western"><surname>Bai</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Towards risk&#x2010;free trustworthy artificial intelligence: significance and requirements</article-title><source>Int J Intell Syst</source><year>2023</year><month>01</month><volume>2023</volume><issue>1</issue><pub-id pub-id-type="doi">10.1155/2023/4459198</pub-id></nlm-citation></ref><ref id="ref42"><label>42</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Guo</surname><given-names>X</given-names> </name><name name-style="western"><surname>Yin</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Dong</surname><given-names>C</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>G</given-names> </name><name name-style="western"><surname>Zhou</surname><given-names>G</given-names> </name></person-group><article-title>On the class imbalance problem</article-title><access-date>2026-05-01</access-date><conf-name>2008 Fourth International Conference on Natural Computation</conf-name><conf-date>Oct 18-20, 2008</conf-date><comment><ext-link ext-link-type="uri" xlink:href="https://ieeexplore.ieee.org/document/4667275">https://ieeexplore.ieee.org/document/4667275</ext-link></comment></nlm-citation></ref><ref id="ref43"><label>43</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Johnson</surname><given-names>AEW</given-names> </name><name name-style="western"><surname>Bulgarelli</surname><given-names>L</given-names> </name><name name-style="western"><surname>Shen</surname><given-names>L</given-names> </name><etal/></person-group><article-title>MIMIC-IV, a freely accessible electronic health record dataset</article-title><source>Sci Data</source><year>2023</year><month>01</month><day>3</day><volume>10</volume><issue>1</issue><fpage>1</fpage><pub-id pub-id-type="doi">10.1038/s41597-022-01899-x</pub-id><pub-id pub-id-type="medline">36596836</pub-id></nlm-citation></ref><ref id="ref44"><label>44</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Martin-Loeches</surname><given-names>I</given-names> </name><name name-style="western"><surname>Rodriguez</surname><given-names>AH</given-names> </name><name name-style="western"><surname>Torres</surname><given-names>A</given-names> </name></person-group><article-title>New guidelines for hospital-acquired pneumonia/ventilator-associated pneumonia: USA vs. Europe</article-title><source>Curr Opin Crit Care</source><year>2018</year><month>10</month><volume>24</volume><issue>5</issue><fpage>347</fpage><lpage>352</lpage><pub-id pub-id-type="doi">10.1097/MCC.0000000000000535</pub-id><pub-id pub-id-type="medline">30063491</pub-id></nlm-citation></ref><ref id="ref45"><label>45</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Fern&#x00E1;ndez</surname><given-names>A</given-names> </name><name name-style="western"><surname>Garc&#x00ED;a</surname><given-names>S</given-names> </name><name name-style="western"><surname>Galar</surname><given-names>M</given-names> </name><name name-style="western"><surname>Prati</surname><given-names>RC</given-names> </name><name name-style="western"><surname>Krawczyk</surname><given-names>B</given-names> </name><name name-style="western"><surname>Herrera</surname><given-names>F</given-names> </name></person-group><source>Learning from Imbalanced Data Sets</source><year>2018</year><publisher-name>Springer</publisher-name><pub-id pub-id-type="doi">10.1007/978-3-319-98074-4</pub-id><pub-id pub-id-type="other">9783319980744</pub-id></nlm-citation></ref><ref id="ref46"><label>46</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chawla</surname><given-names>NV</given-names> </name><name name-style="western"><surname>Bowyer</surname><given-names>KW</given-names> </name><name name-style="western"><surname>Hall</surname><given-names>LO</given-names> </name><name name-style="western"><surname>Kegelmeyer</surname><given-names>WP</given-names> </name></person-group><article-title>SMOTE: synthetic minority over-sampling technique</article-title><source>jair</source><year>2002</year><volume>16</volume><fpage>321</fpage><lpage>357</lpage><pub-id pub-id-type="doi">10.1613/jair.953</pub-id></nlm-citation></ref><ref id="ref47"><label>47</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Engelmann</surname><given-names>L</given-names> </name><name name-style="western"><surname>Schmitt</surname><given-names>DV</given-names> </name></person-group><article-title>Tarragona-strategie: ad&#x00E4;quate Antibiotikatherapie auf der Intensivstation</article-title><source>Wiener Klinisches Magazin</source><year>2014</year><volume>17</volume><issue>6</issue><fpage>24</fpage><lpage>29</lpage><pub-id pub-id-type="doi">10.1007/s00740-014-0027-0</pub-id></nlm-citation></ref><ref id="ref48"><label>48</label><nlm-citation citation-type="web"><article-title>The Digital Economy and Society Index (DESI)</article-title><source>European Commission</source><year>2024</year><access-date>2026-02-24</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://digital-strategy.ec.europa.eu/en/policies/desi">https://digital-strategy.ec.europa.eu/en/policies/desi</ext-link></comment></nlm-citation></ref><ref id="ref49"><label>49</label><nlm-citation citation-type="web"><article-title>Die elektronische Patientenakte (ePA) f&#x00FC;r alle</article-title><source>Bundesministerium f&#x00FC;r Gesundheit (BMG)</source><year>2025</year><access-date>2025-03-20</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.bundesgesundheitsministerium.de/themen/digitalisierung/elektronische-patientenakte/epa-fuer-alle.html">https://www.bundesgesundheitsministerium.de/themen/digitalisierung/elektronische-patientenakte/epa-fuer-alle.html</ext-link></comment></nlm-citation></ref><ref id="ref50"><label>50</label><nlm-citation citation-type="web"><article-title>Gesetz zum verbesserten zugang zu und zur nutzung von daten f&#x00FC;r die forschung</article-title><source>Deutscher Bundestag</source><year>2025</year><access-date>2025-05-23</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://dip.bundestag.de/vorgang/gesetz-zum-verbesserten-zugang-zu-und-zur-nutzung-von-daten/318777">https://dip.bundestag.de/vorgang/gesetz-zum-verbesserten-zugang-zu-und-zur-nutzung-von-daten/318777</ext-link></comment></nlm-citation></ref><ref id="ref51"><label>51</label><nlm-citation citation-type="web"><article-title>Gesetz zur verbesserten Nutzung von Gesundheitsdaten</article-title><source>Bundesministerium der Justiz und f&#x00FC;r Verbraucherschutz</source><year>2025</year><access-date>2025-05-12</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.recht.bund.de/bgbl/1/2024/102/VO.html">https://www.recht.bund.de/bgbl/1/2024/102/VO.html</ext-link></comment></nlm-citation></ref><ref id="ref52"><label>52</label><nlm-citation citation-type="web"><article-title>Homepage</article-title><source>NFDI4Health</source><year>2025</year><access-date>2025-10-16</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.nfdi4health.de/">https://www.nfdi4health.de/</ext-link></comment></nlm-citation></ref><ref id="ref53"><label>53</label><nlm-citation citation-type="web"><article-title>The R Project for Statistical Computing</article-title><source>R Foundation for Statistical Computing</source><year>2024</year><access-date>2026-05-01</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.R-project.org">https://www.R-project.org</ext-link></comment></nlm-citation></ref><ref id="ref54"><label>54</label><nlm-citation citation-type="web"><article-title>Python language reference, version 3.11.9</article-title><source>Python Software Foundation</source><year>2024</year><access-date>2026-05-01</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.python.org">https://www.python.org</ext-link></comment></nlm-citation></ref><ref id="ref55"><label>55</label><nlm-citation citation-type="web"><article-title>Fuchslab/cdss_sepsis</article-title><source>GitHub</source><access-date>2026-05-07</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://github.com/fuchslab/CDSS_Sepsis">https://github.com/fuchslab/CDSS_Sepsis</ext-link></comment></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Missing values in time-series data.</p><media xlink:href="medinform_v14i1e79929_app1.pdf" xlink:title="PDF File, 506 KB"/></supplementary-material><supplementary-material id="app2"><label>Multimedia Appendix 2</label><p>Additional results of cross-sectional classification models for the antibiotics &#x201C;Ampicillin/sulbactam,&#x201D; &#x201C;Cefotaxime,&#x201D; &#x201C;Ceftriaxone,&#x201D; and &#x201C;Cefuroxime.&#x201D;</p><media xlink:href="medinform_v14i1e79929_app2.pdf" xlink:title="PDF File, 239 KB"/></supplementary-material><supplementary-material id="app3"><label>Multimedia Appendix 3</label><p>Additional results of cross-sectional classification models for the antibiotics &#x201C;Levofloxacin,&#x201D; &#x201C;Meropenem,&#x201D; &#x201C;Piperacillin/tazobactam-levofloxacin,&#x201D; and &#x201C;others.&#x201D;</p><media xlink:href="medinform_v14i1e79929_app3.pdf" xlink:title="PDF File, 239 KB"/></supplementary-material><supplementary-material id="app4"><label>Multimedia Appendix 4</label><p>Additional results of time series classification models for the antibiotics &#x201C;Ampicillin/sulbactam,&#x201D; &#x201C;Cefotaxime,&#x201D; &#x201C;Ceftriaxone,&#x201D; &#x201C;Cefuroxime,&#x201D; &#x201C;Levofloxacin,&#x201D; &#x201C;Meropenem,&#x201D; &#x201C;Piperacillin/tazobactam-levofloxacin,&#x201D; and &#x201C;others.&#x201D;</p><media xlink:href="medinform_v14i1e79929_app4.pdf" xlink:title="PDF File, 237 KB"/></supplementary-material></app-group></back></article>