<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id>
      <journal-title>JMIR Medical Informatics</journal-title>
      <issn pub-type="epub">2291-9694</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v8i6e17648</article-id>
      <article-id pub-id-type="pmid">32568089</article-id>
      <article-id pub-id-type="doi">10.2196/17648</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Toward Optimal Heparin Dosing by Comparing Multiple Machine Learning Methods: Retrospective Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Hao</surname>
            <given-names>Tianyong</given-names>
          </name>
        </contrib>
        <contrib contrib-type="editor">
          <name>
            <surname>Tang</surname>
            <given-names>Buzhou</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Zhang</surname>
            <given-names>Zhongheng</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Ayabakan</surname>
            <given-names>Sezgin</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Su</surname>
            <given-names>Longxiang</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0942-2870</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>Chun</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2337-2264</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Li</surname>
            <given-names>Dongkai</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-4487-0927</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>He</surname>
            <given-names>Jie</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-4454-1784</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Zheng</surname>
            <given-names>Fanglan</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6963-3015</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Jiang</surname>
            <given-names>Huizhen</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8869-1237</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>Hao</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7776-0882</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author">
          <name name-style="western">
            <surname>Gong</surname>
            <given-names>Mengchun</given-names>
          </name>
          <degrees>PhD, MD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8197-6643</ext-link>
        </contrib>
        <contrib id="contrib9" contrib-type="author">
          <name name-style="western">
            <surname>Hong</surname>
            <given-names>Na</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6798-1761</ext-link>
        </contrib>
        <contrib id="contrib10" contrib-type="author">
          <name name-style="western">
            <surname>Zhu</surname>
            <given-names>Weiguo</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-4215-5839</ext-link>
        </contrib>
        <contrib id="contrib11" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Long</surname>
            <given-names>Yun</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Department of Critical Care Medicine</institution>
            <institution>Peking Union Medical College Hospital</institution>
            <institution>Peking Union Medical College &#38; Chinese Academy of Medical</institution>
            <addr-line>1 Shuaifuyuan, Dongcheng District, Beijing 100730, China</addr-line>
            <addr-line>Beijing</addr-line>
            <country>China</country>
            <phone>86 10 69152318</phone>
            <email>ly_icu@aliyun.com</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9196-4651</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Department of Critical Care Medicine</institution>
        <institution>Peking Union Medical College Hospital</institution>
        <institution>Peking Union Medical College &#38; Chinese Academy of Medical</institution>
        <addr-line>Beijing</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Digital China Health Technologies Co Ltd</institution>
        <addr-line>Beijing</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Department of Information Management</institution>
        <institution>Peking Union Medical College Hospital</institution>
        <institution>Peking Union Medical College &#38; Chinese Academy of Medical</institution>
        <addr-line>Beijing</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Department of General Internal Medicine/Department of Information Management</institution>
        <institution>Peking Union Medical College Hospital</institution>
        <institution>Peking Union Medical College &#38; Chinese Academy of Medical</institution>
        <addr-line>Beijing</addr-line>
        <country>China</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Yun Long <email>ly_icu@aliyun.com</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>6</month>
        <year>2020</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>22</day>
        <month>6</month>
        <year>2020</year>
      </pub-date>
      <volume>8</volume>
      <issue>6</issue>
      <elocation-id>e17648</elocation-id>
      <history>
        <date date-type="received">
          <day>31</day>
          <month>12</month>
          <year>2019</year>
        </date>
        <date date-type="rev-request">
          <day>23</day>
          <month>2</month>
          <year>2020</year>
        </date>
        <date date-type="rev-recd">
          <day>18</day>
          <month>4</month>
          <year>2020</year>
        </date>
        <date date-type="accepted">
          <day>19</day>
          <month>4</month>
          <year>2020</year>
        </date>
      </history>
      <copyright-statement>©Longxiang Su, Chun Liu, Dongkai Li, Jie He, Fanglan Zheng, Huizhen Jiang, Hao Wang, Mengchun Gong, Na Hong, Weiguo Zhu, Yun Long. Originally published in JMIR Medical Informatics (http://medinform.jmir.org), 22.06.2020.</copyright-statement>
      <copyright-year>2020</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on http://medinform.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="http://medinform.jmir.org/2020/6/e17648/" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Heparin is one of the most commonly used medications in intensive care units. In clinical practice, the use of a weight-based heparin dosing nomogram is standard practice for the treatment of thrombosis. Recently, machine learning techniques have dramatically improved the ability of computers to provide clinical decision support and have allowed for the possibility of computer generated, algorithm-based heparin dosing recommendations.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>The objective of this study was to predict the effects of heparin treatment using machine learning methods to optimize heparin dosing in intensive care units based on the predictions. Patient state predictions were based upon activated partial thromboplastin time in 3 different ranges: subtherapeutic, normal therapeutic, and supratherapeutic, respectively.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>Retrospective data from 2 intensive care unit research databases (Multiparameter Intelligent Monitoring in Intensive Care III, MIMIC-III; e–Intensive Care Unit Collaborative Research Database, eICU) were used for the analysis. Candidate machine learning models (random forest, support vector machine, adaptive boosting, extreme gradient boosting, and shallow neural network) were compared in 3 patient groups to evaluate the classification performance for predicting the subtherapeutic, normal therapeutic, and supratherapeutic patient states. The model results were evaluated using precision, recall, F1 score, and accuracy.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Data from the MIMIC-III database (n=2789 patients) and from the eICU database (n=575 patients) were used. In 3-class classification, the shallow neural network algorithm performed the best (F1 scores of 87.26%, 85.98%, and 87.55% for data set 1, 2, and 3, respectively). The shallow neural network algorithm achieved the highest F1 scores within the patient therapeutic state groups: subtherapeutic (data set 1: 79.35%; data set 2: 83.67%; data set 3: 83.33%), normal therapeutic (data set 1: 93.15%; data set 2: 87.76%; data set 3: 84.62%), and supratherapeutic (data set 1: 88.00%; data set 2: 86.54%; data set 3: 95.45%) therapeutic ranges, respectively.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>The most appropriate model for predicting the effects of heparin treatment was found by comparing multiple machine learning models and can be used to further guide optimal heparin dosing. Using multicenter intensive care unit data, our study demonstrates the feasibility of predicting the outcomes of heparin treatment using data-driven methods, and thus, how machine learning–based models can be used to optimize and personalize heparin dosing to improve patient safety. Manual analysis and validation suggested that the model outperformed standard practice heparin treatment dosing.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>heparin</kwd>
        <kwd>dosing</kwd>
        <kwd>machine learning</kwd>
        <kwd>optimization</kwd>
        <kwd>intensive care unit</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>In hospitals, intensive care units are unique in that vast amounts of information are collected and displayed by computerized systems, and that the diagnostic and treatment accuracy can profoundly affect quality of care and patient outcomes [<xref ref-type="bibr" rid="ref1">1</xref>]. Data-driven clinical decision support systems have the potential to help clinicians optimize treatment and medication in an intensive care unit to maximize the medical effect for each individual patient [<xref ref-type="bibr" rid="ref2">2</xref>].</p>
      <p>Heparin is one of the most commonly used medications in intensive care units, and intravenous unfractionated heparin is a fundamental method of anticoagulant therapy. In most clinical practice guidelines, heparin dosing is based only on the patient’s weight; the use of a weight-based heparin dosing nomogram is the standard practice for the treatment of thrombosis [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref4">4</xref>]. For patients who are obese who may not receive the appropriate heparin dose if it is determined based solely on body weight, some suggestions such as reducing the initial infusion rate [<xref ref-type="bibr" rid="ref5">5</xref>-<xref ref-type="bibr" rid="ref7">7</xref>] or using an adjusted body weight [<xref ref-type="bibr" rid="ref8">8</xref>] have been reported. In clinical practice, activated partial thromboplastin time typically reflects blood coagulation level. A high activated partial thromboplastin time means that blood is clotting slowly, whereas a low activated partial thromboplastin time means that blood is clotting quickly. Typically, blood samples are drawn every 4 to 6 hours to monitor activated partial thromboplastin time, and the anticoagulation therapy outcome is measured by whether the activated partial thromboplastin time reaches the therapeutic window in a timely manner; however, the weight-based method easily leads to improper doses which demonstrate subtherapeutic or supratherapeutic activated partial thromboplastin time. In addition, the risk factors that result from inappropriate doses of unfractionated heparin are unclear. Only high initial rates of infusion, advanced age, and being female have been reported to be associated with supratherapeutic activated partial thromboplastin time [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>]. Heparin administration guidelines regarding initial loading dose, maintenance dose and rate, and the activated partial thromboplastin time measurement intervals vary widely among institutions. Additionally, clinicians choose different heparin administration routes such as intravenous push or intravenous drip due based on the immediate circumstances and requirements of the patient.</p>
      <p>Recently, machine learning techniques have dramatically improved the ability of computers to provide clinical decision support, resulting in the possibility of computer generated, algorithm-based heparin dosing recommendations. Multivariate logistic regression [<xref ref-type="bibr" rid="ref11">11</xref>] and multinomial logistic regression [<xref ref-type="bibr" rid="ref12">12</xref>] have been used to estimate heparin dosing with an accuracy of approximately 60%. Algorithms have also been used in studies [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref14">14</xref>] for other anticoagulants such as warfarin dose adjustments, but it was found that high intrapatient variability weakened the prediction accuracy.</p>
      <p>For these reasons, a reliable method that can help doctors quickly predict and optimize heparin doses is urgently needed. It is necessary that modeling and prediction of the therapeutic window of activated partial thromboplastin time take into account multiple factors during patient treatment in order to provide appropriate decision support suggestions which can help guide clinicians in determining and preparing subsequent heparin doses or adjusting dose rate.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Data Set</title>
        <p>Data were extracted from the Multiparameter Intelligent Monitoring In Intensive Care III database (MIMIC-III) [<xref ref-type="bibr" rid="ref15">15</xref>] and e–Intensive Care Unit Collaborative Research database (eICU) [<xref ref-type="bibr" rid="ref16">16</xref>] with the goal of comparing multiple predictive models and evaluating the results in different groups of patients. A cross-database evaluation was conducted. The MIMIC-III database and eICU database are free and open data sets containing medical data. The MIMIC-III database contains data from the intensive care unit at the Beth Israel Deaconess Medical Center and is published by the Laboratory for Computational Physiology at Massachusetts Institute of Technology. The eICU database, published by the Philips e–Intensive Care Unit Research Institute, is populated with data from a combination of many critical care units throughout the continental United States. Data were extracted from the databases for 14,806 adult patients who received heparin therapy during their stay in the intensive care unit. Only patient data with activated partial thromboplastin time measurements taken 4 to 6 hours after their initial heparin dose administration were used which reduced the cohort size to 3835. We chose 4 to 6 hours based on past experience and previous research [<xref ref-type="bibr" rid="ref11">11</xref>]; it is the period within which the first activated partial thromboplastin time measurement typically occurred for the greatest proportion of patients. In clinical practice, there are different administration routes to deliver medication. Both intravenous push and intravenous drip are commonly used to deliver heparin, and in practice, are chosen based on patient condition and doctor preference; therefore, patient data were further classified by administration route—intravenous push (data set 1) and intravenous drip (data sets 2 and 3).</p>
      </sec>
      <sec>
        <title>Feature Selection</title>
        <p>The outcome of interest was activated partial thromboplastin time 4 to 6 hours after initial heparin infusion. Since the data were from the Beth Israel Deaconess Medical Center, we applied the definition of therapeutic time used at Beth Israel Deaconess Medical Center for the definition of therapeutic time of activated partial thromboplastin time in this study to ensure consistency. Normal therapeutic was defined as activated partial thromboplastin times from 60 seconds to 100 seconds, supratherapeutic was defined as activated partial thromboplastin times greater than 100 seconds, and subtherapeutic was defined as activated partial thromboplastin times less than 60 seconds [<xref ref-type="bibr" rid="ref11">11</xref>]. Clinical features of interest were selected to optimize the prediction of the therapeutic activated partial thromboplastin time—age, ethnicity, gender, initial heparin dose, interval between initial heparin injection and first measurement of activated partial thromboplastin time, creatinine concentration, type of admission, and the aspartate aminotransferase to alanine aminotransferase ratio (AST/ALT ratio). These features contribute as a whole to patient outcomes, for example, creatinine in the blood is almost entirely filtered into the urine via glomerular filtration, and its concentration is stable under normal circumstances; therefore, creatinine concentration in the blood can be used as an indicator of renal function because it reflects the filtration function of glomeruli. Aspartate aminotransferase and alanine aminotransferase concentration levels in the blood are sensitive to hepatocellular damage, and their ratio is an important indicator of liver function. These features have been reported and discussed in another study [<xref ref-type="bibr" rid="ref11">11</xref>], and many of the features exhibited statistically significant relationships with the first measurement of activated partial thromboplastin time after initial heparin dose.</p>
      </sec>
      <sec>
        <title>Data Preprocessing</title>
        <p>Patient data were preprocessed, and the features of interest were coded and normalized as variables. Missing values for some features were filled using the <italic>k</italic>–nearest neighbors algorithm which uses Euclidean distance to fill in missing values based on the values of its nearest neighbors in <italic>k</italic> dimensions.</p>
        <p>Extreme values in data affect both the training and prediction processes. Normalization is needed when preprocessing continuous features; however, extreme values, though they may be few, negatively affect the output of normalization. Continuous features (age, heparin dose, creatinine value, and AST/ALT ratio) were manually verified to have <italic>z</italic> scores within the range of –3 to +3. According to the statistical definition of outliers [<xref ref-type="bibr" rid="ref17">17</xref>], the normal range should be from <italic>z</italic>=−3 to <italic>z</italic>=+3; therefore, <italic>z</italic> scores outside of this range should be removed prior to normalization. Age data were found to be within the normal range; however, outliers were removed from initial heparin dose, creatinine concentration, and AST/ALT ratio data.</p>
      </sec>
      <sec>
        <title>Model Training and Performance Tuning</title>
        <p>The activated partial thromboplastin time value measured 4 to 6 hours after the initial heparin dose was classified using ternary classification into sub, normal, and supratherapeutic. The support vector machine, random forest, adaptive boosting, extreme gradient boosting, and shallow neural network algorithms were implemented and tested in this study.</p>
        <p>A support vector machine is based on maximization of the margin (ie, the minimum distance from the separating hyperplane to the nearest data point) between 2 classes of data. A Gaussian kernel guarantees that classification is nonlinear. Adaptive boosting, extreme gradient boosting, and random forest methods are based upon the use of boosting as the method of learning. Boosting methods select features that are known to improve model predictive power, and thus simultaneously, to reduce dimensionality. Where typically sample features are the outputs of a weak classifier that has been applied to each sample, adaptive boosting trains different weak classifiers by changing the weight of the samples, and the weak class is combined into a weighted sum that represents the final output of the boosted classifier. Extreme gradient boosting is based on gradient boosting, a process in which the algorithm learns an ensemble of boosted trees and makes a careful tradeoff between the classification error and model complexity. Extreme gradient boosting has recently become dominant in the field of applied machine learning (for example, in Kaggle competitions for structured or tabular data) [<xref ref-type="bibr" rid="ref18">18</xref>]. The random forest method grows multiple decision trees, each of which provides a classification. The forest chooses the final output by the classification that has the majority. Artificial neural networks are built of multiple layers of neurons; each neuron receives a number of input variables and passes on the results to neurons in the next layer. An artificial neural network can learn complex functions relating input to output variables and is able to deal with complex relationships between variables and functions. Our shallow neural network was built using TensorFlow (version 1.13.1).</p>
        <p>Samples from subtherapeutic, normal therapeutic, and supratherapeutic data groups were included at a 1:1:1 ratio for training and validation of the ternary classification model. Each data set was divided into 80% training and cross-validation and 20% testing.</p>
        <p>The best parameters for the support vector machine, random forest, adaptive boosting, and extreme gradient boosting algorithms were searched (GridSearch; scikitlearn package) and used to train the models. In the shallow neural network model, 2 hidden layers were used, and the number of neurons was set at 36/24 to reduce model complexity. To avoid overfitting, early stopping and regularization were needed. Dropout was also used since it is an effective method to avoiding overfitting and to improve robustness. The rectified linear unit activation function was chosen to increase nonlinearity [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref19">19</xref>]. The Adam optimizer was used in model training with an initial learning rate of 0.0015. We trained the model for 1500 epochs with the dropout rate set at 0.75. To validate the predictive performance of our models, 5-fold cross-validation was used on each.</p>
      </sec>
      <sec>
        <title>Model Evaluation</title>
        <p>The following measures, <italic>precision</italic> = <italic>true positive</italic>/(<italic>true positive</italic> × <italic>false positive</italic>), <italic>recall</italic> = <italic>true positive</italic>/(<italic>true positive</italic> + <italic>false negative</italic>), <italic>F1 score</italic> = 2 × (<italic>precision</italic> × <italic>recall</italic>)/(<italic>precision</italic> + <italic>recall</italic>), and <italic>accuracy</italic> = (<italic>true positive</italic> + <italic>true negative</italic>)/( <italic>true positive</italic> + <italic>true negative</italic> + <italic>false positive</italic> + <italic>false negative</italic>), were used to evaluate the capability of our 3-class classification model [<xref ref-type="bibr" rid="ref20">20</xref>]. For samples at a ratio of 1:1:1, the microaveraged precision, recall, and F1 score are all equal to the accuracy; therefore, we only compared the average accuracy and macroaveraged precision, recall, and F1 score to gauge the classification performances of these models.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Activated Partial Thromboplastin Time Distribution in the Study Population</title>
        <p>After removing outliers, we extracted data on intravenous push patients (data set 1, n=1758) and intravenous drip patients (data set 2, n=1031) who met our inclusion criteria from the MIMIC-III database and data on intravenous drip patients (data set 3, n=575) from the eICU database, respectively. In data set 1, 25.3% (445/1758) of patients had measured values of activated partial thromboplastin time within the normal therapeutic range, 51.3% (901/1758) had measured values of activated partial thromboplastin time within the subtherapeutic range, and 23.4% (412/1758) had measured values of activated partial thromboplastin time within the supratherapeutic range. In data set 2, 27.0% (279/1031), 48.1% (496/1031), and 24.9% (256/1031) of patients had measured values of activated partial thromboplastin time within the normal, subtherapeutic, and supratherapeutic ranges, respectively, as shown in <xref rid="figure1" ref-type="fig">Figure 1</xref>. In data set 3, 27.6% (158/575), 59.0% (339/575), and 13.6% (78/575) of patients had measured values of activated partial thromboplastin time within the normal, subtherapeutic, and supratherapeutic ranges, respectively.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Patient distribution of aPPT value after initial heparin dosing.</p>
          </caption>
          <graphic xlink:href="medinform_v8i6e17648_fig1.png" alt-version="no" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Summary Statistics of Selected Features</title>
        <p>A descriptive summary of patient data in data set 1, 2, and 3 according to the therapeutic range of the first measurement of activated partial thromboplastin time after the initial heparin injection is shown in <xref ref-type="table" rid="table1">Table 1</xref>.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Summary statistics of selected features.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="30"/>
            <col width="370"/>
            <col width="190"/>
            <col width="190"/>
            <col width="190"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Patient groups and features</td>
                <td colspan="3">Therapeutic range</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td> </td>
                <td> </td>
                <td>Sub</td>
                <td>Normal</td>
                <td>Supra</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="3">
                  <bold>Data set 1: MIMIC-III<sup>a</sup> intravenous push (N=1756), n</bold>
                </td>
                <td>901</td>
                <td>445</td>
                <td>412</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td colspan="2">Age (years), mean (SD)</td>
                <td>65.4 (14.6)</td>
                <td>68.1 (15.1)</td>
                <td>69.3 (14.2)</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td colspan="2">Initial heparin dose (units/hour), mean (SD)</td>
                <td>907.0 (818.8)</td>
                <td>1224.2 (1097.5)</td>
                <td>1303.5 (908.4)</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td colspan="2">aPTT<sup>b</sup> (hours), mean (SD)</td>
                <td>4.9 (0.6)</td>
                <td>4.9 (0.6)</td>
                <td>4.9 (0.6)</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td colspan="2">
                  <bold>Ethnicity, n (%)</bold>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td> </td>
                <td>White</td>
                <td>639 (70.9)</td>
                <td>311 (69.9)</td>
                <td>291 (70.6)</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td> </td>
                <td>Asian</td>
                <td>11 (1.2)</td>
                <td>5 (1.1)</td>
                <td>7 (1.7)</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td> </td>
                <td>Black</td>
                <td>40 (4.4)</td>
                <td>27 (6.1)</td>
                <td>46 (11.2)</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td> </td>
                <td>Hispanic/Latino</td>
                <td>13 (1.4)</td>
                <td>11 (2.5)</td>
                <td>14 (3.4)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Others</td>
                <td>198 (22.0)</td>
                <td>91 (20.4)</td>
                <td>54 (13.1)</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td colspan="2">
                  <bold>Gender, n (%)</bold>
                </td>
                <td> </td>
                <td> </td>
                <td> </td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td> </td>
                <td>Male</td>
                <td>550 (61.0)</td>
                <td>256 (57.5)</td>
                <td>217 (52.7)</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td> </td>
                <td>Female</td>
                <td>351 (39.0)</td>
                <td>189 (42.5)</td>
                <td>195 (48.3)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">
                  <bold>Admission type, n (%)</bold>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Elective</td>
                <td>111 (12.3)</td>
                <td>26 (5.8)</td>
                <td>15 (3.6)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Emergency</td>
                <td>768 (79.8)</td>
                <td>398(89.4)</td>
                <td>388 (94.2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Urgent</td>
                <td>32 (3.6)</td>
                <td>21 (4.7)</td>
                <td>9 (2.2)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Data set 2: MIMIC-III intravenous drip (N=1031), n</bold>
                </td>
                <td>496</td>
                <td>279</td>
                <td>256</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td colspan="2">Age (years), mean (SD)</td>
                <td>64.9 (15.4)</td>
                <td>68.6 (15.2)</td>
                <td>70.1 (14.8)</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td colspan="2">Initial heparin dose (units/hour), mean (SD)</td>
                <td>969.4 (398.3)</td>
                <td>1148.7 (395.8)</td>
                <td>1229.8 (495.3)</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td colspan="2">aPTT (hours), mean (SD)</td>
                <td>5.0 (0.6)</td>
                <td>4.9 (0.5)</td>
                <td>5.0 (0.6)</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td colspan="2">
                  <bold>Ethnicity, n (%)</bold>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td> </td>
                <td>White</td>
                <td>353 (71.2)</td>
                <td>208 (74.6)</td>
                <td>179 (70.0)</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td> </td>
                <td>Asian</td>
                <td>9 (1.8)</td>
                <td>9 (3.2)</td>
                <td>10 (3.9)</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td> </td>
                <td>Black</td>
                <td>46 (9.3)</td>
                <td>29 (10.4)</td>
                <td>42 (16.4)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Hispanic/Latino</td>
                <td>12 (2.4)</td>
                <td>7 (2.5)</td>
                <td>9 (3.5)</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td> </td>
                <td>Others</td>
                <td>76 (15.3)</td>
                <td>26 (9.3)</td>
                <td>15 (6.2)</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td colspan="2">
                  <bold>Gender, n (%)</bold>
                </td>
                <td> </td>
                <td> </td>
                <td> </td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td> </td>
                <td>Male</td>
                <td>312 (62.9)</td>
                <td>163 (58.4)</td>
                <td>132 (51.6)</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td> </td>
                <td>Female</td>
                <td>184 (37.1)</td>
                <td>116 (41.6)</td>
                <td>124 (48.4)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">
                  <bold>Admission type, n (%)</bold>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Elective</td>
                <td>59 (11.9)</td>
                <td>25 (9.0)</td>
                <td>8 (3.1)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Emergency</td>
                <td>436 (87.9)</td>
                <td>250 (89.6)</td>
                <td>245 (95.7)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Urgent</td>
                <td>1 (0.2)</td>
                <td>4 (1.4)</td>
                <td>3 (1.2)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Data set 3: eICU<sup>d</sup> intravenous drip (N=575), n</bold>
                </td>
                <td>339</td>
                <td>158</td>
                <td>78</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td colspan="2">Age (years), mean (SD)</td>
                <td>64.8 (13.9)</td>
                <td>69.0 (14.4)</td>
                <td>73.1 (12.3)</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td colspan="2">Initial heparin dose (units/hour), mean (SD)</td>
                <td>1005.7 (892.6)</td>
                <td>973.5 (519.3)</td>
                <td>950.4 (539.4)</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td colspan="2">aPTT (hours), mean (SD)</td>
                <td>5.2 (0.6)</td>
                <td>5.2 (0.6)</td>
                <td>5.2 (0.6)</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td colspan="2">
                  <bold>Ethnicity, n (%)</bold>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>
                  <break/>
                </td>
                <td>White</td>
                <td>244 (72.0)</td>
                <td>106 (67.1)</td>
                <td>46 (59.0)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Asian</td>
                <td>4 (1.2)</td>
                <td>2 (1.3)</td>
                <td>2 (2.6)</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td> </td>
                <td>Black</td>
                <td>30 (8.8)</td>
                <td>20 (12.7)</td>
                <td>9 (11.5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Hispanic/Latino</td>
                <td>22 (6.5)</td>
                <td>19 (12.0)</td>
                <td>12 (15.4)</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td> </td>
                <td>Others</td>
                <td>39 (11.5)</td>
                <td>11 (7.0)</td>
                <td>9 (11.5)</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td colspan="2">
                  <bold>Gender, n (%)</bold>
                </td>
                <td> </td>
                <td> </td>
                <td> </td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td> </td>
                <td>Male</td>
                <td>217 (64.3)</td>
                <td>99 (62.7)</td>
                <td>37 (47.4)</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td> </td>
                <td>Female</td>
                <td>122 (35.7)</td>
                <td>59 (37.3)</td>
                <td>41 (52.6)</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td colspan="2">Creatinine (mg/dL), mean (SD)</td>
                <td>1.7 (1.7)</td>
                <td>2.0 (2.1)</td>
                <td>2.0 (1.5)</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td colspan="2">AST/ALT<sup>c</sup>, mean (SD)</td>
                <td>1.5 (1.2)</td>
                <td>1.7 (1.3)</td>
                <td>1.5(1.1)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>Multiparameter Intelligent Monitoring In Intensive Care III database.</p>
            </fn>
            <fn id="table1fn2">
              <p><sup>b</sup>First measurement of activated partial thromboplastin time.</p>
            </fn>
            <fn id="table1fn3">
              <p><sup>c</sup>AST/ALT: aspartate aminotransferase ratio/alanine aminotransferase.</p>
            </fn>
            <fn id="table1fn4">
              <p><sup>d</sup>eICU: e–Intensive Care Unit database.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Data Preprocessing Results</title>
        <p>Outliers were removed for 3 features: heparin dose, creatinine value, and AST/ALT ratio. The statistical outliers are shown in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. Not all patients had a complete set of clinical data, for example, 154 patients were missing AST/ALT ratios, accounting for 8.76% of intravenous push patients (<xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>). An algorithm (<italic>k</italic> nearest neighbors) was used to fill in the missing values. Since filled values accounting for up to 40% have been reported to be appropriate [<xref ref-type="bibr" rid="ref21">21</xref>], we considered the effect of filled features on the activated partial thromboplastin time as reasonable.</p>
      </sec>
      <sec>
        <title>Model Performance Results</title>
        <p>To eliminate category imbalances, we randomly selected 400 samples for each therapeutic state in data set 1, 250 samples for each therapeutic state in data set 2, and 120 samples for each therapeutic state in data set 3. For subtherapeutic and normal therapeutic classes, general downsampling was used to reduce the number of samples, while for the supratherapeutic class we used upsampling to increase the number of samples to 120; therefore, experiments used 1200 samples from data set 1, 750 samples from data set 2, and 360 samples from data set 3. Model performance results are shown in <xref ref-type="table" rid="table2">Table 2</xref>.</p>
        <p>The F1 score provides a comprehensive evaluation of the model. As listed in <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>, extreme gradient boosting achieved the second best F1 scores (77.58%, 73.94%, and 78.85% for data set 1, 2, and 3, respectively), second only to those of the shallow neural network (87.26%, 85.98% and 87.55% for data set 1, 2, and 3, respectively). The adaptive boosting model also performed very well in all 3 data sets (72.80%, 81.67%, and 77.65% for data set 1, 2, and 3, respectively), with scores close to those of extreme gradient boosting (77.58%, 73.94%, and 78.85% for data set 1, 2, and 3, respectively). The random forest performed slightly worse (68.20%, 73.15%, and 65.59% for data set 1, 2, and 3, respectively) than the other 4 models. The confusion matrices of all 5 models are shown in <xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>. In further experiments, the random forest still performed better than other models that were not discussed herein, such as the Naïve Bayes, logistic regression, <italic>k</italic> nearest neighbors, and decision tree, as shown in <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>.</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Macroaveraged scores for the machine learning algorithms.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="370"/>
            <col width="150"/>
            <col width="150"/>
            <col width="150"/>
            <col width="150"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Models</td>
                <td>Precision, %</td>
                <td>Recall, %</td>
                <td>F1 score, %</td>
                <td>Accuracy, %</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="2">
                  <bold>Data set 1: MIMIC-III<sup>a</sup> (intravenous push patients)</bold>
                </td>
                <td> </td>
                <td> </td>
                <td> </td>
                <td> </td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Random forest</td>
                <td>68.96</td>
                <td>68.75</td>
                <td>68.70</td>
                <td>68.75</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Adaptive boosting</td>
                <td>74.37</td>
                <td>72.92</td>
                <td>72.80</td>
                <td>72.92</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Support vector machine</td>
                <td>85.19</td>
                <td>73.33</td>
                <td>73.79</td>
                <td>73.33</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Extreme gradient boosting</td>
                <td>79.27</td>
                <td>76.25</td>
                <td>77.58</td>
                <td>76.25</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Shallow neural network</td>
                <td>88.05</td>
                <td>86.67</td>
                <td>87.26</td>
                <td>86.67</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Data set 2: MIMIC-III (intravenous drip patients)</bold>
                </td>
                <td> </td>
                <td> </td>
                <td> </td>
                <td> </td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Random forest</td>
                <td>66.71</td>
                <td>65.33</td>
                <td>65.06</td>
                <td>65.33</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Adaptive boosting</td>
                <td>77.29</td>
                <td>77.33</td>
                <td>77.30</td>
                <td>77.33</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Support vector machine</td>
                <td>84.59</td>
                <td>71.33</td>
                <td>71.71</td>
                <td>71.33</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Extreme gradient boosting</td>
                <td>77.45</td>
                <td>77.33</td>
                <td>77.38</td>
                <td>77.33</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Shallow neural network</td>
                <td>85.99</td>
                <td>86.00</td>
                <td>85.98</td>
                <td>86.00</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Data set 3: eICU<sup>b</sup> (intravenous drip patients)</bold>
                </td>
                <td> </td>
                <td> </td>
                <td> </td>
                <td> </td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Random forest</td>
                <td>66.77</td>
                <td>66.56</td>
                <td>65.59</td>
                <td>68.06</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Adaptive boosting</td>
                <td>78.03</td>
                <td>77.78</td>
                <td>77.65</td>
                <td>77.78</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Support vector machine</td>
                <td>84.74</td>
                <td>76.39</td>
                <td>76.19</td>
                <td>76.39</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Extreme gradient boosting</td>
                <td>79.16</td>
                <td>79.17</td>
                <td>78.85</td>
                <td>79.17</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Shallow neural network</td>
                <td>87.80</td>
                <td>87.50</td>
                <td>87.55</td>
                <td>87.50</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>Multiparameter Intelligent Monitoring In Intensive Care III database.</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>eICU: e–Intensive Care Unit database.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>In the subtherapeutic class, adaptive boosting achieved the highest precision in data set 1 (84.48%) while the neural network model achieved highest in the other data sets (data set 2: 83.67%; data set 3: 83.33%). The support vector machine achieved the highest recall in all 3 data sets (data set 1: 100%; data set 2: 100%; data set 3: 95.83%). In the normal therapeutic class, the support vector machine with the Gaussian kernel achieved 100% precision in all 3 data sets. The shallow neural network achieved the highest recall (data set 1: 85.00%; data set 2: 86.00%; data set 3: 91.67%). In the supratherapeutic class, the support vector machine achieved the highest precision (data set 1: 100%; data set 2: 100%; data set 3: 95.24%); however, recall of the support vector machine was not very high (data set 1: 57.50%; data set 2: 58.00%; data set 3: 83.33%). The shallow neural network achieved the best recall in all 3 data sets (data set 1: 100%; data set 2: 100%; data set 3: 95.83%). Considering the comprehensive performance which is best evaluated by F1 score, the shallow neural network achieved the best F1 score in all 3 patient groups: subtherapeutic (data set 1: 79.35%; data set 2: 83.67%; data set 3: 83.33%), normal therapeutic (data set 1: 93.15%; data set 2: 87.76%; data set 3: 84.62%), and supratherapeutic (data set 1: 88.00%; data set 2: 86.54%; data set 3: 95.45%) therapeutic ranges. Additional results are listed in <xref ref-type="table" rid="table3">Table 3</xref>, <xref ref-type="table" rid="table4">Table 4</xref>, and <xref ref-type="table" rid="table5">Table 5</xref>.</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Model performance for subtherapeutic.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="460"/>
            <col width="170"/>
            <col width="170"/>
            <col width="170"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Models</td>
                <td>Precision, %</td>
                <td>Recall, %</td>
                <td>F1 score, %</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="2">
                  <bold>Data set 1: MIMIC-III<sup>a</sup> (intravenous push patients)</bold>
                </td>
                <td> </td>
                <td> </td>
                <td> </td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Random forest</td>
                <td>67.61</td>
                <td>60.00</td>
                <td>63.58</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Adaptive boosting</td>
                <td>84.48</td>
                <td>61.25</td>
                <td>71.01</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Support vector machine</td>
                <td>55.56</td>
                <td>100</td>
                <td>71.43</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Extreme gradient boosting</td>
                <td>74.32</td>
                <td>68.75</td>
                <td>71.43</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Shallow neural network</td>
                <td>79.35</td>
                <td>91.25</td>
                <td>84.89</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Data set 2: MIMIC-III (intravenous drip patients)</bold>
                </td>
                <td> </td>
                <td> </td>
                <td> </td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Random forest</td>
                <td>58.82</td>
                <td>80.00</td>
                <td>67.80</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Adaptive boosting</td>
                <td>78.43</td>
                <td>80.00</td>
                <td>79.21</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Support vector machine</td>
                <td>53.76</td>
                <td>100</td>
                <td>69.93</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Extreme gradient boosting</td>
                <td>74.32</td>
                <td>68.75</td>
                <td>71.43</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Shallow neural network</td>
                <td>83.67</td>
                <td>82.00</td>
                <td>82.83</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Data set 3: eICU<sup>b</sup> (intravenous drip patients)</bold>
                </td>
                <td> </td>
                <td> </td>
                <td> </td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Random forest</td>
                <td>66.67</td>
                <td>58.33</td>
                <td>62.22</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Adaptive boosting</td>
                <td>77.27</td>
                <td>70.83</td>
                <td>73.91</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Support vector machine</td>
                <td>58.97</td>
                <td>95.83</td>
                <td>73.02</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Extreme gradient boosting</td>
                <td>76.00</td>
                <td>79.17</td>
                <td>77.55</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Shallow neural network</td>
                <td>83.33</td>
                <td>83.33</td>
                <td>83.33</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>Multiparameter Intelligent Monitoring In Intensive Care III database.</p>
            </fn>
            <fn id="table3fn2">
              <p><sup>b</sup>eICU: e–Intensive Care Unit database.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>Model performance for normal therapeutic.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="460"/>
            <col width="170"/>
            <col width="170"/>
            <col width="170"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Models</td>
                <td>Precision, %</td>
                <td>Recall, %</td>
                <td>F1 score, %</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="2">
                  <bold>Data set 1: MIMIC-III<sup>a</sup> (intravenous push patients)</bold>
                </td>
                <td> </td>
                <td> </td>
                <td> </td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Random forest</td>
                <td>63.64</td>
                <td>84.00</td>
                <td>72.41</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Adaptive boosting</td>
                <td>71.26</td>
                <td>77.50</td>
                <td>74.25</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Support vector machine</td>
                <td>100</td>
                <td>62.50</td>
                <td>76.92</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Extreme gradient boosting</td>
                <td>78.72</td>
                <td>74.00</td>
                <td>76.29</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Shallow neural network</td>
                <td>93.15</td>
                <td>85.00</td>
                <td>88.89</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Data set 2: MIMIC-III (intravenous drip patients)</bold>
                </td>
                <td> </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Random forest</td>
                <td>73.81</td>
                <td>62.00</td>
                <td>67.39</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Adaptive boosting</td>
                <td>78.43</td>
                <td>80.00</td>
                <td>79.21</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Support vector machine</td>
                <td>100</td>
                <td>56.00</td>
                <td>71.79</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Extreme gradient boosting</td>
                <td>72.55</td>
                <td>74.00</td>
                <td>73.27</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Shallow neural network</td>
                <td>87.76</td>
                <td>86.00</td>
                <td>86.87</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Data set 3: eICU<sup>b</sup> (intravenous drip patients)</bold>
                </td>
                <td> </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Random forest</td>
                <td>70.00</td>
                <td>65.00</td>
                <td>61.90</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Adaptive boosting</td>
                <td>81.82</td>
                <td>53.85</td>
                <td>78.26</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Support vector machine</td>
                <td>100</td>
                <td>50.00</td>
                <td>66.67</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Extreme gradient boosting</td>
                <td>80.00</td>
                <td>66.67</td>
                <td>72.73</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Shallow neural network</td>
                <td>84.62</td>
                <td>91.67</td>
                <td>87.50</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table4fn1">
              <p><sup>a</sup>Multiparameter Intelligent Monitoring In Intensive Care III database.</p>
            </fn>
            <fn id="table4fn2">
              <p><sup>b</sup>eICU: e–Intensive Care Unit database.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table5">
          <label>Table 5</label>
          <caption>
            <p>Model performance for supratherapeutic.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="460"/>
            <col width="170"/>
            <col width="170"/>
            <col width="170"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Models</td>
                <td>Precision, %</td>
                <td>Recall, %</td>
                <td>F1 score, %</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="2">
                  <bold>Data set 1: MIMIC-III<sup>a</sup> (intravenous push patients)</bold>
                </td>
                <td> </td>
                <td> </td>
                <td> </td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Random forest</td>
                <td>75.95</td>
                <td>75.00</td>
                <td>75.47</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Adaptive boosting</td>
                <td>67.37</td>
                <td>80.00</td>
                <td>73.14</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Support vector machine</td>
                <td>100</td>
                <td>57.50</td>
                <td>73.02</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Extreme gradient boosting</td>
                <td>80.77</td>
                <td>78.75</td>
                <td>79.75</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Shallow neural network</td>
                <td>88.00</td>
                <td>82.50</td>
                <td>85.16</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Data set 2: MIMIC-III (intravenous drip patients)</bold>
                </td>
                <td> </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Random forest</td>
                <td>67.50</td>
                <td>54.00</td>
                <td>60.00</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Adaptive boosting</td>
                <td>75.00</td>
                <td>72.00</td>
                <td>73.47</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Support vector machine</td>
                <td>100</td>
                <td>58.00</td>
                <td>73.42</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Extreme gradient boosting</td>
                <td>76.47</td>
                <td>78.00</td>
                <td>77.23</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Shallow neural network</td>
                <td>86.54</td>
                <td>90.00</td>
                <td>88.24</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Data set 3: eICU<sup>b</sup> (intravenous drip patients)</bold>
                </td>
                <td> </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Random forest</td>
                <td>63.64</td>
                <td>87.50</td>
                <td>73.68</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Adaptive boosting</td>
                <td>75.00</td>
                <td>87.50</td>
                <td>80.77</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Support vector machine</td>
                <td>95.24</td>
                <td>83.33</td>
                <td>88.89</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Extreme gradient boosting</td>
                <td>81.48</td>
                <td>91.67</td>
                <td>86.27</td>
              </tr>
              <tr valign="top">
                <td> </td>
                <td>Shallow neural network</td>
                <td>95.45</td>
                <td>87.50</td>
                <td>91.30</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table5fn1">
              <p><sup>a</sup>Multiparameter Intelligent Monitoring In Intensive Care III database.</p>
            </fn>
            <fn id="table5fn2">
              <p><sup>b</sup>eICU: e–Intensive Care Unit database.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Results</title>
        <p>In our experiments, the neural network achieved the highest scores for all evaluation metrics. The neural network model uses multiple layers to progressively extract higher level features from the raw data which might be the reason that the neural network is able to learn some unknown features that help to provide a better classification of normal therapeutic activated partial thromboplastin time. Since different features may be correlated (such as the creatinine value and aspartate aminotransferase), linear classification models are not appropriate. Random forest, adaptive boosting, and extreme gradient boosting are ensemble learning methods. By integrating weak classifiers, classification performance was greatly improved. The support vector machine with Gaussian kernel is a widely used and powerful classifier. Gaussian kernels ensure that the classifier is nonlinear, which suited the characteristics of our data, and the method was able to demonstrate high performance; however, the neural network model was able to take into account complex relationships between the variables with complex functions. Among the methods tested, the shallow neural network performed the best. The shallow neural network achieved performance approximately 10% higher than that of the other algorithms for each metric (precision, recall, F1 score, and accuracy) in intravenous push cases (data set 1) and achieved performance approximately 9% higher than that of the other algorithm metrics in intravenous drip cases (data set 2 and data set 3). Extreme gradient boosting, adaptive boosting, and the support vector machine were the models that subperformed to the shallow neural network although their scores were, nevertheless, all above 70%. The random forest model demonstrated the worst performance.</p>
        <p>As a result of its relative high accuracy, this shallow neural network model should be able to recommend doses better than the heparin dosage guidelines which only take patient weight into account.</p>
        <p>In clinical practice, intravenous push and intravenous drip are both common delivery routes for heparin. Intravenous push heparin is always used to rescue critical patients who require timely intervention to decrease coagulation, while intravenous drip heparin is used a long-term medication to prevent thrombosis or embolic disease. These 2 administration routes have different clinical significance; therefore, we separated the patient groups from the 2 databases into 3 data sets to verify whether they would have different model predictions. The results suggested that model prediction performance was comparable among the 3 data sets, which gave us insight into the stability and suggests the model is stable regardless of administration routes or data source.</p>
      </sec>
      <sec>
        <title>Strengths</title>
        <p>Since the range of normal therapeutic activated partial thromboplastin time varies in different institutions, our shallow neural network model can be adapted to different heparin administration guidelines by adjusting the parameters. Furthermore, the model can also be applied to other drug dosage optimization problems after retraining. When treating a patient, a dose of heparin can be recommended that maximizes the normal therapeutic probability. The future application of the model prediction has the potential to enhance patient safety, minimize the risk of bleeding or a thromboembolic event, reduce medical costs, and improve the efficiency of clinicians.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>One challenge of our study was to identify the features that affect heparin doses. First, balancing both discrete features and continuous features and their relative importance would have enhanced model training performance and feature utilization but was not performed in this study. Second, different features may have been correlated, since they all contribute to the comprehensive conditions of patients; therefore, determining the intrinsic relationships would have further improved model performance. Model optimization and verification using different intensive care unit databases will be performed in future research. Drug interactions with heparin and the accumulated effects are usually not taken into account since the half-time of heparin is too short to affect the 4 to 6–hour interval that was monitored. A more precise neural network structure was not used; the next step would be to explore the intrinsic relationships between features and further validate the model results using additional clinical data sets. Since this study was conducted in a nonclinical setting, it will be further refined as it is used in practice.</p>
      </sec>
      <sec>
        <title>Comparison With Prior Work</title>
        <p>It is difficult to obtain personalized rather than broad normative data to determine drug dosage in intensive care units. Heparin dose is commonly determined based solely upon body weight, which is measured or estimated when patients arrive at the intensive care unit. Here, we distinguished 2 drug delivery routes to provide more detailed advice and choices for clinicians. The overall prediction accuracies for the 3 data sets were 88.00%, 86.00%, and 87.50%. Both delivery routes in the MIMIC-III retrospective data showed proportions of patients with activated partial thromboplastin times that were 3-fold higher than those with normal therapeutic activated partial thromboplastin times (25.3% for intravenous push patients and 27.0% for intravenous drip patients), and higher than those reported in previous studies [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref12">12</xref>] for the multivariate logistic regression (volume under the surface=0.48) and multinomial logistic regression (accuracy=60%). Statistical results were consistent with those from previous reports. Advanced age and gender (female) were reported to be associated with supratherapeutic activated partial thromboplastin time [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>], as well as a high initial heparin dose, a high AST/ALT ratio, and emergency admission-type.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>The study aimed to provide support to predict heparin treatment outcomes and recommend optimal heparin dosing to clinicians. Data-driven machine learning methods were used to predict the probabilities of subtherapeutic, normal therapeutic, and supratherapeutic activated partial thromboplastin time. After comparing different models, we recommend the adoption of a support system comprising a shallow neural network with parameter adjustability. The results of this study provide new insights into personalized medication optimization and demonstrate the feasibility of applying the model in different medical institutions.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Outliers preprocessing.</p>
        <media xlink:href="medinform_v8i6e17648_app1.docx" xlink:title="DOCX File , 41 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>Missing data imputation.</p>
        <media xlink:href="medinform_v8i6e17648_app2.docx" xlink:title="DOCX File , 13 KB"/>
      </supplementary-material>
      <supplementary-material id="app3">
        <label>Multimedia Appendix 3</label>
        <p>Macroaveraged scores of different algorithms on 3 different datasets.</p>
        <media xlink:href="medinform_v8i6e17648_app3.docx" xlink:title="DOCX File , 18 KB"/>
      </supplementary-material>
      <supplementary-material id="app4">
        <label>Multimedia Appendix 4</label>
        <p>Confusion matrix.</p>
        <media xlink:href="medinform_v8i6e17648_app4.docx" xlink:title="DOCX File , 17 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">ALT</term>
          <def>
            <p>alanine aminotransferase</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">AST</term>
          <def>
            <p>aspartate aminotransferase</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">eICU</term>
          <def>
            <p>e–Intensive Care Unit</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">MIMIC-III</term>
          <def>
            <p>Multiparameter Intelligent Monitoring in Intensive Care III (or Medical Information Mart for Intensive Care III)</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This study was supported by the National Key Research &#38; Development Program of China (project 2018YFC0116905).</p>
    </ack>
    <fn-group>
      <fn fn-type="con">
        <p>YL, WZ, and NH are corresponding authors and take responsibility for the integrity of the work as a whole. LS, CL, DL, and JH contributed equally as co–first authors and were responsible for study conception and design. JH, FZ, and HJ were responsible for data cleaning and algorithm implementation. DL, MG, and HW were responsible for data analysis and explanation of results. LS, CL, NH, and JH drafted the manuscript. All authors revised the manuscript for important intellectual content.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>CN</given-names>
            </name>
            <name name-style="western">
              <surname>Bratton</surname>
              <given-names>SL</given-names>
            </name>
            <name name-style="western">
              <surname>Hirshberg</surname>
              <given-names>EL</given-names>
            </name>
          </person-group>
          <article-title>Computerized decision support in adult and pediatric critical care</article-title>
          <source>World J Crit Care Med</source>
          <year>2013</year>
          <month>12</month>
          <day>04</day>
          <volume>2</volume>
          <issue>4</issue>
          <fpage>21</fpage>
          <lpage>8</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.wjgnet.com/2220-3141/full/v2/i4/21.htm"/>
          </comment>
          <pub-id pub-id-type="doi">10.5492/wjccm.v2.i4.21</pub-id>
          <pub-id pub-id-type="medline">24701413</pub-id>
          <pub-id pub-id-type="pmcid">PMC3953873</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pirracchio</surname>
              <given-names>Romain</given-names>
            </name>
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>Mitchell J</given-names>
            </name>
            <name name-style="western">
              <surname>Malenica</surname>
              <given-names>Ivana</given-names>
            </name>
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>Jonathan</given-names>
            </name>
            <name name-style="western">
              <surname>Chambaz</surname>
              <given-names>Antoine</given-names>
            </name>
            <name name-style="western">
              <surname>Cannesson</surname>
              <given-names>Maxime</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>Christine</given-names>
            </name>
            <name name-style="western">
              <surname>Resche-Rigon</surname>
              <given-names>Matthieu</given-names>
            </name>
            <name name-style="western">
              <surname>Hubbard</surname>
              <given-names>Alan</given-names>
            </name>
            <collab>ACTERREA Research Group</collab>
          </person-group>
          <article-title>Big data and targeted machine learning in action to assist medical decision in the ICU</article-title>
          <source>Anaesth Crit Care Pain Med</source>
          <year>2019</year>
          <month>08</month>
          <volume>38</volume>
          <issue>4</issue>
          <fpage>377</fpage>
          <lpage>384</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.sciencedirect.com/science/article/abs/pii/S2352556818302169?via%3Dihub"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.accpm.2018.09.008</pub-id>
          <pub-id pub-id-type="medline">30339893</pub-id>
          <pub-id pub-id-type="pii">S2352-5568(18)30216-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Raschke</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>Reilly</surname>
              <given-names>B M</given-names>
            </name>
            <name name-style="western">
              <surname>Guidry</surname>
              <given-names>J R</given-names>
            </name>
            <name name-style="western">
              <surname>Fontana</surname>
              <given-names>J R</given-names>
            </name>
            <name name-style="western">
              <surname>Srinivas</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>The weight-based heparin dosing nomogram compared with a "standard care" nomogram. A randomized controlled trial</article-title>
          <source>Ann Intern Med</source>
          <year>1993</year>
          <month>12</month>
          <day>01</day>
          <volume>119</volume>
          <issue>9</issue>
          <fpage>874</fpage>
          <lpage>81</lpage>
          <pub-id pub-id-type="doi">10.7326/0003-4819-119-9-199311010-00002</pub-id>
          <pub-id pub-id-type="medline">8214998</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Raschke</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Gollihare</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Peirce</surname>
              <given-names>J C</given-names>
            </name>
          </person-group>
          <article-title>The effectiveness of implementing the weight-based heparin nomogram as a practice guideline</article-title>
          <source>Arch Intern Med</source>
          <year>1996</year>
          <volume>156</volume>
          <issue>15</issue>
          <fpage>1645</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="medline">8694662</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Spruill</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Wade</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Huckaby</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Leslie</surname>
              <given-names>R B</given-names>
            </name>
          </person-group>
          <article-title>Achievement of anticoagulation by using a weight-based heparin dosing protocol for obese and nonobese patients</article-title>
          <source>Am J Health Syst Pharm</source>
          <year>2001</year>
          <month>12</month>
          <day>15</day>
          <volume>58</volume>
          <issue>22</issue>
          <fpage>2143</fpage>
          <lpage>6</lpage>
          <pub-id pub-id-type="doi">10.1093/ajhp/58.22.2143</pub-id>
          <pub-id pub-id-type="medline">11760916</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gerlach</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Folino</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Morris</surname>
              <given-names>Benjamin N</given-names>
            </name>
            <name name-style="western">
              <surname>Murphy</surname>
              <given-names>Claire V</given-names>
            </name>
            <name name-style="western">
              <surname>Stawicki</surname>
              <given-names>Stansilaw P</given-names>
            </name>
            <name name-style="western">
              <surname>Cook</surname>
              <given-names>Charles H</given-names>
            </name>
          </person-group>
          <article-title>Comparison of heparin dosing based on actual body weight in non-obese, obese and morbidly obese critically ill patients</article-title>
          <source>Int J Crit Illn Inj Sci</source>
          <year>2013</year>
          <month>07</month>
          <volume>3</volume>
          <issue>3</issue>
          <fpage>195</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/24404457"/>
          </comment>
          <pub-id pub-id-type="doi">10.4103/2229-5151.119200</pub-id>
          <pub-id pub-id-type="medline">24404457</pub-id>
          <pub-id pub-id-type="pii">IJCIIS-3-195</pub-id>
          <pub-id pub-id-type="pmcid">PMC3883198</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hohner</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Kruer</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Gilmore</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Streiff</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gibbs</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Unfractionated heparin dosing for therapeutic anticoagulation in critically ill obese adults</article-title>
          <source>J Crit Care</source>
          <year>2015</year>
          <month>05</month>
          <volume>30</volume>
          <issue>2</issue>
          <fpage>395</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jcrc.2014.11.020</pub-id>
          <pub-id pub-id-type="medline">25534987</pub-id>
          <pub-id pub-id-type="pii">S0883-9441(14)00486-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>John</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Tesdal</surname>
              <given-names>Emily</given-names>
            </name>
          </person-group>
          <article-title>Evaluation of heparin dosing based on adjusted body weight in obese patients</article-title>
          <source>Am J Health Syst Pharm</source>
          <year>2016</year>
          <month>10</month>
          <day>01</day>
          <volume>73</volume>
          <issue>19</issue>
          <fpage>1512</fpage>
          <lpage>22</lpage>
          <pub-id pub-id-type="doi">10.2146/ajhp150388</pub-id>
          <pub-id pub-id-type="medline">27646813</pub-id>
          <pub-id pub-id-type="pii">73/19/1512</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Melloni</surname>
              <given-names>Chiara</given-names>
            </name>
            <name name-style="western">
              <surname>Alexander</surname>
              <given-names>Karen P</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Anita Y</given-names>
            </name>
            <name name-style="western">
              <surname>Newby</surname>
              <given-names>L Kristin</given-names>
            </name>
            <name name-style="western">
              <surname>Roe</surname>
              <given-names>Matthew T</given-names>
            </name>
            <name name-style="western">
              <surname>Allen LaPointe</surname>
              <given-names>Nancy M</given-names>
            </name>
            <name name-style="western">
              <surname>Pollack</surname>
              <given-names>Charles V</given-names>
            </name>
            <name name-style="western">
              <surname>Gibler</surname>
              <given-names>W Brian</given-names>
            </name>
            <name name-style="western">
              <surname>Ohman</surname>
              <given-names>E Magnus</given-names>
            </name>
            <name name-style="western">
              <surname>Peterson</surname>
              <given-names>Eric D</given-names>
            </name>
            <collab>CRUSADE Investigators</collab>
          </person-group>
          <article-title>Unfractionated heparin dosing and risk of major bleeding in non-ST-segment elevation acute coronary syndromes</article-title>
          <source>Am Heart J</source>
          <year>2008</year>
          <month>08</month>
          <volume>156</volume>
          <issue>2</issue>
          <fpage>209</fpage>
          <lpage>15</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1016/j.ahj.2008.03.023"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ahj.2008.03.023</pub-id>
          <pub-id pub-id-type="medline">18657648</pub-id>
          <pub-id pub-id-type="pii">S0002-8703(08)00233-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Wali</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Menon</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Berkowitz</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Thompson</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Califf</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Topol</surname>
              <given-names>Eric J</given-names>
            </name>
            <name name-style="western">
              <surname>Granger</surname>
              <given-names>Christopher B</given-names>
            </name>
            <name name-style="western">
              <surname>Hochman</surname>
              <given-names>Judith S</given-names>
            </name>
          </person-group>
          <article-title>The determinants of activated partial thromboplastin time, relation of activated partial thromboplastin time to clinical outcomes, and optimal dosing regimens for heparin treated patients with acute coronary syndromes: a review of GUSTO-IIb</article-title>
          <source>J Thromb Thrombolysis</source>
          <year>2002</year>
          <month>10</month>
          <volume>14</volume>
          <issue>2</issue>
          <fpage>91</fpage>
          <lpage>101</lpage>
          <pub-id pub-id-type="doi">10.1023/a:1023235926825</pub-id>
          <pub-id pub-id-type="medline">12714828</pub-id>
          <pub-id pub-id-type="pii">5120285</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ghassemi</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Richter</surname>
              <given-names>SE</given-names>
            </name>
            <name name-style="western">
              <surname>Eche</surname>
              <given-names>IM</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>TW</given-names>
            </name>
            <name name-style="western">
              <surname>Danziger</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Celi</surname>
              <given-names>LA</given-names>
            </name>
          </person-group>
          <article-title>A data-driven approach to optimized medication dosing: a focus on heparin</article-title>
          <source>Intensive Care Med</source>
          <year>2014</year>
          <month>10</month>
          <day>5</day>
          <volume>40</volume>
          <issue>9</issue>
          <fpage>1332</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/25091788"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s00134-014-3406-5</pub-id>
          <pub-id pub-id-type="medline">25091788</pub-id>
          <pub-id pub-id-type="pmcid">PMC4157935</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ghassemi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Alhanai</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Westover</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Mark</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Nemati</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Personalized Medication Dosing Using Volatile Data Streams</article-title>
          <source>Workshops at the Thirty-Second AAAI Conference on Artificial Intelligence</source>
          <year>2018</year>
          <month>06</month>
          <day>20</day>
          <conf-name>Personalized medication dosing using volatile data streams. Workshops at the Thirty-Second AAAI Conference on Artificial Intelligence</conf-name>
          <conf-date>2018</conf-date>
          <conf-loc>the Hilton New Orleans Riverside, New Orleans, Louisiana, USA</conf-loc>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://aaai.org/ocs/index.php/WS/AAAIW18/paper/view/17234"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Grzymala-Lubanski</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Själander</surname>
              <given-names>Sara</given-names>
            </name>
            <name name-style="western">
              <surname>Renlund</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Svensson</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Själander</surname>
              <given-names>Anders</given-names>
            </name>
          </person-group>
          <article-title>Computer aided warfarin dosing in the Swedish national quality registry AuriculA - Algorithmic suggestions are performing better than manually changed doses</article-title>
          <source>Thromb Res</source>
          <year>2013</year>
          <month>03</month>
          <volume>131</volume>
          <issue>2</issue>
          <fpage>130</fpage>
          <lpage>4</lpage>
          <pub-id pub-id-type="doi">10.1016/j.thromres.2012.11.016</pub-id>
          <pub-id pub-id-type="medline">23232091</pub-id>
          <pub-id pub-id-type="pii">S0049-3848(12)00837-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jacobs</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Personalized anticoagulant management using reinforcement learning</article-title>
          <source>ELECTRONIC THESES AND DISSERTATIONS</source>
          <year>2014</year>
          <month>05</month>
          <fpage>670</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ir.library.louisville.edu/etd/670/"/>
          </comment>
          <pub-id pub-id-type="doi">10.18297/etd/670</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>AE</given-names>
            </name>
            <name name-style="western">
              <surname>Pollard</surname>
              <given-names>TJ</given-names>
            </name>
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Lehman</surname>
              <given-names>LH</given-names>
            </name>
            <name name-style="western">
              <surname>Feng</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ghassemi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Moody</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Szolovits</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Celi</surname>
              <given-names>Leo Anthony</given-names>
            </name>
            <name name-style="western">
              <surname>Mark</surname>
              <given-names>RG</given-names>
            </name>
          </person-group>
          <article-title>MIMIC-III, a freely accessible critical care database</article-title>
          <source>Sci Data</source>
          <year>2016</year>
          <month>05</month>
          <day>24</day>
          <volume>3</volume>
          <issue>1</issue>
          <fpage>160035</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/27219127"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/sdata.2016.35</pub-id>
          <pub-id pub-id-type="medline">27219127</pub-id>
          <pub-id pub-id-type="pii">sdata201635</pub-id>
          <pub-id pub-id-type="pmcid">PMC4878278</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pollard</surname>
              <given-names>TJ</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>AEW</given-names>
            </name>
            <name name-style="western">
              <surname>Raffa</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Celi</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Mark</surname>
              <given-names>RG</given-names>
            </name>
            <name name-style="western">
              <surname>Badawi</surname>
              <given-names>O</given-names>
            </name>
          </person-group>
          <article-title>The eICU Collaborative Research Database, a freely available multi-center database for critical care research</article-title>
          <source>Sci Data</source>
          <year>2018</year>
          <month>09</month>
          <day>11</day>
          <volume>5</volume>
          <issue>1</issue>
          <fpage>180178</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30204154"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/sdata.2018.178</pub-id>
          <pub-id pub-id-type="medline">30204154</pub-id>
          <pub-id pub-id-type="pii">sdata2018178</pub-id>
          <pub-id pub-id-type="pmcid">PMC6132188</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cousineau</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Chartier</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Outliers detection and treatment: a review</article-title>
          <source>Int. j. psychol. res</source>
          <year>2010</year>
          <month>06</month>
          <day>30</day>
          <volume>3</volume>
          <issue>1</issue>
          <fpage>58</fpage>
          <lpage>67</lpage>
          <pub-id pub-id-type="doi">10.21500/20112084.844</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Guestrin</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>XGBoost: a scalable tree boosting system</article-title>
          <source>Proceedings of the 22nd ACM SIGKDD international Conference on Knowledge Discovery and Data Mining</source>
          <year>2016</year>
          <month>08</month>
          <conf-name>Knowledge Discovery and Data Mining</conf-name>
          <conf-date>August 2016</conf-date>
          <conf-loc>San Francisco</conf-loc>
          <fpage>785</fpage>
          <lpage>794</lpage>
          <pub-id pub-id-type="doi">10.1145/2939672.2939785</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Krizhevsky</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sutskever</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Hinton</surname>
              <given-names>GE</given-names>
            </name>
          </person-group>
          <article-title>ImageNet classification with deep convolutional neural networks</article-title>
          <source>Neural Information Processing Systems 25</source>
          <year>2012</year>
          <conf-name>International Conference on Neural Information Processing Systems</conf-name>
          <conf-date>2012</conf-date>
          <conf-loc>Lake Tahoe, Nevada, United States</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sokolova</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lapalme</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>A systematic analysis of performance measures for classification tasks</article-title>
          <source>Information Processing &#38; Management</source>
          <year>2009</year>
          <month>7</month>
          <volume>45</volume>
          <issue>4</issue>
          <fpage>427</fpage>
          <lpage>437</lpage>
          <pub-id pub-id-type="doi">10.1016/j.ipm.2009.03.002</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Farhangfar</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kurgan</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Dy</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Impact of imputation of missing values on classification error for discrete data</article-title>
          <source>Pattern Recognition</source>
          <year>2008</year>
          <month>12</month>
          <volume>41</volume>
          <issue>12</issue>
          <fpage>3692</fpage>
          <lpage>3705</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1016/j.patcog.2008.05.019"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.patcog.2008.05.019</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
