<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id>
      <journal-title>JMIR Medical Informatics</journal-title>
      <issn pub-type="epub">2291-9694</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v7i1e11728</article-id>
      <article-id pub-id-type="pmid">30747712</article-id>
      <article-id pub-id-type="doi">10.2196/11728</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Development of Prediction Models Using Machine Learning Algorithms for Girls with Suspected Central Precocious Puberty: Retrospective Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Eysenbach</surname>
            <given-names>Gunther</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Cai</surname>
            <given-names>Pengshan</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Chen</surname>
            <given-names>Jinying</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="author" id="contrib1" equal-contrib="yes">
          <name name-style="western">
            <surname>Pan</surname>
            <given-names>Liyan</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-7306-4916</ext-link>
        </contrib>
        <contrib contrib-type="author" id="contrib2" equal-contrib="yes">
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>Guangjian</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-9275-9214</ext-link>
        </contrib>
        <contrib contrib-type="author" id="contrib3" equal-contrib="yes">
          <name name-style="western">
            <surname>Mao</surname>
            <given-names>Xiaojian</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-4915-4903</ext-link>
        </contrib>
        <contrib contrib-type="author" id="contrib4">
          <name name-style="western">
            <surname>Li</surname>
            <given-names>Huixian</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-5722-8602</ext-link>
        </contrib>
        <contrib contrib-type="author" id="contrib5">
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>Jiexin</given-names>
          </name>
          <degrees>BD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-1630-380X</ext-link>
        </contrib>
        <contrib contrib-type="author" id="contrib6" equal-contrib="yes">
          <name name-style="western">
            <surname>Liang</surname>
            <given-names>Huiying</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-9987-8002</ext-link>
        </contrib>
        <contrib contrib-type="author" id="contrib7" corresp="yes" equal-contrib="yes">
          <name name-style="western">
            <surname>Li</surname>
            <given-names>Xiuzhen</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <address>
            <institution>Department of Genetics and Endocrinology</institution>
            <institution>Guangzhou Women and Children’s Medical Center</institution>
            <institution>Guangzhou Medical University</institution>
            <addr-line>9 Jinsui Road</addr-line>
            <addr-line>Tianhe District</addr-line>
            <addr-line>Guangzhou, 510623</addr-line>
            <country>China</country>
            <phone>86 02038857692</phone>
            <fax>86 02038857692</fax>
            <email>13725100840@163.com</email>
          </address>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-5124-3051</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
      <label>1</label>
      <institution>Institute of Pediatrics</institution>
      <institution>Guangzhou Women and Children's Medical Center</institution>  
      <institution>Guangzhou Medical University</institution>  
      <addr-line>Guangzhou</addr-line>
      <country>China</country></aff>
      <aff id="aff2">
      <label>2</label>
      <institution>Department of Genetics and Endocrinology</institution>
      <institution>Guangzhou Women and Children’s Medical Center</institution>  
      <institution>Guangzhou Medical University</institution>  
      <addr-line>Guangzhou</addr-line>
      <country>China</country></aff>
      <author-notes>
        <corresp>Corresponding Author: Xiuzhen Li 
        <email>13725100840@163.com</email></corresp>
      </author-notes>
      <pub-date pub-type="collection"><season>Jan-Mar</season><year>2019</year></pub-date>
      <pub-date pub-type="epub">
        <day>12</day>
        <month>02</month>
        <year>2019</year>
      </pub-date>
      <volume>7</volume>
      <issue>1</issue>
      <elocation-id>e11728</elocation-id>
      <!--history from ojs - api-xml-->
      <history>
        <date date-type="received">
          <day>30</day>
          <month>7</month>
          <year>2018</year>
        </date>
        <date date-type="rev-request">
          <day>6</day>
          <month>9</month>
          <year>2018</year>
        </date>
        <date date-type="rev-recd">
          <day>10</day>
          <month>10</month>
          <year>2018</year>
        </date>
        <date date-type="accepted">
          <day>9</day>
          <month>12</month>
          <year>2018</year>
        </date>
      </history>
      <copyright-statement>©Liyan Pan, Guangjian Liu, Xiaojian Mao, Huixian Li, Jiexin Zhang, Huiying Liang, Xiuzhen Li. Originally published in JMIR Medical Informatics (http://medinform.jmir.org), 12.02.2019.</copyright-statement>
      <copyright-year>2019</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on http://medinform.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="http://medinform.jmir.org/2019/1/e11728/" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Central precocious puberty (CPP) in girls seriously affects their physical and mental development in childhood. The method of diagnosis—gonadotropin-releasing hormone (GnRH)–stimulation test or GnRH analogue (GnRHa)–stimulation test—is expensive and makes patients uncomfortable due to the need for repeated blood sampling.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>We aimed to combine multiple CPP–related features and construct machine learning models to predict response to the GnRHa-stimulation test.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>In this retrospective study, we analyzed clinical and laboratory data of 1757 girls who underwent a GnRHa test in order to develop XGBoost and random forest classifiers for prediction of response to the GnRHa test. The local interpretable model-agnostic explanations (LIME) algorithm was used with the black-box classifiers to increase their interpretability. We measured sensitivity, specificity, and area under receiver operating characteristic (AUC) of the models.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Both the XGBoost and random forest models achieved good performance in distinguishing between positive and negative responses, with the AUC ranging from 0.88 to 0.90, sensitivity ranging from 77.91% to 77.94%, and specificity ranging from 84.32% to 87.66%. Basal serum luteinizing hormone, follicle-stimulating hormone, and insulin-like growth factor-I levels were found to be the three most important factors. In the interpretable models of LIME, the abovementioned variables made high contributions to the prediction probability.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>The prediction models we developed can help diagnose CPP and may be used as a prescreening tool before the GnRHa-stimulation test.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>central precocious puberty</kwd>
        <kwd>GnRHa-stimulation test</kwd>
        <kwd>machine learning</kwd>
        <kwd>prediction model</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Precocious puberty is related to the development of secondary sexual characteristics in girls before the age of 8 years and in boys before the age of 9 years. In recent years, the age of puberty onset has shown a decreasing trend, and puberty is related to subsequent health outcomes such as breast cancer, diabetes, and behavioral disorders [<xref ref-type="bibr" rid="ref1">1</xref>]. Central precocious puberty (CPP), also known as true precocious puberty, is caused by early activation of the hypothalamic-pituitary-gonadal axis with clinical pubertal symptoms. CPP can influence final adult height and result in psychological problems, which will cause inappropriate behaviors. It is important for girls with suspected CPP to be evaluated and diagnosed in a timely manner.</p>
      <p>The gold standard in the confirmation of CPP is the positive response of gonadotropin to a gonadotropin-releasing hormone (GnRH)–stimulation test. In the absence of GnRH, GnRH analogues (GnRHa) are usually used instead [<xref ref-type="bibr" rid="ref2">2</xref>]. However, the stimulation test is time consuming and expensive. Besides, the test is painful and make patients uncomfortable due to the need for repeated blood sampling at different time points. Therefore, another method to avoid the disadvantages of the GnRHa-stimulation test will be of great help in the diagnosis of CPP.</p>
      <p>Several studies have focused on investigating a single gonadotropin biomarker to identify patients with CPP conveniently. Basal or peak serum luteinizing hormone (LH), follicle-stimulation hormone (FSH), and the ratio LH/FSH are the most common biomarkers reported [<xref ref-type="bibr" rid="ref3">3</xref>-<xref ref-type="bibr" rid="ref7">7</xref>]. However, the cut-off values of these single biomarkers depend on the assay used to measure the gonadotropin levels. As a result, cut-off points in previous studies differed widely. Moreover, both the Pasternak group [<xref ref-type="bibr" rid="ref3">3</xref>] and the Mogensen group [<xref ref-type="bibr" rid="ref8">8</xref>] reported that a single basal serum LH measurement could verify the presence of CPP, but could not confirm the absence of CPP. Therefore, a single gonadotropin parameter alone may not be sufficient for the diagnosis of CPP, and clinical and laboratory factors that can predict response to the GnRHa-stimulation test should be combined [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>]. Suh et al [<xref ref-type="bibr" rid="ref10">10</xref>] found that accelerated growth rate, advanced bone age, and increased basal gonadotropin and insulin-like growth factor-I (IGF-I) levels were correlated with CPP. Traditional statistical analysis including <italic>t</italic> test and binary logistic regression were used to select factors correlated with the GnRH test [<xref ref-type="bibr" rid="ref11">11</xref>-<xref ref-type="bibr" rid="ref14">14</xref>]. Although remarkable progress has been made in these studies, there is a long way to go for their application in clinics due to the low sensitivity or specificity of tests.</p>
      <p>Considering the previous studies and the extensive application of machine learning algorithms in the medical field, we aimed to determine whether combining multiple variables with machine learning classifiers could improve prediction of the GnRHa-stimulation test and thus help diagnose CPP.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Population and Variables</title>
        <p>We enrolled 1757 girls with CPP symptoms who visited the Pediatric Day Ward of the Endocrinology Department at Guangzhou Women and Children’s Medical Center from January 2012 to March 2018. All subjects had undergone the GnRHa-stimulation test. Girls with any other disorders or intracranial lesions were excluded from the study.</p>
        <p>Girls fulfilling the following eligibility criteria were considered to have a positive response to the GnRHa-stimulation test and were diagnosed with CPP in our study: (1) peak LH level ≥ 10 IU/L or peak LH level ≥ 5 IU/L combined with a ratio of peak LH to FSH value ≥ 0.6 and (2) onset of secondary sexual characteristics at the age &lt; 8 years. Girls whose laboratory tests did not satisfy all the abovementioned criteria were considered to have a negative response. According to the long-term clinical practices, the first condition with a peak LH ≥ 10 IU/L is used as the diagnosing criterion in our hospital. Peak LH level ≥ 5 IU/L combined with a ratio of peak LH to FSH value ≥ 0.6 is widely used in China and some other countries for children undergoing the GnRH-stimulation test [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref16">16</xref>]. Since the stimulation effect of GnRHa is almost hundreds times that of GnRH [<xref ref-type="bibr" rid="ref17">17</xref>], a condition that affects the levels of sex hormones due to GnRH would do the same with GnRHa. Our diagnostic criteria are an improved version of the existing criteria that are adapted to our population.</p>
        <p>Information such as chief complaints, development of secondary sexual characters, and abnormal duration of puberty were stored as free text in the clinical records of the electronic medical records system. Laboratory test values were reported as structured data in the laboratory information system. In total, 19 variables were extracted from the clinical records and laboratory results for all the 1757 patients. Specifically, 10 variables extracted from the clinical records were weight, height, body mass index (BMI), abnormal duration of puberty in records (History), menarche, core in breast (Core), pigmentation, development stage of pubes (Pubes), development stage of left breast, and development stage of right breast. Breast and pubic hair development were evaluated using Tanner staging (stages 1 to 5). Nine variables extracted from the laboratory results were age, basal serum LH, FSH, estradiol, prolactin, testosterone, growth hormone, IGF-I, IGF-binding protein-3 levels before the GnRHa test.</p>
        <p>Among the 1757 patients, 436 girls had examination reports available, including pelvic ultrasonography (for development of the uterus and ovaries) and radiography of the left hand (for bone age). Six variables extracted from the examination reports were development of uterus, existence of follicle, uterine volume, left and right ovary volumes, and bone age. Bone age was measured by the Greulich and Pyle method [<xref ref-type="bibr" rid="ref18">18</xref>]. The variables from the clinical records and the examination reports were extracted first with traditional regex match using Python [<xref ref-type="bibr" rid="ref19">19</xref>] and then examined manually by two endocrinologists.</p>
        <p>This study was approved by the Institutional Review Board of Guangzhou Women and Children’s Medical Center and conducted in accordance with the ethical guidelines of the Declaration of Helsinki of the World Medical Association. The requirement to obtain informed consent was waived because of the retrospective nature of the study. Data used in this study were anonymous, and no identifiable personal data of the patients were available for the analysis.</p>
      </sec>
      <sec>
        <title>Data Preprocessing</title>
        <p>Variables with more than 20% missing data, such as growth rate of height and weight and heights of parents, were excluded from this study. Missing values for continuous variables were replaced with mean values of all the samples grouped by age. Discrete variables like experience of menarche were filled with a value of 0. Discrete variables like Tanner stage for breast and pubes were filled with the least degree (stage 1).</p>
      </sec>
      <sec>
        <title>Model Development and Assessment</title>
        <p>Tree learning classifiers allow nonlinear interactions between features and have good interpretability. Considering this, we selected two tree-based ensemble binary classification algorithms—extreme gradient boosting (XGBoost) and random forest—to develop our models. We also used linear supported vector machines (SVM) and decision trees for the classification to compare the performance between ensemble models and nonensemble models. The models aimed to identify relationships between the input features and the output GnRHa test results, thereby determining whether a patient responds positively to the GnRHa test.</p>
        <p>XGBoost is a scalable tree boosting and effective learning algorithm [<xref ref-type="bibr" rid="ref20">20</xref>]. It trains a sequence of models to minimize errors made by existing models. Models in XGBoost are decision trees. Many data scientists have applied this algorithm to solve classification problems and achieved excellent results. XGBoost has also been successfully used in medical studies [<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref22">22</xref>]. As XGBoost is essentially a gradient boosting tree model, which is not based on distance, normalization is not required. Random forest is another classical ensemble learning algorithm with a combination of a large amount of trees [<xref ref-type="bibr" rid="ref23">23</xref>], which trains decision trees in parallel by using data with replacement. It applies bootstrap aggregating to tree learners, which leads to better performance as variance decreases. Random forest has the ability to handle nonlinear data and is robust to noise. Besides, parameter tuning is not that complex for these two algorithms compared to other ensemble learning algorithms. SVM is a binary classifier with a maximum margin hyperplane [<xref ref-type="bibr" rid="ref24">24</xref>]. The decision tree classifier is a tree-like model used for classification [<xref ref-type="bibr" rid="ref25">25</xref>].</p>
        <p>In order to obtain robust assessments and prevent overfitting, we used a nested cross-validation with an outer Monte Carlo cross-validation [<xref ref-type="bibr" rid="ref26">26</xref>] (MCCV, repeated 20 times) and an inner k-fold cross-validation (k=5) for parameter tuning, yielding a total of 20 times the five-fold cross-validation. In the outer MCCV loop, the whole data set is randomly divided into the training set (80%) and the test set (20%) for 20 times. For each training set, the inner stratified five-fold cross-validation loop is performed as follows. The training set is split into five subsets, where four subsets are used for training and one is used for test. Parameter tuning is performed with grid search in the inner cross-validation. Finally, a model fitted on the training set with parameters that has the best area under the curve (AUC) evaluated on the inner test set is determined. The detailed training and test process is presented in <xref ref-type="fig" rid="figure1">Figure 1</xref>.</p>
      </sec>
      <sec>
        <title>Feature Importance</title>
        <p>XGBoost and random forest classifier have the ability to evaluate the importance of features. Feature importance is a feature weight and can represent the contribution to prediction. In XGBoost, feature importance is computed by the sum of times that the feature is selected as a tree node. In random forest, feature importance is calculated based on the out-of-bag (OOB) error. OOB error is the mean prediction error for training observations in the respective bootstrap sample. After randomly adding noise perturbations to OOB samples, a feature with a higher OOB error difference is more important, with higher feature importance. For both models, each feature obtained 20 feature importance values with 20 times the MCCV. We summed all the feature importance values for each feature and obtained a rank for all features.</p>
      </sec>
      <sec>
        <title>Model Interpretation</title>
        <p>One disadvantage of machine learning is that the model usually runs as a black box. However, it is necessary for a doctor to understand the reasons why a model makes such a prediction in the clinic, especially when timely detection is necessary. Tree-based models can provide feature importance at a global level but not in a specific case. The local interpretable model-agnostic explanations (LIME) algorithm is developed to identify an interpretable model that is locally faithful for each individual prediction [<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref28">28</xref>]. It provides relative feature contributions for a single instance of the prediction result. LIME generates neighborhood data by randomly perturbing features from the instance. It then learns locally weighted linear models on this neighborhood data to explain each of the classes in an interpretable way. Parameters in LIME mainly include the maximum number of features in explanation, number of neighborhood samples to generate, and machine learning prediction function. We used the LIME library from the original authors for the model interpretation. The number of neighborhood samples is 5000 by default. The parameter num_features (maximum number of features) is the number of features shown in the explanation. The default value is 10. In our study, the value was 9 for a clear layout, as the contributions of features ranked after 9 were almost zero.</p>
        <p>In our study, we used a submodular pick [<xref ref-type="bibr" rid="ref27">27</xref>] instead of a random pick to select a diverse, representative set of samples from the test set for nonredundant explanations. For these samples, we then obtained the class probabilities, and the representative individuals were assigned with and average weight contributed by each feature to display how the classifier made a decision. Finally, we went over all these LIME results together with the endocrinologists to decide whether we should trust the results of the model.</p>
        <p>All computation and visualization were performed in Python [<xref ref-type="bibr" rid="ref19">19</xref>] using packages like Scikit-learn, Pandas, Lime, and Matplotlib.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Training and validation process of prediction models. AUC: area under receiver operating characteristic; XGBoost: extreme gradient boosting.</p>
          </caption>
          <graphic xlink:href="medinform_v7i1e11728_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Subject Characteristics</title>
        <p>Among the 1757 girls included in our study, 966 were positive for the GnRHa-stimulation test and diagnosed with CPP; the remaining 791 girls showed a negative response to the test. As shown in <xref ref-type="table" rid="table1">Table 1</xref>, 16 of the 19 variables were significantly higher in the CPP group than in the non-CPP group (<italic>P</italic>&lt;.05), whereas prolactin, BMI, and pigmentation were similar in both groups.</p>
      </sec>
      <sec>
        <title>Evaluation for Models</title>
        <p>First, we developed prediction models with the data of 19 clinical and laboratory variables (<xref ref-type="table" rid="table1">Table 1</xref>) from all 1757 patients. Two machine learning algorithms, XGBoost and random forest classifiers, were used, and parameters with the best AUC were selected for each model. The performance as well as the selected parameters of the models are listed in <xref ref-type="table" rid="table2">Table 2</xref>, and their receiver operating characteristic (ROC) curves are plotted in <xref ref-type="fig" rid="figure2">Figure 2</xref>. The performance was evaluated on the 20 test sets split with MCCV. Both models had strong prediction powers, with a specificity of ≥84.32%, a sensitivity of ≥77.91%, and an AUC of ≥0.88. The XGBoost classifier is slightly more effective than the random forest classifier, especially in terms of the specificity (<italic>P</italic>&lt;.01), whereas random forest is much more efficient in terms of the computation speed with less model complexity.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Basic characteristics of girls who underwent the GnRHa-stimulation test.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="430"/>
            <col width="250"/>
            <col width="220"/>
            <col width="100"/>
            <thead>
              <tr valign="bottom">
                <td>Variables</td>
                <td>Non-CPP<sup>a</sup> (n=966), mean (SD)</td>
                <td>CPP (n=791), mean (SD)</td>
                <td><italic>P</italic> value<sup>b</sup></td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Age (years)</td>
                <td>7.07 (1.11)</td>
                <td>7.52 (0.99)</td>
                <td>&lt;.001</td>
              </tr>
              <tr valign="top">
                <td>LH<sup>c</sup> (IU/L)</td>
                <td>0.12 (0.23)</td>
                <td>0.93 (1.28)</td>
                <td>&lt;.001</td>
              </tr>
              <tr valign="top">
                <td>FSH<sup>d</sup> (IU/L)</td>
                <td>1.82 (1.30)</td>
                <td>3.01 (1.62)</td>
                <td>&lt;.001</td>
              </tr>
              <tr valign="top">
                <td>GH<sup>e</sup> (ng/mL)</td>
                <td>3.27 (3.26)</td>
                <td>4.75 (4.69)</td>
                <td>&lt;.001</td>
              </tr>
              <tr valign="top">
                <td>IGF-I<sup>f</sup> (ng/mL)</td>
                <td>231.35 (65.93)</td>
                <td>317.87 (89.84)</td>
                <td>&lt;.001</td>
              </tr>
              <tr valign="top">
                <td>IGFBP-3<sup>g</sup> (μg/mL)</td>
                <td>4.55 (0.52)</td>
                <td>4.81 (0.55)</td>
                <td>&lt;.001</td>
              </tr>
              <tr valign="top">
                <td>Estradiol (pmol/L)</td>
                <td>102.56 (50.96)</td>
                <td>125.81 (60.97)</td>
                <td>&lt;.001</td>
              </tr>
              <tr valign="top">
                <td>Prolactin (ng/mL)</td>
                <td>8.73 (5.39)</td>
                <td>8.59 (5.61)</td>
                <td>.52</td>
              </tr>
              <tr valign="top">
                <td>Testosterone (nmol/L)</td>
                <td>0.80 (0.39)</td>
                <td>0.94 (0.49)</td>
                <td>&lt;.001</td>
              </tr>
              <tr valign="top">
                <td>History<sup>h</sup> (months)</td>
                <td>7.67 (10.39)</td>
                <td>9.27 (9.63)</td>
                <td>&lt;.001</td>
              </tr>
              <tr valign="top">
                <td>Menstruation/menarche (yes, no)</td>
                <td>N/A<sup>i</sup></td>
                <td>N/A</td>
                <td>.03</td>
              </tr>
              <tr valign="top">
                <td>Height<sup>j</sup> (cm)</td>
                <td>127.16 (8.61)</td>
                <td>131.61 (8.42)</td>
                <td>&lt;.001</td>
              </tr>
              <tr valign="top">
                <td>Weight<sup>j</sup> (kg)</td>
                <td>27.32 (5.32)</td>
                <td>29.60 (4.95)</td>
                <td>&lt;.001</td>
              </tr>
              <tr valign="top">
                <td>BMI<sup>k</sup> (kg/m<sup>2</sup>)</td>
                <td>16.73 (2.30)</td>
                <td>16.91 (1.96)</td>
                <td>.34</td>
              </tr>
              <tr valign="top">
                <td>Breast core (yes, no)</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>.02</td>
              </tr>
              <tr valign="top">
                <td>Pubes<sup>l</sup> (1-5)</td>
                <td>1.06 (0.27)</td>
                <td>1.14 (0.44)</td>
                <td>&lt;.001</td>
              </tr>
              <tr valign="top">
                <td>Pigmentation (yes, no)</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>.87</td>
              </tr>
              <tr valign="top">
                <td>Left breast<sup>l</sup> (1-5)</td>
                <td>2.33 (0.84)</td>
                <td>2.76 (0.92)</td>
                <td>&lt;.001</td>
              </tr>
              <tr valign="top">
                <td>Right breast<sup>l</sup> (1-5)</td>
                <td>2.32 (0.84)</td>
                <td>2.78 (0.92)</td>
                <td>&lt;.001</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>CPP: central precocious puberty.</p>
            </fn>
            <fn id="table1fn2">
              <p><sup>b</sup>The equality of each indicator was evaluated by Chi-square or Student  <italic>t</italic> test. <italic>P</italic>&lt;.05 was considered significant.</p>
            </fn>
            <fn id="table1fn3">
              <p><sup>c</sup>LH: luteinizing hormone.</p>
            </fn>
            <fn id="table1fn4">
              <p><sup>d</sup>FSH: follicle-stimulation hormone.</p>
            </fn>
            <fn id="table1fn5">
              <p><sup>e</sup>GH: growth hormone.</p>
            </fn>
            <fn id="table1fn6">
              <p><sup>f</sup>IGF-I: insulin-like growth factor-I.</p>
            </fn>
            <fn id="table1fn7">
              <p><sup>g</sup>IGFBP-3: insulin-like growth factor binding protein-3.</p>
            </fn>
            <fn id="table1fn8">
              <p><sup>h</sup>Abnormal duration in records.</p>
            </fn>
            <fn id="table1fn9">
              <p><sup>i</sup>N/A: not applicable.</p>
            </fn>
            <fn id="table1fn10">
              <p><sup>j</sup>At stimulation test.</p>
            </fn>
            <fn id="table1fn11">
              <p><sup>k</sup>BMI: body mass index.</p>
            </fn>
            <fn id="table1fn12">
              <p><sup>l</sup>Tanner stage.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Predictive performance of classifiers and the corresponding parameters. A paired <italic>t</italic> test was performed on specificity and sensitivity for comparison against XGBoost.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="170"/>
            <col width="150"/>
            <col width="150"/>
            <col width="110"/>
            <col width="390"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Algorithms/Variables</td>
                <td>Specificity<sup>a</sup> (%), <break/>mean (SD)</td>
                <td>Sensitivity<sup>b</sup> (%), <break/>mean (SD)</td>
                <td>AUC<sup>c</sup>, <break/>mean (SD)</td>
                <td>Parameters</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="6"><bold>19 variables, 1757 patients</bold></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>XGBoost<sup>d</sup></td>
                <td>85.39 (1.38)</td>
                <td>77.94 (3.50)</td>
                <td>0.89 (0.02)</td>
                <td>Learning rate=0.01, max depth=3, number of trees=500</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Random forest</td>
                <td>84.32 (1.88)<sup>e</sup></td>
                <td>77.91 (3.59)<sup>f</sup></td>
                <td>0.88 (0.02)</td>
                <td>Max depth=3, criterion=gini, number of trees=20</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>SVM<sup>g</sup></td>
                <td>88.94 (1.76)<sup>e</sup></td>
                <td>62.36 (4.12)<sup>e</sup></td>
                <td>0.86 (0.04)</td>
                <td>Kernel=linear, penalty coefficient=5</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Decision tree</td>
                <td>75.90 (2.47)<sup>e</sup></td>
                <td>71.71 (3.99)<sup>e</sup></td>
                <td>0.74 (0.02)</td>
                <td>Criterion=entropy</td>
              </tr>
              <tr valign="top">
                <td colspan="6"><bold>19 variables, 436 patients</bold></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>XGBoost</td>
                <td>83.17 (5.29)</td>
                <td>75.28 (6.43)</td>
                <td>0.86 (0.04)</td>
                <td>Learning rate=0.01, max depth=3, number of trees=500</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Random forest</td>
                <td>83.46 (6.28)<sup>f</sup></td>
                <td>74.72 (6.43)<sup>f</sup></td>
                <td>0.85 (0.04)</td>
                <td>Max depth=3, criterion=gini, number of trees=20</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>SVM</td>
                <td>88.94 (4.90)<sup>e</sup></td>
                <td>62.36 (7.73)<sup>e</sup></td>
                <td>0.86 (0.02)</td>
                <td>Kernel=linear, penalty coefficient=5</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Decision tree</td>
                <td>76.25 (7.07)<sup>e</sup></td>
                <td>68.06 (7.12)<sup>e</sup></td>
                <td>0.72 (0.04)</td>
                <td>Criterion=entropy</td>
              </tr>
              <tr valign="top">
                <td colspan="6"><bold>25 variables, 436 patients</bold></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>XGBoost<sup>d</sup></td>
                <td>87.66 (5.52)</td>
                <td>76.64 (6.51)</td>
                <td>0.90 (0.04)</td>
                <td>Learning rate=0.01, max depth=4, number of trees=500</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Random forest</td>
                <td>87.41 (4.22)<sup>f</sup></td>
                <td>75.03 (7.91)<sup>f</sup></td>
                <td>0.90 (0.05)</td>
                <td>Max depth=3, criterion=entropy, number of trees=20</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>SVM</td>
                <td>89.81 (4.28)<sup>f</sup></td>
                <td>66.53 (7.01)<sup>e</sup></td>
                <td>0.86 (0.02)</td>
                <td>Kernel=linear, penalty coefficient=5</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Decision tree</td>
                <td>76.35 (5.51)<sup>e</sup></td>
                <td>68.61 (7.16)<sup>e</sup></td>
                <td>0.72 (0.05)</td>
                <td>Criterion=entropy</td>
              </tr>
              <tr valign="top">
                <td colspan="6"><bold>1-3 variables, 1757 patients, XGBoost<sup>d</sup></bold></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>LH<sup>h</sup>, IGF-I<sup>i</sup>, FSH<sup>j</sup></td>
                <td>83.17 (1.62)</td>
                <td>76.39 (3.57)</td>
                <td>0.86 (0.02)</td>
                <td>Learning rate=0.01, max depth=3, number of trees=500</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>LH<sup>h</sup>, IGF-I<sup>i</sup></td>
                <td>83.27 (1.62)</td>
                <td>75.69 (3.61)</td>
                <td>0.86 (0.02)</td>
                <td>Learning rate=0.01, max depth=3, number of trees=500</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>LH<sup>h</sup>, FSH<sup>j</sup></td>
                <td>83.56 (1.94)</td>
                <td>75.83 (3.13)</td>
                <td>0.84 (0.02)</td>
                <td>Learning rate=0.01, max depth=3, number of trees=500</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>LH<sup>h</sup></td>
                <td>83.37 (2.00)</td>
                <td>75.97 (3.74)</td>
                <td>0.84 (0.02)</td>
                <td>Learning rate=0.01, max depth=3, number of trees=500</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>IGF-I<sup>i</sup>, FSH<sup>j</sup></td>
                <td>80.77 (2.47)</td>
                <td>57.08 (3.29)</td>
                <td>0.77 (0.02)</td>
                <td>Learning rate=0.01, max depth=3, number of trees=500</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>IGF-I<sup>i</sup></td>
                <td>80.19 (3.14)</td>
                <td>53.19 (4.55)</td>
                <td>0.73 (0.02)</td>
                <td>Learning rate=0.01, max depth=3, number of trees=500</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>FSH<sup>j</sup></td>
                <td>84.13 (3.87)</td>
                <td>45.00 (5.34)</td>
                <td>0.68 (0.02)</td>
                <td>Learning rate=0.01, max depth=3, number of trees=500</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>Specificity=number of true negatives/(number of true negatives+number of false positives).</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>Sensitivity=number of true positives/(number of true positives+number of false negatives).</p>
            </fn>
            <fn id="table2fn3">
              <p><sup>c</sup>AUC, area under the receiver operating curve.</p>
            </fn>
            <fn id="table2fn4">
              <p><sup>d</sup>XGBoost: extreme gradient boosting.</p>
            </fn>
            <fn id="table2fn5">
              <p><sup>e</sup><italic>P</italic>&lt;.01</p>
            </fn>
            <fn id="table2fn6">
              <p><sup>f</sup>Not significant.</p>
            </fn>
            <fn id="table2fn7">
              <p><sup>g</sup>SVM: supported vector machines.</p>
            </fn>
            <fn id="table2fn8">
              <p><sup>h</sup>LH: luteinizing hormone.</p>
            </fn>
            <fn id="table2fn9">
              <p><sup>i</sup>IGF-I: insulin-like growth factor-I.</p>
            </fn>
            <fn id="table2fn10">
              <p><sup>j</sup>FSH: follicle-stimulation hormone.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>In the data set, 436 girls had additional examination reports, and we extracted six variables from these reports (see Population and Variables subsection). To investigate whether adding image features could enhance the prediction efficiency, we combined the six variables with the 19 variables and trained and evaluated both the XGBoost and random forest models on the 436 samples, of which 180 patients belonged to the CPP group and 256 belonged to the non-CPP group. For the ease of comparison, we retrained the previous 19-variable models with the 436 samples. As shown in <xref ref-type="table" rid="table2">Table 2</xref>, the reduction in sample size led to a serious decline in model performance, whereas the addition of six image features improved their performance. Specifically, for XGBoost in 436 samples, the specificity increased from 83.17% for 19 variables to 87.66% for 25 variables, the sensitivity increased from 75.28% to 76.64%, and the AUC increased from 0.86 to 0.90. For random forest in 436 samples with 25 variables, the specificity increased from 83.46% to 87.41%, the sensitivity increased from 74.72% to 75.03%, and the AUC increased from 0.86 to 0.90 compared to the results from 436 samples with 19 variables. Similarly, as seen in the ROC curves shown in <xref ref-type="fig" rid="figure2">Figure 2</xref>, XGBoost performed slightly better than the random forest classifier.</p>
        <p>To compare performance between ensemble models and nonensemble models, the SVM and decision tree classifiers were used to develop predictive models for the abovementioned settings. Higher specificities were achieved with the SVM models. However, sensitivities for the SVM models were much lower than those for the ensembles models. The decision tree models demonstrated significantly inferior performance in terms of almost all the sensitivities, specificities, and AUCs. These results suggest that the ensemble models are able to yield excellent performance while maintaining a good balance between sensitivity and specificity in the prediction of CPP.</p>
      </sec>
      <sec>
        <title>Feature Importance</title>
        <p>We computed the feature importance score for all the 19 variables to identify important features used by the models. The importance of each feature calculated by the models is plotted in <xref ref-type="fig" rid="figure3">Figure 3</xref>. In both models, the most important predictive variable was LH level, followed by IGF-I and FSH levels. The fourth most important feature for the random forest model was height, which ranked fifth in the XGBoost model. Prolactin is the fourth most important feature of XGBoost, but it contributed only a little to random forest. These data suggest that different machine learning algorithms attach importance to different combination lists of variables, although they yield similar predictive performance.</p>
        <p>In order to further verify the importance of the top 3 features, we constructed XGBoost models with these features individually or in combination (<xref ref-type="table" rid="table2">Table 2</xref>). As expected, the models using one, two, or three features had poorer performances than the models using all features. The results showed that the higher the feature ranked, the better the corresponding model performed. Interestingly, LH alone or together with IGF-I and FSH is sufficient to predict a response to the GnRHa test with a fairly good performance and an AUC between 0.84 and 0.86. These data support the results from the feature importance calculations.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>ROC curves for classifiers with 19 variables for 1757 patients and 25 variables for 436 patients. ROC: receiver operating curve; AUC: area under ROC.</p>
          </caption>
          <graphic xlink:href="medinform_v7i1e11728_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Feature importance ranking for 19 variables in two classifiers calculated by the models. LH: luteinizing hormone; IGF-I: insulin-like growth factor-I; FSH: follicle-stimulation hormone; PRL: prolactin; GH: growth hormone; E2: estradiol; BMI: body mass index; TTE: testosterone; Rbreast: right breast; Lbreast: left breast; IGFBP-3: insulin-like growth factor binding protein-3; PMT: pigmentation; MST: menstruation.</p>
          </caption>
          <graphic xlink:href="medinform_v7i1e11728_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Local Interpretable Model-Agnostic Explanations for Interpretation</title>
        <p>A representative set of 200 samples, which accounted for more than 50% of the test set and were enough to be the budget size of individual instances to understand a model, were selected with the submodular pick method [<xref ref-type="bibr" rid="ref27">27</xref>] for the 19-variable models. LIME was then applied to investigate feature contributions for each prediction. Results with top 9 features are presented in <xref ref-type="fig" rid="figure4">Figure 4</xref> for one positive sample and one negative sample (more representative samples can be seen in <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref>). In <xref ref-type="fig" rid="figure4">Figure 4</xref>, XGBoost predicts an instance where CPP positively responds to the GnRHa test with a probability of 90%. Only the feature growth hormone supports the negative prediction, whereas LH, prolactin, IGF-I, and information about body development support the positive prediction. This makes sense in the clinical diagnosis of CPP and reveals that we can trust our prediction models to a certain extent. In <xref ref-type="fig" rid="figure4">Figure 4</xref>, left and right breast at Tanner stage 3, FSH level &gt; 2 IU/L, and several other features support the positive prediction with a probability of 16%. LH level of 0.07 IU/L, prolactin level &gt; 9.53 ng/mL, IGF-I level &gt; 220 ng/mL, and age &lt; 7 years contribute to the negative prediction with a probability of 84%. Similar results are observed in <xref ref-type="fig" rid="figure4">Figure 4</xref>.</p>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>Results of LIME with XGBoost and Random Forest classifiers applied to one positive (A, B) and one negative (C, D) instance. The left sides are for XGBoost, and the right for Random Forest. Blue color is for the negative instance and orange is for the positive instance. The first column represents the prediction probabilities of negative and positive results achieved from classifiers. The second column shows the features’ contributions to the probability. Only the top nine features are displayed for clarity. The third column displays the original data values. LIME: local interpretable model-agnostic explanations; XGBoost: extreme gradient boosting; LH: luteinizing hormone; IGF-I: insulin-like growth factor-I; FSH: follicle-stimulation hormone; PRL: prolactin; GH: growth hormone; E2: estradiol; BMI: body mass index; TTE: testosterone; Rbreast: right breast; Lbreast: left breast; IGFBP-3: insulin-like growth factor binding protein-3; PMT: pigmentation; MST: menstruation; PMT: pigmentation.</p>
          </caption>
          <graphic xlink:href="medinform_v7i1e11728_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Overview</title>
        <p>CPP mimics pubertal development ahead of time at an inappropriate chronological age. It requires timely detection and treatment in case of physical and physiological effect on girls. The GnRHa-stimulation test is expensive and time consuming and causes discomfort to patients. Here, we applied machine learning algorithms to multiple clinical variables and built two tree-based ensemble learning classifiers for the prediction of response to the GnRHa-stimulation test. Both the XGBoost and random forest models achieved good performance in distinguishing between positive and negative responses, with the AUC ranging from 0.88 to 0.90, the sensitivity ranging from 77.91% to 77.94%, and the specificity ranging from 84.32% to 87.66%.</p>
      </sec>
      <sec>
        <title>Comparisons with Previous Models</title>
        <p>Several previous models focused on determining optimal blood sampling time points or appropriate cut-off values to simplify the stimulation test. Kandemir et al [<xref ref-type="bibr" rid="ref29">29</xref>] found that a single sample of LH tested at the 40th minute after stimulation with a cut-off of 5 IU/L could yield 98% sensitivity and 100% specificity in the diagnosis of CPP. Yazdani et al [<xref ref-type="bibr" rid="ref30">30</xref>] showed that an LH concentration &gt; 5 IU/L at 3 hours has optimal sensitivity (83%) and specificity (97%). In the study of Çatlı et al [<xref ref-type="bibr" rid="ref7">7</xref>], 100% sensitivity and 84% specificity were obtained using a cut-off value &gt; 0.24 for peak LH/FSH ratio in girls. Although these models performed better than our models, they had to be used after stimulation and therefore could not avoid the disadvantages of the GnRH/GnRHa test completely.</p>
        <p>Some models used only the basal sex hormone level. Yazdani et al [<xref ref-type="bibr" rid="ref30">30</xref>] found that a basal LH level of &gt;0.1 IU/L, a basal LH/FSH ratio &gt;1, and basal estradiol level ≥1.5 ng/dL in girls have low sensitivity (10%-67%) but excellent specificity (94%-100%). Çatlı et al [<xref ref-type="bibr" rid="ref7">7</xref>] also reported models with the basal FSH or LH levels and achieved a sensitivity of 71% and a specificity of 68% or 64%. Pasternak et al [<xref ref-type="bibr" rid="ref3">3</xref>] reported that basal LH levels ≤ 0.1 IU/L were sufficient to rule out positive response to the GnRH test with a specificity of 94% but a sensitivity of only 64% in girls. In another model [<xref ref-type="bibr" rid="ref4">4</xref>], the basal LH level with a cut-off value of 0.35 IU/L was associated with a sensitivity of 63.96% and a specificity of 76.3% based on the ROC with an AUC of 0.77. These results varied a lot due to the different settings and sample sizes. In this study, our models showed better performance with more features before stimulation and a larger homogeneous population, which is the largest population in such a study to our knowledge.</p>
      </sec>
      <sec>
        <title>Predictive Features</title>
        <p>Based on our machine learning models, basal LH, IGF-I, and FSH levels are predictive factors with top ranks for the feature importance in both models. Previous studies have demonstrated that the measurement of LH could be better than that of other sex hormones for initial evaluation of suspected puberty [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref8">8</xref>]. In our study, the LH level ranked first and was much more important than other variables. Besides LH, another indicator monitored in the stimulation test, FSH, was also selected by the models as the third most–important variable. Obviously, LH and FSH are important to CPP because they are biomarkers of the hypothalamic-pituitary-gonadal axis activation, which is the essence of CPP. IGF-I, which is the second most important variable in our models, is reportedly involved in GnRH regulation [<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref32">32</xref>] and is increasingly expressed in girls with CPP [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref5">5</xref>]. Animal studies showed that the IGF-I signaling pathways play important roles in the timing of puberty in girls [<xref ref-type="bibr" rid="ref32">32</xref>]. Although IGF-I has not been considered in previous models, our study suggests that IGF-I may be a valuable marker for diagnosing CPP.</p>
        <p>Several studies [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref34">34</xref>] suggested that image reports like pelvic ultrasound and radiography of the hand have adjunct diagnostic values in CPP diagnosis but provide no reliable differentiation alone. Here, we found that adding features from the image reports improved the prediction results. Performance of models built based on 1757 samples was better than that based on 436 samples, suggesting a sample size effect. Interestingly, in the case of 436 samples with additional six image variables, the aforementioned sample size effect was balanced. This suggests that more samples with image features will produce better results. Thus, medical image examinations like bone age radiography should be considered before the GnRHa-stimulation test for girls with suspected CPP.</p>
      </sec>
      <sec>
        <title>Interpretations of Models</title>
        <p>We noticed that more variables were assigned with a moderate value of feature importance in the XGBoost model than those in the random forest model. This is reasonable when considering the different algorithms the two models used for prediction and importance evaluation. In XGBoost, trees are sequentially built in a boosting manner to enhance the overall performance. The estimates of feature importance are provided explicitly with the frequency that the feature is selected as a tree node from a trained predictive model. In contrast, trees are trained parallelly in a bootstrapping way in random forest to vote for the final decision. The feature importance is estimated implicitly through permuting the feature’s values and calculating the change of the model’s prediction error. Obviously, XGBoost includes each contribution of each feature to each tree into the feature importance, whereas random forest only evaluates each feature globally without specific contributions. It should be noted that different combinations of variables may produce models with similar predictive accuracy, relating to the uncertainty analysis of the solutions in any decision-making problem [<xref ref-type="bibr" rid="ref35">35</xref>-<xref ref-type="bibr" rid="ref37">37</xref>]. This is not rare in machine learning models in medicine [<xref ref-type="bibr" rid="ref38">38</xref>-<xref ref-type="bibr" rid="ref40">40</xref>]. Moreover, the most important features in the clinic such as basal LH, IGF-I, and FSH levels were all sorted out by both models, demonstrating that they are both reliable and effective in predicting response to the GnRHa test.</p>
        <p>In order to provide endocrinology physicians a trustworthy insight into the prediction models, we also used LIME to show each feature’s contribution to predicting probabilities reasonably. The most important features used by the models for individual prediction have been proven to be significant in the clinic [<xref ref-type="bibr" rid="ref3">3</xref>-<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>], demonstrating that our models are credible. This will greatly increase the interpretability of the machine learning models and make it convenient for individualized diagnosis in the clinic.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>There are some limitations to this study. First, growth velocity is specially related to physical development. Due to the lack of height growth rate and weight growth rate, we did not include growth velocity in our feature set. For further research, we will focus more on medical imaging and growth velocity to identify their diagnostic value with CPP. Second, our work included only girls with suspected CPP from a single center in China. The prediction models in this study may not be suitable for the population in other districts or countries. Third, manual inspection of values extracted through regular expression matching from free text could reduce errors to improve the model performance. However, this adds a considerable amount of work and thus reduces the scalability of the model. We are improving the matching algorithm with the manually inspected data to increase the level of model automation. Finally, features generated from laboratory results are more complete than those extracted from free text, which may affect the rank of feature importance. More efforts are required to enhance the data quality of unstructured features in the future.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>Our study is the first one to apply both machine learning algorithms and the explanation method to the diagnosis of CPP. Our models can predict the response to the stimulation test before injection of GnRHa in girls who are suspected of having CPP and thus may be used as a prescreening tool to help physicians make decisions in conjunction with the GnRHa-stimulation test.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <app id="app1">
        <title>Multimedia Appendix 1</title>
        <p>Results of LIME with XGBoost and Random Forest classifiers applied to four positive and four negative instances. LIME: local interpretable model-agnostic explanations.</p>
        <media xlink:href="medinform_v7i1e11728_app1.pdf" xlink:title="PDF File (Adobe PDF File), 267KB"/>
      </app>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AUC</term>
          <def>
            <p>area under receiver operating characteristic</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">BMI</term>
          <def>
            <p>body mass index</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">CPP</term>
          <def>
            <p>central precocious puberty </p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">FSH</term>
          <def>
            <p>follicle-stimulation hormone</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">GnRH</term>
          <def>
            <p>gonadotropin releasing hormone </p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">GnRHa</term>
          <def>
            <p>gonadotropin releasing hormone analogues </p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">IGF-I</term>
          <def>
            <p>insulin-like growth factor-I</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">IGFBP-3</term>
          <def>
            <p>insulin-like growth factor binding protein-3 </p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">LH</term>
          <def>
            <p>luteinizing hormone </p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">LIME</term>
          <def>
            <p>local interpretable model-agnostic explanations</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">MCCV</term>
          <def>
            <p>Monte Carlo cross-validation </p>
          </def>
        </def-item>
        <def-item>
          <term id="abb12">OOB</term>
          <def>
            <p>out-of-bag </p>
          </def>
        </def-item>
        <def-item>
          <term id="abb13">ROC</term>
          <def>
            <p> receiver operating characteristic</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb14">SVM</term>
          <def>
            <p>supported vector machines </p>
          </def>
        </def-item>
        <def-item>
          <term id="abb15">XGBoost</term>
          <def>
            <p>extreme gradient boosting </p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This work was supported by Guangzhou Institute of Pediatrics, Guangzhou Women and Children’s Medical Center (Grant #KCP-2016-002).</p>
    </ack>
    <fn-group>
      <fn fn-type="con">
        <p>HL and XL proposed the project and provided supervision. LP is responsible for data collection, project implementation, and manuscript drafting and revision. GL implemented the project and performed manuscript editing. XM provided clinical guidance and revised the manuscript. HL conducted part of the data collection and statistical analysis. JZ helped collect part of the data. All authors reviewed the manuscript in its final form.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Abreu</surname>
            <given-names>AP</given-names>
          </name>
          <name name-style="western">
            <surname>Kaiser</surname>
            <given-names>UB</given-names>
          </name>
        </person-group>
        <article-title>Pubertal development and regulation</article-title>
        <source>Lancet Diabetes Endocrinol</source>  
        <year>2016</year>  
        <month>03</month>  
        <volume>4</volume>  
        <issue>3</issue>  
        <fpage>254</fpage>  
        <lpage>264</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/26852256"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1016/S2213-8587(15)00418-0</pub-id>
        <pub-id pub-id-type="medline">26852256</pub-id>
        <pub-id pub-id-type="pii">S2213-8587(15)00418-0</pub-id>
        <pub-id pub-id-type="pmcid">PMC5192018</pub-id></nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Houk</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Kunselman</surname>
            <given-names>Allen R</given-names>
          </name>
          <name name-style="western">
            <surname>Lee</surname>
            <given-names>Peter A</given-names>
          </name>
        </person-group>
        <article-title>The diagnostic value of a brief GnRH analogue stimulation test in girls with central precocious puberty: a single 30-minute post-stimulation LH sample is adequate</article-title>
        <source>J Pediatr Endocrinol Metab</source>  
        <year>2008</year>  
        <month>12</month>  
        <volume>21</volume>  
        <issue>12</issue>  
        <fpage>1113</fpage>  
        <lpage>8</lpage>  
        <pub-id pub-id-type="medline">19189683</pub-id></nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Pasternak</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Friger</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Loewenthal</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Haim</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Hershkovitz</surname>
            <given-names>E</given-names>
          </name>
        </person-group>
        <article-title>The utility of basal serum LH in prediction of central precocious puberty in girls</article-title>
        <source>Eur J Endocrinol</source>  
        <year>2012</year>  
        <month>02</month>  
        <volume>166</volume>  
        <issue>2</issue>  
        <fpage>295</fpage>  
        <lpage>9</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://www.eje-online.org/cgi/pmidlookup?view=long&amp;pmid=22084156"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1530/EJE-11-0720</pub-id>
        <pub-id pub-id-type="medline">22084156</pub-id>
        <pub-id pub-id-type="pii">EJE-11-0720</pub-id></nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Ding</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Li</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Yu</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Yang</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Li</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Shen</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Huang</surname>
            <given-names>X</given-names>
          </name>
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>S</given-names>
          </name>
        </person-group>
        <article-title>Evaluation of basal sex hormone levels for activation of the hypothalamic-pituitary-gonadal axis</article-title>
        <source>J Pediatr Endocrinol Metab</source>  
        <year>2018</year>  
        <month>03</month>  
        <day>28</day>  
        <volume>31</volume>  
        <issue>3</issue>  
        <fpage>323</fpage>  
        <lpage>329</lpage>  
        <pub-id pub-id-type="doi">10.1515/jpem-2017-0124</pub-id>
        <pub-id pub-id-type="medline">29466239</pub-id>
        <pub-id pub-id-type="pii">/j/jpem.ahead-of-print/jpem-2017-0124/jpem-2017-0124.xml</pub-id></nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Sørensen</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Aksglaede</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Petersen</surname>
            <given-names>JH</given-names>
          </name>
          <name name-style="western">
            <surname>Andersson</surname>
            <given-names>AM</given-names>
          </name>
          <name name-style="western">
            <surname>Juul</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <article-title>Serum IGF1 and insulin levels in girls with normal and precocious puberty</article-title>
        <source>Eur J Endocrinol</source>  
        <year>2012</year>  
        <month>05</month>  
        <volume>166</volume>  
        <issue>5</issue>  
        <fpage>903</fpage>  
        <lpage>10</lpage>  
        <pub-id pub-id-type="doi">10.1530/EJE-12-0106</pub-id>
        <pub-id pub-id-type="medline">22379117</pub-id>
        <pub-id pub-id-type="pii">EJE-12-0106</pub-id></nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Houk</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Kunselman</surname>
            <given-names>AR</given-names>
          </name>
          <name name-style="western">
            <surname>Lee</surname>
            <given-names>PA</given-names>
          </name>
        </person-group>
        <article-title>Adequacy of a single unstimulated luteinizing hormone level to diagnose central precocious puberty in girls</article-title>
        <source>Pediatrics</source>  
        <year>2009</year>  
        <month>06</month>  
        <volume>123</volume>  
        <issue>6</issue>  
        <fpage>e1059</fpage>  
        <lpage>63</lpage>  
        <pub-id pub-id-type="doi">10.1542/peds.2008-1180</pub-id>
        <pub-id pub-id-type="medline">19482738</pub-id>
        <pub-id pub-id-type="pii">123/6/e1059</pub-id></nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Çatlı</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Erdem</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Anık</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Abacı</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Böber</surname>
            <given-names>E</given-names>
          </name>
        </person-group>
        <article-title>Clinical and laboratory findings in the differential diagnosis of central precocious puberty and premature thelarche</article-title>
        <source>Turk Pediatri Ars</source>  
        <year>2015</year>  
        <month>03</month>  
        <volume>50</volume>  
        <issue>1</issue>  
        <fpage>20</fpage>  
        <lpage>6</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/26078693"/>
        </comment>  
        <pub-id pub-id-type="doi">10.5152/tpa.2015.2281</pub-id>
        <pub-id pub-id-type="medline">26078693</pub-id>
        <pub-id pub-id-type="pii">tpa-50-1-20</pub-id>
        <pub-id pub-id-type="pmcid">PMC4462323</pub-id></nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Mogensen</surname>
            <given-names>SS</given-names>
          </name>
          <name name-style="western">
            <surname>Aksglaede</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Mouritsen</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Sørensen</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Main</surname>
            <given-names>KM</given-names>
          </name>
          <name name-style="western">
            <surname>Gideon</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Juul</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <article-title>Diagnostic work-up of 449 consecutive girls who were referred to be evaluated for precocious puberty</article-title>
        <source>J Clin Endocrinol Metab</source>  
        <year>2011</year>  
        <month>05</month>  
        <volume>96</volume>  
        <issue>5</issue>  
        <fpage>1393</fpage>  
        <lpage>401</lpage>  
        <pub-id pub-id-type="doi">10.1210/jc.2010-2745</pub-id>
        <pub-id pub-id-type="medline">21346077</pub-id>
        <pub-id pub-id-type="pii">jc.2010-2745</pub-id></nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Nam</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Rhie</surname>
            <given-names>YJ</given-names>
          </name>
          <name name-style="western">
            <surname>Son</surname>
            <given-names>CS</given-names>
          </name>
          <name name-style="western">
            <surname>Park</surname>
            <given-names>SH</given-names>
          </name>
          <name name-style="western">
            <surname>Lee</surname>
            <given-names>K</given-names>
          </name>
        </person-group>
        <article-title>Factors to predict positive results of gonadotropin releasing hormone stimulation test in girls with suspected precocious puberty</article-title>
        <source>J Korean Med Sci</source>  
        <year>2012</year>  
        <month>02</month>  
        <volume>27</volume>  
        <issue>2</issue>  
        <fpage>194</fpage>  
        <lpage>9</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://jkms.org/DOIx.php?id=10.3346/jkms.2012.27.2.194"/>
        </comment>  
        <pub-id pub-id-type="doi">10.3346/jkms.2012.27.2.194</pub-id>
        <pub-id pub-id-type="medline">22323868</pub-id>
        <pub-id pub-id-type="pmcid">PMC3271294</pub-id></nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Suh</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Choi</surname>
            <given-names>MH</given-names>
          </name>
          <name name-style="western">
            <surname>Kwon</surname>
            <given-names>AR</given-names>
          </name>
          <name name-style="western">
            <surname>Kim</surname>
            <given-names>YJ</given-names>
          </name>
          <name name-style="western">
            <surname>Jeong</surname>
            <given-names>JW</given-names>
          </name>
          <name name-style="western">
            <surname>Ahn</surname>
            <given-names>JM</given-names>
          </name>
          <name name-style="western">
            <surname>Chae</surname>
            <given-names>HW</given-names>
          </name>
          <name name-style="western">
            <surname>Kim</surname>
            <given-names>DH</given-names>
          </name>
          <name name-style="western">
            <surname>Kim</surname>
            <given-names>H</given-names>
          </name>
        </person-group>
        <article-title>Factors that predict a positive response on gonadotropin-releasing hormone stimulation test for diagnosing central precocious puberty in girls</article-title>
        <source>Ann Pediatr Endocrinol Metab</source>  
        <year>2013</year>  
        <month>12</month>  
        <volume>18</volume>  
        <issue>4</issue>  
        <fpage>202</fpage>  
        <lpage>7</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://e-apem.org/journal/view.php?doi=10.6065/apem.2013.18.4.202"/>
        </comment>  
        <pub-id pub-id-type="doi">10.6065/apem.2013.18.4.202</pub-id>
        <pub-id pub-id-type="medline">24904878</pub-id>
        <pub-id pub-id-type="pmcid">PMC4027085</pub-id></nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Xu</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Li</surname>
            <given-names>GM</given-names>
          </name>
          <name name-style="western">
            <surname>Li</surname>
            <given-names>Y</given-names>
          </name>
        </person-group>
        <article-title>Advanced bone age as an indicator facilitates the diagnosis of precocious puberty</article-title>
        <source>J Pediatr (Rio J)</source>  
        <year>2018</year>  
        <volume>94</volume>  
        <issue>1</issue>  
        <fpage>69</fpage>  
        <lpage>75</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0021-7557(16)30375-8"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1016/j.jped.2017.03.010</pub-id>
        <pub-id pub-id-type="medline">28866322</pub-id>
        <pub-id pub-id-type="pii">S0021-7557(16)30375-8</pub-id></nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Lee</surname>
            <given-names>SH</given-names>
          </name>
          <name name-style="western">
            <surname>Joo</surname>
            <given-names>EY</given-names>
          </name>
          <name name-style="western">
            <surname>Lee</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Jun</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Kim</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>The Diagnostic Value of Pelvic Ultrasound in Girls with Central Precocious Puberty</article-title>
        <source>Chonnam Med J</source>  
        <year>2016</year>  
        <month>01</month>  
        <volume>52</volume>  
        <issue>1</issue>  
        <fpage>70</fpage>  
        <lpage>4</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://cmj.ac.kr/DOIx.php?id=10.4068/cmj.2016.52.1.70"/>
        </comment>  
        <pub-id pub-id-type="doi">10.4068/cmj.2016.52.1.70</pub-id>
        <pub-id pub-id-type="medline">26866003</pub-id>
        <pub-id pub-id-type="pmcid">PMC4742613</pub-id></nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Lee</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Choi</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Fan</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Jang</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Kim</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Hwang</surname>
            <given-names>C</given-names>
          </name>
        </person-group>
        <article-title>Evaluation of characteristics of the craniofacial complex and dental maturity in girls with central precocious puberty</article-title>
        <source>Angle Orthod</source>  
        <year>2018</year>  
        <month>04</month>  
        <day>30</day>  
        <pub-id pub-id-type="doi">10.2319/112317-809.1</pub-id>
        <pub-id pub-id-type="medline">29708396</pub-id></nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Baik</surname>
            <given-names>JS</given-names>
          </name>
          <name name-style="western">
            <surname>Choi</surname>
            <given-names>JW</given-names>
          </name>
          <name name-style="western">
            <surname>Kim</surname>
            <given-names>SJ</given-names>
          </name>
          <name name-style="western">
            <surname>Kim</surname>
            <given-names>JH</given-names>
          </name>
          <name name-style="western">
            <surname>Kim</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Kim</surname>
            <given-names>JH</given-names>
          </name>
        </person-group>
        <article-title>Predictive Value of Dental Maturity for a Positive Gonadotropin-Releasing Hormone Stimulation Test Result in Girls with Precocious Puberty</article-title>
        <source>J Korean Med Sci</source>  
        <year>2017</year>  
        <month>02</month>  
        <volume>32</volume>  
        <issue>2</issue>  
        <fpage>296</fpage>  
        <lpage>302</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://jkms.org/DOIx.php?id=10.3346/jkms.2017.32.2.296"/>
        </comment>  
        <pub-id pub-id-type="doi">10.3346/jkms.2017.32.2.296</pub-id>
        <pub-id pub-id-type="medline">28049241</pub-id>
        <pub-id pub-id-type="pii">32.296</pub-id>
        <pub-id pub-id-type="pmcid">PMC5219996</pub-id></nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <collab>Subspecialty Group of Endocrinologic‚ Hereditary and Metabolic Diseases‚ the Society of Pediatrics‚ Chinese Medical Association</collab>
          <collab>Editorial Board‚ Chinese Journal of Pediatrics</collab>
        </person-group>
        <article-title>[Consensus statement For the diagnosis and treatment of central precocious puberty (2015)]</article-title>
        <source>Zhonghua Er Ke Za Zhi</source>  
        <year>2015</year>  
        <month>06</month>  
        <volume>53</volume>  
        <issue>6</issue>  
        <fpage>412</fpage>  
        <lpage>8</lpage>  
        <pub-id pub-id-type="medline">26310550</pub-id></nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Carel</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Eugster</surname>
            <given-names>EA</given-names>
          </name>
          <name name-style="western">
            <surname>Rogol</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Ghizzoni</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Palmert</surname>
            <given-names>MR</given-names>
          </name>
          <collab>ESPE-LWPES GnRH Analogs Consensus Conference Group</collab>
          <name name-style="western">
            <surname>Antoniazzi</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Berenbaum</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Bourguignon</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Chrousos</surname>
            <given-names>GP</given-names>
          </name>
          <name name-style="western">
            <surname>Coste</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Deal</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>de</surname>
            <given-names>VL</given-names>
          </name>
          <name name-style="western">
            <surname>Foster</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Heger</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Holland</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Jahnukainen</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Juul</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Kaplowitz</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Lahlou</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Lee</surname>
            <given-names>MM</given-names>
          </name>
          <name name-style="western">
            <surname>Lee</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Merke</surname>
            <given-names>DP</given-names>
          </name>
          <name name-style="western">
            <surname>Neely</surname>
            <given-names>EK</given-names>
          </name>
          <name name-style="western">
            <surname>Oostdijk</surname>
            <given-names>W</given-names>
          </name>
          <name name-style="western">
            <surname>Phillip</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Rosenfield</surname>
            <given-names>RL</given-names>
          </name>
          <name name-style="western">
            <surname>Shulman</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Styne</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Tauber</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Wit</surname>
            <given-names>JM</given-names>
          </name>
        </person-group>
        <article-title>Consensus statement on the use of gonadotropin-releasing hormone analogs in children</article-title>
        <source>Pediatrics</source>  
        <year>2009</year>  
        <month>04</month>  
        <volume>123</volume>  
        <issue>4</issue>  
        <fpage>e752</fpage>  
        <lpage>62</lpage>  
        <pub-id pub-id-type="doi">10.1542/peds.2008-1783</pub-id>
        <pub-id pub-id-type="medline">19332438</pub-id>
        <pub-id pub-id-type="pii">peds.2008-1783</pub-id></nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Ibáñez</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Potau</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Zampolli</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Virdis</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Gussinyé</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Carrascosa</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Saenger</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Vicens-Calvet</surname>
            <given-names>E</given-names>
          </name>
        </person-group>
        <article-title>Use of leuprolide acetate response patterns in the early diagnosis of pubertal disorders: comparison with the gonadotropin-releasing hormone test</article-title>
        <source>J Clin Endocrinol Metab</source>  
        <year>1994</year>  
        <month>01</month>  
        <volume>78</volume>  
        <issue>1</issue>  
        <fpage>30</fpage>  
        <lpage>5</lpage>  
        <pub-id pub-id-type="doi">10.1210/jcem.78.1.7507123</pub-id>
        <pub-id pub-id-type="medline">7507123</pub-id></nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Bayley</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Pinneau</surname>
            <given-names>SR</given-names>
          </name>
        </person-group>
        <article-title>Tables for predicting adult height from skeletal age: Revised for use with the greulich-pyle hand standards</article-title>
        <source>The Journal of Pediatrics</source>  
        <year>1952</year>  
        <month>4</month>  
        <volume>40</volume>  
        <issue>4</issue>  
        <fpage>423</fpage>  
        <lpage>441</lpage>  
        <pub-id pub-id-type="doi">10.1016/S0022-3476(52)80205-7</pub-id></nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="web">
        <source>Python</source>  
        <access-date>2019-01-22</access-date>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://www.python.org/">https://www.python.org/</ext-link>
          <ext-link ext-link-type="webcite" xlink:href="75cTVrNhZ"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Chen</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Guestrin</surname>
            <given-names>C</given-names>
          </name>
        </person-group>
        <article-title>XGBoost: A Scalable Tree Boosting System</article-title>
        <year>2016</year>  
        <month>08</month>  
        <day>13</day>  
        <conf-name>KDD '16 Proceedings of the 22nd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining</conf-name>
        <conf-date>August 13-17, 2016</conf-date>
        <conf-loc>San Francisco, CA, USA</conf-loc>
        <pub-id pub-id-type="doi">10.1145/2939672.2939785</pub-id></nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Torlay</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Perrone-Bertolotti</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Thomas</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Baciu</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Machine learning-XGBoost analysis of language networks to classify patients with epilepsy</article-title>
        <source>Brain Inform</source>  
        <year>2017</year>  
        <month>09</month>  
        <volume>4</volume>  
        <issue>3</issue>  
        <fpage>159</fpage>  
        <lpage>169</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://link.springer.com/article/10.1007/s40708-017-0065-7"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1007/s40708-017-0065-7</pub-id>
        <pub-id pub-id-type="medline">28434153</pub-id>
        <pub-id pub-id-type="pii">10.1007/s40708-017-0065-7</pub-id>
        <pub-id pub-id-type="pmcid">PMC5563301</pub-id></nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Yao</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Calhoun</surname>
            <given-names>VD</given-names>
          </name>
          <name name-style="western">
            <surname>Fu</surname>
            <given-names>Z</given-names>
          </name>
          <name name-style="western">
            <surname>Du</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Sui</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <article-title>An ensemble learning system for a 4-way classification of Alzheimer's disease and mild cognitive impairment</article-title>
        <source>J Neurosci Methods</source>  
        <year>2018</year>  
        <month>05</month>  
        <day>15</day>  
        <volume>302</volume>  
        <fpage>75</fpage>  
        <lpage>81</lpage>  
        <pub-id pub-id-type="doi">10.1016/j.jneumeth.2018.03.008</pub-id>
        <pub-id pub-id-type="medline">29578038</pub-id>
        <pub-id pub-id-type="pii">S0165-0270(18)30079-7</pub-id></nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Liaw</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Wiener</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <source>R News</source>  
        <year>2002</year>  
        <month>12</month>  
        <access-date>2019-01-22</access-date>
        <comment>Classification and regression by randomForest 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://cran.r-project.org/doc/Rnews/Rnews_2002-3.pdf">https://cran.r-project.org/doc/Rnews/Rnews_2002-3.pdf</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="75cYZwTh7"/></comment> </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Hearst</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Dumais</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Osuna</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Platt</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Scholkopf</surname>
            <given-names>B</given-names>
          </name>
        </person-group>
        <article-title>Support vector machines</article-title>
        <source>IEEE Intell Syst Their Appl</source>  
        <year>1998</year>  
        <month>7</month>  
        <day>10</day>  
        <volume>13</volume>  
        <issue>4</issue>  
        <fpage>18</fpage>  
        <lpage>28</lpage>  
        <pub-id pub-id-type="doi">10.1109/5254.708428</pub-id>
        <pub-id pub-id-type="medline">21889629</pub-id>
        <pub-id pub-id-type="pii">S0003-2670(11)00968-8</pub-id></nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Safavian</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Landgrebe</surname>
            <given-names>D</given-names>
          </name>
        </person-group>
        <article-title>A survey of decision tree classifier methodology</article-title>
        <source>IEEE Trans Syst Man Cybern</source>  
        <year>1991</year>  
        <volume>21</volume>  
        <issue>3</issue>  
        <fpage>660</fpage>  
        <lpage>674</lpage>  
        <pub-id pub-id-type="doi">10.1109/21.97458</pub-id></nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Xu</surname>
            <given-names>Q</given-names>
          </name>
          <name name-style="western">
            <surname>Liang</surname>
            <given-names>Y</given-names>
          </name>
        </person-group>
        <article-title>Monte Carlo cross validation</article-title>
        <source>Chemometrics and Intelligent Laboratory Systems</source>  
        <year>2001</year>  
        <month>4</month>  
        <volume>56</volume>  
        <issue>1</issue>  
        <fpage>1</fpage>  
        <lpage>11</lpage>  
        <pub-id pub-id-type="doi">10.1016/S0169-7439(00)00122-2</pub-id></nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Ribeiro</surname>
            <given-names>MT</given-names>
          </name>
          <name name-style="western">
            <surname>Singh</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Guestrin</surname>
            <given-names>C</given-names>
          </name>
        </person-group>
        <article-title>Why should i trust you? Explaining the predictions of any classifier</article-title>
        <year>2016</year>  
        <month>8</month>  
        <conf-name>KDD '16 Proceedings of the 22nd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining</conf-name>
        <conf-date>August 13-17, 2016</conf-date>
        <conf-loc>San Francisco, California, USA</conf-loc>
        <fpage>E</fpage>  
        <pub-id pub-id-type="doi">10.1145/2939672.2939778</pub-id></nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Kumara</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Reich</surname>
            <given-names>E</given-names>
          </name>
        </person-group>
        <article-title>Explainable data-driven modeling of patient satisfaction survey data</article-title>
        <year>2017</year>  
        <month>12</month>  
        <conf-name>2017 IEEE International Conference on Big Data</conf-name>
        <conf-date>11-14 Dec. 2017</conf-date>
        <conf-loc>Boston, MA, USA</conf-loc>
        <publisher-name>IEEE</publisher-name>
        <pub-id pub-id-type="doi">10.1109/BigData.2017.8258391</pub-id></nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Kandemir</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Demirbilek</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Özön</surname>
            <given-names>ZA</given-names>
          </name>
          <name name-style="western">
            <surname>Gönç</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Alikaşifoğlu</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <article-title>GnRH stimulation test in precocious puberty: single sample is adequate for diagnosis and dose adjustment</article-title>
        <source>J Clin Res Pediatr Endocrinol</source>  
        <year>2011</year>  
        <month>03</month>  
        <volume>3</volume>  
        <issue>1</issue>  
        <fpage>12</fpage>  
        <lpage>7</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.doi.org/10.4274/jcrpe.v3i1.03"/>
        </comment>  
        <pub-id pub-id-type="doi">10.4274/jcrpe.v3i1.03</pub-id>
        <pub-id pub-id-type="medline">21448328</pub-id>
        <pub-id pub-id-type="pmcid">PMC3065310</pub-id></nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Yazdani</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Lin</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Raman</surname>
            <given-names>V</given-names>
          </name>
          <name name-style="western">
            <surname>Haymond</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>A single sample GnRHa stimulation test in the diagnosis of precocious puberty</article-title>
        <source>Int J Pediatr Endocrinol</source>  
        <year>2012</year>  
        <month>07</month>  
        <day>18</day>  
        <volume>2012</volume>  
        <issue>1</issue>  
        <fpage>23</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://ijpeonline.biomedcentral.com/articles/10.1186/1687-9856-2012-23"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1186/1687-9856-2012-23</pub-id>
        <pub-id pub-id-type="medline">22809285</pub-id>
        <pub-id pub-id-type="pii">1687-9856-2012-23</pub-id>
        <pub-id pub-id-type="pmcid">PMC3438042</pub-id></nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Wolfe</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Divall</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Wu</surname>
            <given-names>S</given-names>
          </name>
        </person-group>
        <article-title>The regulation of reproductive neuroendocrine function by insulin and insulin-like growth factor-1 (IGF-1)</article-title>
        <source>Front Neuroendocrinol</source>  
        <year>2014</year>  
        <month>10</month>  
        <volume>35</volume>  
        <issue>4</issue>  
        <fpage>558</fpage>  
        <lpage>72</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/24929098"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1016/j.yfrne.2014.05.007</pub-id>
        <pub-id pub-id-type="medline">24929098</pub-id>
        <pub-id pub-id-type="pii">S0091-3022(14)00054-5</pub-id>
        <pub-id pub-id-type="pmcid">PMC4175134</pub-id></nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Divall</surname>
            <given-names>SA</given-names>
          </name>
          <name name-style="western">
            <surname>Williams</surname>
            <given-names>TR</given-names>
          </name>
          <name name-style="western">
            <surname>Carver</surname>
            <given-names>SE</given-names>
          </name>
          <name name-style="western">
            <surname>Koch</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Brüning</surname>
            <given-names>JC</given-names>
          </name>
          <name name-style="western">
            <surname>Kahn</surname>
            <given-names>CR</given-names>
          </name>
          <name name-style="western">
            <surname>Wondisford</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Radovick</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Wolfe</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <article-title>Divergent roles of growth factors in the GnRH regulation of puberty in mice</article-title>
        <source>J Clin Invest</source>  
        <year>2010</year>  
        <month>08</month>  
        <volume>120</volume>  
        <issue>8</issue>  
        <fpage>2900</fpage>  
        <lpage>9</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1172/JCI41069"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1172/JCI41069</pub-id>
        <pub-id pub-id-type="medline">20628204</pub-id>
        <pub-id pub-id-type="pii">41069</pub-id>
        <pub-id pub-id-type="pmcid">PMC2912185</pub-id></nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>de Vries</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Phillip</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Role of pelvic ultrasound in girls with precocious puberty</article-title>
        <source>Horm Res Paediatr</source>  
        <year>2011</year>  
        <month>02</month>  
        <volume>75</volume>  
        <issue>2</issue>  
        <fpage>148</fpage>  
        <lpage>52</lpage>  
        <pub-id pub-id-type="doi">10.1159/000323361</pub-id>
        <pub-id pub-id-type="medline">21228561</pub-id>
        <pub-id pub-id-type="pii">000323361</pub-id></nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Eksioglu</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Yilmaz</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Cetinkaya</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Cinar</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Yildiz</surname>
            <given-names>YT</given-names>
          </name>
          <name name-style="western">
            <surname>Aycan</surname>
            <given-names>Z</given-names>
          </name>
        </person-group>
        <article-title>Value of pelvic sonography in the diagnosis of various forms of precocious puberty in girls</article-title>
        <source>J Clin Ultrasound</source>  
        <year>2013</year>  
        <month>02</month>  
        <volume>41</volume>  
        <issue>2</issue>  
        <fpage>84</fpage>  
        <lpage>93</lpage>  
        <pub-id pub-id-type="doi">10.1002/jcu.22004</pub-id>
        <pub-id pub-id-type="medline">23124596</pub-id></nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Fernández Martínez</surname>
            <given-names>Jl</given-names>
          </name>
          <name name-style="western">
            <surname>Fernández Muñiz</surname>
            <given-names>Mz</given-names>
          </name>
          <name name-style="western">
            <surname>Tompkins</surname>
            <given-names>Mj</given-names>
          </name>
        </person-group>
        <article-title>On the topography of the cost functional in linear and nonlinear inverse problems</article-title>
        <source>Geophysics</source>  
        <year>2012</year>  
        <month>01</month>  
        <volume>77</volume>  
        <issue>1</issue>  
        <fpage>W1</fpage>  
        <lpage>W15</lpage>  
        <pub-id pub-id-type="doi">10.1190/geo2011-0341.1</pub-id></nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Polikar</surname>
            <given-names>R</given-names>
          </name>
        </person-group>
        <article-title>Ensemble based systems in decision making</article-title>
        <source>IEEE Circuits Syst Mag</source>  
        <year>2006</year>  
        <month>9</month>  
        <volume>6</volume>  
        <issue>3</issue>  
        <fpage>21</fpage>  
        <lpage>45</lpage>  
        <pub-id pub-id-type="doi">10.1109/MCAS.2006.1688199</pub-id></nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Fernández-Martínez</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Fernández-Muñiz</surname>
            <given-names>Z</given-names>
          </name>
          <name name-style="western">
            <surname>Pallero</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Pedruelo-González</surname>
            <given-names>L</given-names>
          </name>
        </person-group>
        <article-title>From Bayes to Tarantola: New insights to understand uncertainty in inverse problems</article-title>
        <source>Journal of Applied Geophysics</source>  
        <year>2013</year>  
        <month>11</month>  
        <volume>98</volume>  
        <fpage>62</fpage>  
        <lpage>72</lpage>  
        <pub-id pub-id-type="doi">10.1016/j.jappgeo.2013.07.005</pub-id></nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>deAndrés-Galiana</surname>
            <given-names>EJ</given-names>
          </name>
          <name name-style="western">
            <surname>Fernández-Martínez</surname>
            <given-names>JL</given-names>
          </name>
          <name name-style="western">
            <surname>Luaces</surname>
            <given-names>O</given-names>
          </name>
          <name name-style="western">
            <surname>Del</surname>
            <given-names>CJJ</given-names>
          </name>
          <name name-style="western">
            <surname>Huergo-Zapico</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Acebes-Huerta</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>González</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>González-Rodríguez</surname>
            <given-names>AP</given-names>
          </name>
        </person-group>
        <article-title>Analysis of clinical prognostic variables for Chronic Lymphocytic Leukemia decision-making problems</article-title>
        <source>J Biomed Inform</source>  
        <year>2016</year>  
        <month>04</month>  
        <volume>60</volume>  
        <fpage>342</fpage>  
        <lpage>51</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(16)00039-3"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1016/j.jbi.2016.02.017</pub-id>
        <pub-id pub-id-type="medline">26956213</pub-id>
        <pub-id pub-id-type="pii">S1532-0464(16)00039-3</pub-id></nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Kosmicki</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Sochat</surname>
            <given-names>V</given-names>
          </name>
          <name name-style="western">
            <surname>Duda</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Wall</surname>
            <given-names>DP</given-names>
          </name>
        </person-group>
        <article-title>Searching for a minimal set of behaviors for autism detection through feature selection-based machine learning</article-title>
        <source>Transl Psychiatry</source>  
        <year>2015</year>  
        <month>02</month>  
        <day>24</day>  
        <volume>5</volume>  
        <fpage>e514</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/25710120"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1038/tp.2015.7</pub-id>
        <pub-id pub-id-type="medline">25710120</pub-id>
        <pub-id pub-id-type="pii">tp20157</pub-id>
        <pub-id pub-id-type="pmcid">PMC4445756</pub-id></nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Xu</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>X</given-names>
          </name>
          <name name-style="western">
            <surname>Zhuang</surname>
            <given-names>X</given-names>
          </name>
          <name name-style="western">
            <surname>Liang</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Xi</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Lin</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Pan</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Zeng</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Li</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Cao</surname>
            <given-names>X</given-names>
          </name>
          <name name-style="western">
            <surname>Zhao</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Xia</surname>
            <given-names>H</given-names>
          </name>
        </person-group>
        <article-title>Developing a Machine Learning System for Identification of Severe Hand, Foot, and Mouth Disease from Electronic Medical Record Data</article-title>
        <source>Sci Rep</source>  
        <year>2017</year>  
        <month>11</month>  
        <day>27</day>  
        <volume>7</volume>  
        <issue>1</issue>  
        <fpage>16341</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.doi.org/10.1038/s41598-017-16521-z"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1038/s41598-017-16521-z</pub-id>
        <pub-id pub-id-type="medline">29180702</pub-id>
        <pub-id pub-id-type="pii">10.1038/s41598-017-16521-z</pub-id>
        <pub-id pub-id-type="pmcid">PMC5703994</pub-id></nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
