<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id>
      <journal-title>JMIR Medical Informatics</journal-title>
      <issn pub-type="epub">2291-9694</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v9i7e24796</article-id>
      <article-id pub-id-type="pmid">34255684</article-id>
      <article-id pub-id-type="doi">10.2196/24796</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Machine Learning Methods for the Diagnosis of Chronic Obstructive Pulmonary Disease in Healthy Subjects: Retrospective Observational Cohort Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Eysenbach</surname>
            <given-names>Gunther</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Gandhi</surname>
            <given-names>Chintan</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author">
          <name name-style="western">
            <surname>Muro</surname>
            <given-names>Shigeo</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7452-9191</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Ishida</surname>
            <given-names>Masato</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9719-7863</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Horie</surname>
            <given-names>Yoshiharu</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <address>
            <institution>Department of Data Science, Medical</institution>
            <institution>AstraZeneca KK</institution>
            <addr-line>3-1, Ofuka-cho, Kita-ku</addr-line>
            <addr-line>Osaka, 5300011</addr-line>
            <country>Japan</country>
            <phone>81 81 6 4802 3600</phone>
            <email>yoshiharu.horie@astrazeneca.com</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2609-2495</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Takeuchi</surname>
            <given-names>Wataru</given-names>
          </name>
          <degrees>MEng</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2515-1289</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Nakagawa</surname>
            <given-names>Shunki</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7933-668X</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Ban</surname>
            <given-names>Hideyuki</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-8785-0950</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Nakagawa</surname>
            <given-names>Tohru</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-4129-3033</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author">
          <name name-style="western">
            <surname>Kitamura</surname>
            <given-names>Tetsuhisa</given-names>
          </name>
          <degrees>MD, MSc, DPH</degrees>
          <xref rid="aff6" ref-type="aff">6</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0107-0580</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Department of Respiratory Medicine</institution>
        <institution>Nara Medical University</institution>
        <addr-line>Nara</addr-line>
        <country>Japan</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Department of Respiratory and Immunology, Medical</institution>
        <institution>AstraZeneca KK</institution>
        <addr-line>Osaka</addr-line>
        <country>Japan</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Department of Data Science, Medical</institution>
        <institution>AstraZeneca KK</institution>
        <addr-line>Osaka</addr-line>
        <country>Japan</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Center for Technology Innovation–Artificial Intelligence, Research &#38; Development Group</institution>
        <institution>Hitachi, Ltd</institution>
        <addr-line>Tokyo</addr-line>
        <country>Japan</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>Hitachi Health Care Center</institution>
        <institution>Hitachi, Ltd</institution>
        <addr-line>Ibaraki</addr-line>
        <country>Japan</country>
      </aff>
      <aff id="aff6">
        <label>6</label>
        <institution>Division of Environmental Medicine and Population Sciences</institution>
        <institution>Department of Social and Environmental Medicine</institution>
        <institution>Graduate School of Medicine, Osaka University</institution>
        <addr-line>Osaka</addr-line>
        <country>Japan</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Yoshiharu Horie <email>yoshiharu.horie@astrazeneca.com</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>7</month>
        <year>2021</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>6</day>
        <month>7</month>
        <year>2021</year>
      </pub-date>
      <volume>9</volume>
      <issue>7</issue>
      <elocation-id>e24796</elocation-id>
      <history>
        <date date-type="received">
          <day>5</day>
          <month>10</month>
          <year>2020</year>
        </date>
        <date date-type="rev-request">
          <day>28</day>
          <month>10</month>
          <year>2020</year>
        </date>
        <date date-type="rev-recd">
          <day>17</day>
          <month>11</month>
          <year>2020</year>
        </date>
        <date date-type="accepted">
          <day>11</day>
          <month>4</month>
          <year>2021</year>
        </date>
      </history>
      <copyright-statement>©Shigeo Muro, Masato Ishida, Yoshiharu Horie, Wataru Takeuchi, Shunki Nakagawa, Hideyuki Ban, Tohru Nakagawa, Tetsuhisa Kitamura. Originally published in JMIR Medical Informatics (https://medinform.jmir.org), 06.07.2021.</copyright-statement>
      <copyright-year>2021</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on https://medinform.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://medinform.jmir.org/2021/7/e24796" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Airflow limitation is a critical physiological feature in chronic obstructive pulmonary disease (COPD), for which long-term exposure to noxious substances, including tobacco smoke, is an established risk. However, not all long-term smokers develop COPD, meaning that other risk factors exist.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study aimed to predict the risk factors for COPD diagnosis using machine learning in an annual medical check-up database.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>In this retrospective observational cohort study (ARTDECO [Analysis of Risk Factors to Detect COPD]), annual medical check-up records for all Hitachi Ltd employees in Japan collected from April 1998 to March 2019 were analyzed. Employees who provided informed consent via an opt-out model were screened and those aged 30 to 75 years without a prior diagnosis of COPD/asthma or a history of cancer were included. The database included clinical measurements (eg, pulmonary function tests) and questionnaire responses. To predict the risk factors for COPD diagnosis within a 3-year period, the Gradient Boosting Decision Tree machine learning (XGBoost) method was applied as a primary approach, with logistic regression as a secondary method. A diagnosis of COPD was made when the ratio of the prebronchodilator forced expiratory volume in 1 second (FEV<sub>1</sub>) to prebronchodilator forced vital capacity (FVC) was &#60;0.7 during two consecutive examinations.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Of the 26,101 individuals screened, 1213 met the exclusion criteria, and thus, 24,815 individuals were included in the analysis. The top 10 predictors for COPD diagnosis were FEV<sub>1</sub>/FVC, smoking status, allergic symptoms, cough, pack years, hemoglobin A<sub>1c</sub>, serum albumin, mean corpuscular volume, percent predicted vital capacity, and percent predicted value of FEV<sub>1</sub>. The areas under the receiver operating characteristic curves of the XGBoost model and the logistic regression model were 0.956 and 0.943, respectively.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Using a machine learning model in this longitudinal database, we identified a number of parameters as risk factors other than smoking exposure or lung function to support general practitioners and occupational health physicians to predict the development of COPD. Further research to confirm our results is warranted, as our analysis involved a database used only in Japan.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>chronic obstructive pulmonary disease</kwd>
        <kwd>airflow limitation</kwd>
        <kwd>medical check-up</kwd>
        <kwd>Gradient Boosting Decision Tree</kwd>
        <kwd>logistic regression</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Chronic obstructive pulmonary disease (COPD) is characterized by airflow limitation associated with persistent respiratory symptoms. Most patients with COPD experience exacerbation of symptoms and are at high risk of developing comorbidities such as cardiovascular disease [<xref ref-type="bibr" rid="ref1">1</xref>].</p>
      <p>Long-term exposure to tobacco smoke, vapor, gas, dust, and fumes is an established major risk factor for COPD [<xref ref-type="bibr" rid="ref2">2</xref>]. However, only a small percentage of smokers develop airflow limitation, while nonsmokers can develop COPD [<xref ref-type="bibr" rid="ref3">3</xref>]. These inconsistencies indicate that risk factors other than long-term smoking are associated with COPD [<xref ref-type="bibr" rid="ref4">4</xref>].</p>
      <p>The prevalence of COPD has been reported to be 12% to 13% among smokers [<xref ref-type="bibr" rid="ref5">5</xref>]. However, only 9.4% of patients with airflow limitation have a previous diagnosis of COPD, and European data indicate that up to 80% of COPD cases are undiagnosed [<xref ref-type="bibr" rid="ref6">6</xref>], suggesting delays in the diagnosis of COPD. The ARCTIC observational cohort study showed that late COPD diagnosis was associated with a higher exacerbation rate and increased comorbidities and costs compared with early diagnosis [<xref ref-type="bibr" rid="ref7">7</xref>].</p>
      <p>To address the issue of undiagnosed COPD, significant risk factors for airflow limitation other than smoking should be identified and evaluated in routine clinical practice. In a cohort study of 9040 individuals from the Japanese general population, concomitant <italic>Chlamydia pneumoniae</italic> and <italic>Mycoplasma pneumoniae</italic> seropositivity was found to be an independent risk factor for airflow limitation [<xref ref-type="bibr" rid="ref8">8</xref>]. Additionally, Sato et al employed an annual health examination with pulmonary function tests measuring airflow limitation to identify undiagnosed patients with COPD among the Japanese population and found that iron deficiency might be associated with COPD development [<xref ref-type="bibr" rid="ref9">9</xref>]. However, the follow-up duration of these cohorts was short (&#60;3 years), limiting their ability to identify risk factors for COPD in the general population.</p>
      <p>A large questionnaire-based surveillance demonstrated some improvement in diagnostic rates for COPD; however, approximately 60% of eligible participants failed to respond to the questionnaire [<xref ref-type="bibr" rid="ref10">10</xref>]. While these results suggest that identifying robust and relevant risk factors is likely to improve early diagnosis, the slow progression and heterogeneity of the disease have hindered the identification of such risk factors for COPD development.</p>
      <p>The recently reported “Subtype and Stage Inference” machine learning computational model identified subtypes of patients with COPD [<xref ref-type="bibr" rid="ref11">11</xref>]. Compared with traditional approaches, the advantages of machine learning include the ability to process complex nonlinear relationships between predictors and to provide novel outputs. Therefore, the aim of this study was to apply machine learning methods to predict possible risk factors for the development of airflow limitation, an essential feature of COPD diagnosis, using a Japanese medical check-up database comprising data from a number of healthy subjects to support the early diagnosis of COPD by general practitioners and occupational health physicians.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Study Design and Population</title>
        <p>This was a retrospective observational cohort study to predict the risk factors for COPD diagnosis in healthy individuals. The analysis data set comprised individuals aged ≥30 years who had undertaken more than two medical check-ups, had no history of lung cancer or asthma at the first medical check-up, and could be classified as either having a diagnosis of COPD or as not having COPD. This study was designed according to the <italic>Transparent Reporting of a Multivariate Prediction Model for Individual Prognosis or Diagnosis</italic> guidelines for prognostic studies [<xref ref-type="bibr" rid="ref12">12</xref>].</p>
        <p>The study protocol was reviewed and approved by the ethics committee of MINS (a nonprofit organization in Tokyo, Japan) and the Research &#38; Development Group and Corporate Hospital Group of Hitachi, Ltd (Tokyo, Japan) prior to the start of data analysis. Individual informed consent was obtained using an opt-out model in agreement with the Institutional Review Board at Hitachi, Ltd. This study was conducted in accordance with the ethical principles of the Declaration of Helsinki.</p>
      </sec>
      <sec>
        <title>Data Source</title>
        <p>The data source was annual medical check-up data for all Hitachi employees from April 1998 to March 2019. Data were archived in a high-security server that was managed with limited access rights by Hitachi. The annual medical check-up includes clinical measurements and questionnaires to examine the health of employees (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Such questionnaires are utilized by Japanese organizations to evaluate their employees’ health and give advice about health promotion, such as giving up smoking and exercising regularly based on the second term of the National Health Promotion Movement in the 21st century (Health Japan 21) issued by the Ministry of Health, Labour, and Welfare in Japan [<xref ref-type="bibr" rid="ref13">13</xref>].</p>
      </sec>
      <sec>
        <title>Definition of COPD</title>
        <p>COPD was considered according to the lung function status at two consecutive measurements during an annual lung function test when the prebronchodilator (pre-BD) forced expiratory volume in 1 second/forced vital capacity (FEV<sub>1</sub>/FVC) was &#60;0.7, as previously employed in a large population-based cohort study [<xref ref-type="bibr" rid="ref14">14</xref>]. Individuals having a pre-BD FEV<sub>1</sub>/FVC ≥0.7 in at least three consecutive annual lung function test measurements were classified as non-COPD. For individuals with more than three records in the non-COPD group, the most recent three records were analyzed. Individuals having less than two lung function tests were excluded from all analyses. Spirometry was calibrated and performed by trained paramedical personnel according to the American Thoracic Society/European Respiratory Society guidelines [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref16">16</xref>].</p>
      </sec>
      <sec>
        <title>Statistical Analysis</title>
        <sec>
          <title>Age at COPD Diagnosis</title>
          <p>The age distribution for disease diagnosis was evaluated and stratified by smoking status (current smoker, exsmoker, or nonsmoker). The age at COPD diagnosis was defined as the age at the first of two consecutive measurements in which the pre-BD FEV<sub>1</sub>/FVC was &#60;0.7.</p>
        </sec>
        <sec>
          <title>Risk Factor Prediction Using Machine Learning</title>
          <p>Two types of models were constructed for predicting the risk factors for COPD diagnosis within 3 years as follows: a machine learning method (Gradient Boosting Decision Tree machine learning [XGBoost] [<xref ref-type="bibr" rid="ref17">17</xref>]) and an established statistical method (logistic regression [<xref ref-type="bibr" rid="ref18">18</xref>]). Individuals who did not meet the study inclusion criteria and/or had lung cancer/asthma were excluded from the analyses. Any individuals with missing data during the 3 years prior to the diagnosis year in the COPD group or during the most recent 3 years in the non-COPD group were excluded from the analyses. Propensity scores were calculated based on age, sex, smoking status, BMI, eosinophil count (EOS), and FEV<sub>1</sub>.</p>
          <p>Data were randomly divided into a training data set and a test data set at a ratio of 7:3, with the same ratio of COPD to non-COPD individuals. Propensity scoring was used to balance the characteristics of COPD and non-COPD individuals (caliper: 0.2) in the training and test data sets. Next, the training data set was randomly divided 8:2 for model construction (XGBoost and logistic) and evaluation of model performance, respectively. The data split, model construction, and evaluation processes were repeated five times for cross-validation (5-CV approach) [<xref ref-type="bibr" rid="ref19">19</xref>]. Model parameters, including the depth of the tree and regularization factor, were refined during performance evaluation by the 5-CV approach. Finally, the most optimal model was generated by applying the best parameters confirmed by the 5-CV approach. To evaluate model performance in the unlearned data, the most optimized model was used to evaluate the test data set.</p>
          <p>Model construction by logistic regression was performed in a similar way to the XGBoost method. Models were constructed in the training data set (randomly sampled data from the entire data set) and subsequently validated in the test data set after model evaluation.</p>
          <p>Following model construction, the area under the receiver operating characteristic curve (AUC), positive predictive value, sensitivity, specificity, and F1-measure were calculated for each model to evaluate the performance under both 5-CV and test conditions [<xref ref-type="bibr" rid="ref20">20</xref>]. The feature importance of the machine learning model was calculated to examine the contribution of each predictor to the model constructed using the Gini impurity method [<xref ref-type="bibr" rid="ref19">19</xref>]. The feature weight of the logistic regression model was also calculated. All analyses were performed using Python 3.6 software (Python Software Foundation).</p>
        </sec>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Individuals</title>
        <p>Data from 26,101 individuals (employees and their families) aged 30 to 75 years, who underwent annual check-ups between April 1998 and March 2019 were included in our analysis. The total number of medical check-up records was 318,568. All 26,101 individuals had lung function test measurements for 3 consecutive years. The medical records for 73 individuals aged &#60;30 years at the first medical check-up, 67 individuals with a history of cancer, and 727 individuals with a history of asthma were excluded, as were data from 419 individuals who had already been diagnosed with COPD (subjects for whom all data points of pre-BD FEV<sub>1</sub>/FVC were &#60;0.7 during the observational period) or had not been classified as either COPD or non-COPD (subjects with pre-BD FEV<sub>1</sub>/FVC &#60;0.7 without two consecutive measurements). Accordingly, data for 24,815 individuals (corresponding to 67,438 records) were included in the analyses (<xref rid="figure1" ref-type="fig">Figure 1</xref>).</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Flow diagram of the study. COPD: chronic obstructive pulmonary disease.</p>
          </caption>
          <graphic xlink:href="medinform_v9i7e24796_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Baseline Characteristics</title>
        <p><xref ref-type="table" rid="table1">Table 1</xref> shows the baseline characteristics of the COPD and non-COPD groups. Overall, 1489 individuals were considered as having COPD (pre-BD FEV<sub>1</sub>/FVC &#60;0.7 at two consecutive measurements during annual lung function tests). In comparison with the non-COPD group, the COPD group had a lower BMI, worse lung function (pre-BD FEV<sub>1</sub>, pre-BD percent predicted value of FEV<sub>1</sub> [%FEV<sub>1</sub>], and pre-BD FEV<sub>1</sub>/FVC), and greater emphysematous change and chronic inflammation as determined by computed tomography. Furthermore, comorbidities, such as arrythmia, duodenal ulcer, colorectal polyp, angina, stomach ulcer, and kidney disease, were more prevalent in the COPD group. Statistically significant differences in hematological parameters (mean corpuscular volume [MCV], mean corpuscular hemoglobin concentration [MCHC], mean corpuscular hemoglobin [MCH], hemoglobin [Hb], and hematocrit [HT] [<xref ref-type="bibr" rid="ref15">15</xref>]) between the COPD and non-COPD groups were also observed. Inflammatory markers, particularly white blood cell (WBC) count and EOS, were also significantly higher in the COPD group.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Subject characteristics stratified by chronic obstructive pulmonary disease status.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="480"/>
            <col width="220"/>
            <col width="180"/>
            <col width="90"/>
            <thead>
              <tr valign="bottom">
                <td colspan="2">Characteristic</td>
                <td>Non-COPD<sup>a</sup> (n=23,326)</td>
                <td>COPD (n=1489)</td>
                <td><italic>P</italic> value</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="2">Age (years), mean (SD)</td>
                <td>42 (9.1)</td>
                <td>48 (9.3)</td>
                <td>&#60;.001</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Female, n (%)</td>
                <td>3841 (16.5%)</td>
                <td>58 (3.9%)</td>
                <td>&#60;.001</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Smoking status, n (%)</bold>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Current smoker</td>
                <td>10,632 (45.6%)</td>
                <td>1,021 (68.6%)</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Exsmoker</td>
                <td>3534 (15.2%)</td>
                <td>202 (13.6%)</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Nonsmoker</td>
                <td>9153 (39.3%)</td>
                <td>266 (17.9%)</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Unknown/missing</td>
                <td>7 (0.0%)</td>
                <td>0 (0.0%)</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td colspan="2">BMI (kg/m<sup>2</sup>), mean (SD)</td>
                <td>23 (3.2)</td>
                <td>22 (2.7)</td>
                <td>&#60;.001</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Lung function test, mean (SD)</bold>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Prebronchodilator FEV<sub>1</sub><sup>b</sup></td>
                <td>3.4 (0.7)</td>
                <td>3.1 (0.6)</td>
                <td>&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Prebronchodilator FVC<sup>c</sup></td>
                <td>4.1 (0.8)</td>
                <td>4.2 (0.8)</td>
                <td>&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Prebronchodilator FEV<sub>1</sub>/FVC</td>
                <td>83.7 (5.4)</td>
                <td>74.9 (5.1)</td>
                <td>&#60;.001</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Comorbidity, n (%)</bold>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Arrythmia</td>
                <td>107 (0.5%)</td>
                <td>16 (1.1%)</td>
                <td>.003</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Duodenal ulcer</td>
                <td>158 (0.7%)</td>
                <td>19 (1.3%)</td>
                <td>.02</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Colorectal polyp</td>
                <td>43 (0.2%)</td>
                <td>13 (0.9%)</td>
                <td>&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Angina</td>
                <td>56 (0.2%)</td>
                <td>10 (0.7%)</td>
                <td>.006</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Stomach ulcer</td>
                <td>180 (0.8%)</td>
                <td>29 (1.9%)</td>
                <td>&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Kidney disease</td>
                <td>77 (0.3%)</td>
                <td>12 (0.8%)</td>
                <td>.01</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Computed tomography finding, n (%)</bold>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Bulla, bleb</td>
                <td>108 (0.5%)</td>
                <td>31 (2.1%)</td>
                <td>&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Moderate emphysema</td>
                <td>18 (0.1%)</td>
                <td>13 (0.9%)</td>
                <td>&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Mild emphysema</td>
                <td>96 (0.4%)</td>
                <td>27 (1.8%)</td>
                <td>&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Calcification of left anterior descending coronary artery</td>
                <td>128 (0.5%)</td>
                <td>16 (1.1%)</td>
                <td>.02</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Chronic inflammation</td>
                <td>342 (1.5%)</td>
                <td>43 (2.9%)</td>
                <td>&#60;.001</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Laboratory parameters, mean (SD)</bold>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Albumin (U/L)</td>
                <td>4.4 (0.2)</td>
                <td>4.3 (0.2)</td>
                <td>&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Alanine aminotransferase (U/L)</td>
                <td>209.5 (53.7)</td>
                <td>215.2 (54.6)</td>
                <td>&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Aspartate aminotransferase (U/L)</td>
                <td>26.4 (14.8)</td>
                <td>24.3 (12.8)</td>
                <td>&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Blood urea nitrogen (mg/dL)</td>
                <td>14.1 (3.2)</td>
                <td>14.7 (3.3)</td>
                <td>&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Cholinesterase (U/L)</td>
                <td>320.8 (60.1)</td>
                <td>307.8 (58.8)</td>
                <td>&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Estimated glomerular filtration rate (mL/min/1.73 m<sup>2</sup>)</td>
                <td>83.6 (14.6)</td>
                <td>80.2 (14.1)</td>
                <td>&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Eosinophil count (cells/mm<sup>3</sup>)</td>
                <td>183.2 (124.5)</td>
                <td>195.4 (125.9)</td>
                <td>&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Gamma-glutamyl transferase (U/L)</td>
                <td>42.7 (34.4)</td>
                <td>45.8 (34.5)</td>
                <td>&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Hemoglobin (g/dL)</td>
                <td>14.7 (1.4)</td>
                <td>14.9 (1.1)</td>
                <td>&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Hemoglobin A<sub>1c</sub> (%)</td>
                <td>5.3 (0.7)</td>
                <td>5.4 (0.7)</td>
                <td>&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Hematocrit (%)</td>
                <td>44.0 (3.6)</td>
                <td>44.6 (3.1)</td>
                <td>&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>MCH<sup>d</sup> (pg)</td>
                <td>30.5 (1.8)</td>
                <td>31.1 (1.7)</td>
                <td>&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>MCHC<sup>e</sup> (g/L)</td>
                <td>33.4 (1.0)</td>
                <td>33.3 (0.8)</td>
                <td>&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>MCV<sup>f</sup> (fL)</td>
                <td>91.3 (4.6)</td>
                <td>93.4 (4.4)</td>
                <td>&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>WBC<sup>g</sup> count (×10<sup>2</sup> cells/µL)</td>
                <td>58.8 (15.0)</td>
                <td>62.8 (15.5)</td>
                <td>&#60;.001</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>COPD: chronic obstructive pulmonary disease.</p>
            </fn>
            <fn id="table1fn2">
              <p><sup>b</sup>FEV<sub>1</sub>: forced expiratory volume in 1 second.</p>
            </fn>
            <fn id="table1fn3">
              <p><sup>c</sup>FVC: forced vital capacity.</p>
            </fn>
            <fn id="table1fn4">
              <p><sup>d</sup>MCH: mean corpuscular hemoglobin.</p>
            </fn>
            <fn id="table1fn5">
              <p><sup>e</sup>MCHC: mean corpuscular hemoglobin concentration.</p>
            </fn>
            <fn id="table1fn6">
              <p><sup>f</sup>MCV: mean corpuscular volume.</p>
            </fn>
            <fn id="table1fn7">
              <p><sup>g</sup>WBC: white blood cell.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Percentage of Individuals With COPD</title>
        <p>The overall percentage of individuals with COPD was 6.0% (1489/24,815). According to smoking status, the percentage of individuals with COPD was 8.8% (1021/11,653) among current smokers and 5.4% (202/3736) among exsmokers. Notably, 2.8% (266/9419) of nonsmokers had developed COPD. The peak age at diagnosis of COPD among current smokers and exsmokers was 55 years and 65 years, respectively (<xref rid="figure2" ref-type="fig">Figure 2</xref>).</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Diagnostic age for chronic obstructive pulmonary disease (COPD) according to smoking status.</p>
          </caption>
          <graphic xlink:href="medinform_v9i7e24796_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Risk Factors for COPD Diagnosis</title>
        <p>Overall, 20,265 individuals (COPD: n=954; non-COPD: n=19,311) with 51,432 records (COPD: n=2435; non-COPD: n=48,997) out of 24,815 individuals who met the criteria (<xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>) were included in the machine learning analysis. <xref ref-type="table" rid="table2">Table 2</xref> shows the model performance of the XGBoost and logistic regression models. For both models, the AUC, accuracy, sensitivity, specificity, and F-measure were generally similar between the training and test data sets. The XGBoost model had a higher positive predictive value (0.505) than the logistic regression model (0.441). The AUC was high in the training and test sets for both models (range: 0.892-0.956). Additionally, the accuracy and specificity exceeded 0.883 and 0.879, respectively, for both models.</p>
        <p>The most important predictive factors for COPD diagnosis were lung function tests (ie, FEV<sub>1</sub>/FVC, percent vital capacity [%VC], and %FEV<sub>1</sub>) and smoking status, followed by cough, hematological indices (ie, MCV, MCHC, MCH, Hb, and HT), treatment with antidiabetic drugs, hemoglobin A<sub>1c</sub>, serum albumin, total protein, and BMI. Other predictive risk factors were EOS, serum alanine aminotransferase, WBC count, and urinary WBC count (<xref ref-type="table" rid="table3">Table 3</xref>). Logistic regression analysis showed that low FEV<sub>1</sub>/FVC and %FEV<sub>1</sub>; high %VC; high MCV, MCHC, and Hb; and low HT and MCH were related factors, and that individuals treated with antidiabetic drugs had a higher number of associated risk factors for COPD. Low serum albumin, low total protein, and low BMI were also confirmed as risk factors (<xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>).</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Comparison of performance of the Gradient Boosting Decision Tree machine learning (XGBoost) and logistic regression models.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="230"/>
            <col width="230"/>
            <col width="160"/>
            <col width="0"/>
            <col width="250"/>
            <col width="130"/>
            <thead>
              <tr valign="top">
                <td rowspan="2">Variable</td>
                <td colspan="3">XGBoost<sup>a</sup> model</td>
                <td colspan="2">Logistic regression model</td>
              </tr>
              <tr valign="top">
                <td>Training, mean (SE)</td>
                <td>Test, mean</td>
                <td colspan="2">Training, mean (SE)</td>
                <td>Test, mean</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Positive predictive value</td>
                <td>0.505 (0.099)</td>
                <td>0.362</td>
                <td colspan="2">0.441 (0.110)</td>
                <td>0.285</td>
              </tr>
              <tr valign="top">
                <td>AUC<sup>b</sup></td>
                <td>0.956 (0.015)</td>
                <td>0.898</td>
                <td colspan="2">0.943 (0.022)</td>
                <td>0.892</td>
              </tr>
              <tr valign="top">
                <td>Accuracy</td>
                <td>0.917 (0.032)</td>
                <td>0.918</td>
                <td colspan="2">0.884 (0.049)</td>
                <td>0.883</td>
              </tr>
              <tr valign="top">
                <td>Sensitivity</td>
                <td>0.845 (0.021)</td>
                <td>0.877</td>
                <td colspan="2">0.874 (0.039)</td>
                <td>0.901</td>
              </tr>
              <tr valign="top">
                <td>Specificity</td>
                <td>0.960 (0.016)</td>
                <td>0.919</td>
                <td colspan="2">0.946 (0.025)</td>
                <td>0.882</td>
              </tr>
              <tr valign="top">
                <td>F-measure</td>
                <td>0.370 (0.107)</td>
                <td>0.513</td>
                <td colspan="2">0.306 (0.110)</td>
                <td>0.434</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>XGBoost: Gradient Boosting Decision Tree machine learning.</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>AUC: area under the receiver operating characteristic curve.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Importance of each predictor in the XGBoost model.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="750"/>
            <col width="250"/>
            <thead>
              <tr valign="top">
                <td>Variable</td>
                <td>Importance value</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Forced expiratory volume in 1 second/forced vital capacity</td>
                <td>0.2824</td>
              </tr>
              <tr valign="top">
                <td>Smoking status</td>
                <td>0.0329</td>
              </tr>
              <tr valign="top">
                <td>Allergic symptoms (yes/no)</td>
                <td>0.0303</td>
              </tr>
              <tr valign="top">
                <td>Symptom-cough (yes/no)</td>
                <td>0.0294</td>
              </tr>
              <tr valign="top">
                <td>Smoking-pack year</td>
                <td>0.0222</td>
              </tr>
              <tr valign="top">
                <td>Hemoglobin A<sub>1c</sub></td>
                <td>0.0197</td>
              </tr>
              <tr valign="top">
                <td>Albumin</td>
                <td>0.0195</td>
              </tr>
              <tr valign="top">
                <td>Mean corpuscular volume</td>
                <td>0.0177</td>
              </tr>
              <tr valign="top">
                <td>%Vital capacity</td>
                <td>0.0165</td>
              </tr>
              <tr valign="top">
                <td>%Forced expiratory volume in 1 second</td>
                <td>0.0164</td>
              </tr>
              <tr valign="top">
                <td>Treatment with an antidiabetic drug (yes/no)</td>
                <td>0.0162</td>
              </tr>
              <tr valign="top">
                <td>Allergic disease (yes/no)</td>
                <td>0.0146</td>
              </tr>
              <tr valign="top">
                <td>Hematocrit</td>
                <td>0.0144</td>
              </tr>
              <tr valign="top">
                <td>Urinary red blood cells</td>
                <td>0.0143</td>
              </tr>
              <tr valign="top">
                <td>Hemoglobin</td>
                <td>0.0138</td>
              </tr>
              <tr valign="top">
                <td>Age</td>
                <td>0.0128</td>
              </tr>
              <tr valign="top">
                <td>Smoking duration</td>
                <td>0.0127</td>
              </tr>
              <tr valign="top">
                <td>High density lipoprotein cholesterol</td>
                <td>0.0123</td>
              </tr>
              <tr valign="top">
                <td>Mean corpuscular hemoglobin concentration</td>
                <td>0.0122</td>
              </tr>
              <tr valign="top">
                <td>Total protein</td>
                <td>0.0118</td>
              </tr>
              <tr valign="top">
                <td>BMI</td>
                <td>0.0118</td>
              </tr>
              <tr valign="top">
                <td>Number of eosinophils</td>
                <td>0.0115</td>
              </tr>
              <tr valign="top">
                <td>Mean corpuscular hemoglobin</td>
                <td>0.0114</td>
              </tr>
              <tr valign="top">
                <td>Serum white blood cells</td>
                <td>0.0111</td>
              </tr>
              <tr valign="top">
                <td>Fasting blood sugar</td>
                <td>0.0110</td>
              </tr>
              <tr valign="top">
                <td>Serum alanine aminotransferase</td>
                <td>0.0108</td>
              </tr>
              <tr valign="top">
                <td>Pulse rate</td>
                <td>0.0108</td>
              </tr>
              <tr valign="top">
                <td>Forced expiratory volume in 1 second</td>
                <td>0.0107</td>
              </tr>
              <tr valign="top">
                <td>Urinary white blood cells</td>
                <td>0.0104</td>
              </tr>
              <tr valign="top">
                <td>Diastolic blood pressure</td>
                <td>0.0103</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <p>For future utilization of risk factors for disease assessment in daily clinical practice, the machine learning process was validated using a questionnaire to predict risk factors for COPD development (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Of 30 variables, 25 were clinical parameters that overlapped between the two methods. The top 30 risk factors also included the following five questions: “I am regularly doing exercise,” “I have chest compression and pain,” “Average sleeping time in the past 1 month,” “I have breakfast every day,” and “Body fat ratio” (<xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>). Among these, logistic regression analysis showed that insufficient sleeping time and not having breakfast every day were risk factors for COPD (<xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>).</p>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <p>This study applied a machine learning method, a powerful tool to analyze large quantities of complex data, to predict risk factors for COPD. This is the first study to investigate more than 300,000 records from working-age adults in Japan utilizing an annual medical check-up database. This system allows healthy employees to track their health conditions over time by clinical measurements and questionnaires. We found that the most significant predictor of COPD diagnosis was the absolute value of FEV<sub>1</sub>/FVC, indicating that low FEV<sub>1</sub> in early adulthood is an important factor in the development of COPD. Childhood asthma is associated with impaired lung function, lower lung function in adulthood, and higher risk of COPD even for nonsmoker participants, as previously reported by Martinez et al [<xref ref-type="bibr" rid="ref21">21</xref>]. In our speculation, some part of the nonsmoker COPD population might have had a history of childhood asthma, increasing susceptibility to passive smoke exposure or airway pollution and resulting in the early diagnosis of COPD in nonsmokers compared with exsmokers in the study. Smoking status had the second highest impact on disease diagnosis. Among individuals with a smoking history, the peak age of COPD diagnosis was older in exsmokers than in current smokers. This finding suggests that smoking cessation delays the diagnosis of COPD, consistent with a previous study in which smoking cessation was reported to affect the natural history of COPD [<xref ref-type="bibr" rid="ref22">22</xref>].</p>
      <p>Erythrocyte indices (MCV and MCHC) might also be available as potential predictors of COPD diagnosis in addition to lung function measurements. These data are supported by a previous report in which continuous smoking had a significant effect on hematological parameters compared with nonsmoking, and it may be associated with an increased risk of COPD [<xref ref-type="bibr" rid="ref23">23</xref>]. The increased levels of MCV and MCHC in individuals with COPD support a previous finding that impaired lung function has a strong association with ischemic heart disease [<xref ref-type="bibr" rid="ref24">24</xref>]. Conversely, the presence of an allergic disease appeared to have a preventive effect on airflow limitation, which is in contrast with observations from the Tasmanian Longitudinal Health Study in which the presence of allergic diseases was an early predictor of lung trajectories toward COPD [<xref ref-type="bibr" rid="ref25">25</xref>]. However, the Hokkaido cohort study showed that subjects with multiple asthma-like features had slower lung function decline [<xref ref-type="bibr" rid="ref26">26</xref>]. From the findings of our observational study in Japan, we can speculate that early diagnosis and intervention for allergic diseases may have less impact on lung function and that regular and frequent medical intervention could lead to an overall increase in life expectancy among patients who can readily access appropriate treatment by respiratory specialists.</p>
      <p>Furthermore, individuals with decreased levels of serum albumin and total protein, as well as lower hemoglobin A<sub>1c</sub> and BMI may be at risk of developing cachexia, a common condition among patients with COPD [<xref ref-type="bibr" rid="ref27">27</xref>]. With respect to other identified risk factors, a retrospective cross-sectional study showed an association between EOS and airflow limitation in patients with COPD [<xref ref-type="bibr" rid="ref28">28</xref>]. Given that increased alanine aminotransferase levels have been observed in patients with obstructive sleep apnea [<xref ref-type="bibr" rid="ref29">29</xref>], individuals at risk of developing COPD might be exposed to intermittent hypoxia, indicating that a reduced sleeping time, as determined in the study questionnaire, might also represent a risk factor for COPD. Even minor changes in hematological parameters might be attributable to hypoxic conditions, leading to sleep disruption. Additionally, frequently missing breakfast might accelerate malnutrition in the COPD group. Furthermore, significantly higher prevalence rates of chronic neck and lower back pain in patients with COPD compared with healthy individuals were observed in a population-based study, although the findings were not confirmed by logistic regression analysis [<xref ref-type="bibr" rid="ref30">30</xref>], and the link between COPD and back pain remains unknown. The observation of increased WBC counts in patients with COPD compared with healthy controls [<xref ref-type="bibr" rid="ref31">31</xref>] suggests that systemic inflammation may be involved in the pathogenesis of COPD [<xref ref-type="bibr" rid="ref32">32</xref>].</p>
      <p>Our results also indicate that smoking cessation should be prioritized for the prevention of COPD and that smokers with sleep disturbances, back pain, and/or low BMI and malnutrition may be at increased risk of developing COPD and should be considered as candidates for lifestyle intervention therapy. Furthermore, the five key questions included in our questionnaire should be validated in future investigations and potentially implemented in daily practice as part of an annual medical check-up to prevent COPD.</p>
      <p>The positive predictive value of the XGBoost model was comparable to that of a self-scored persistent airflow obstruction screening questionnaire in the Japanese population previously reported by Samukawa et al [<xref ref-type="bibr" rid="ref33">33</xref>]. However, our models showed more accuracy because the sensitivity and specificity of our models achieved higher figures, and the AUC reached over 0.9 compared with that of the questionnaire, which ranged from 0.595 to 0.612. The AUCs of the XGBoost and logistic regression models were similar, while the most important factor related to COPD diagnosis was FEV<sub>1</sub> in both models. However, some variables differed in importance in each model. Kuhn et al reported that machine learning approaches can incorporate high-order nonlinear interactions among predictors that cannot be addressed by traditional modeling approaches (eg, logistic regression models) [<xref ref-type="bibr" rid="ref34">34</xref>]. However, machine learning methods cannot elucidate whether a causal relationship exists between the identified variable and the disease. Thus, the association between risk factors detected using a machine learning model and COPD requires validation in future prospective studies.</p>
      <p>A strength of this study was the use of longitudinal lung function test data from healthy individuals from April 1998 to March 2019. In general, medical checkup data are not linked to medical records, meaning that profiles of lung function tests over time could not be investigated. However, it was possible to evaluate longitudinal lung function tests because the database included data from individuals from a point in time when they were healthy until they had developed COPD. Additionally, data from healthy individuals were included, allowing lung function test results from when they were diagnosed with COPD to be investigated. Finally, both clinical measurements and questionnaire variables were included in the database, thereby increasing the potential to identify several different risk factors for COPD.</p>
      <p>The limitations of this study include the definition of COPD diagnosis by airflow limitation with pulmonary function tests. Instead of post-BD spirometry data as suggested by the ATS/European respiratory guidelines, we employed pre-BD spirometry data for the diagnosis of COPD since no post-BD spirometry was performed in the annual medical check-up. The precise diagnosis of COPD cannot always be demonstrated by airflow limitation alone; however, we believe that the diagnostic approach was reasonable from a clinical perspective as airflow limitation has been reported to be a poor prognostic factor in the general population [<xref ref-type="bibr" rid="ref35">35</xref>]. Low lung function values (FEV<sub>1</sub>/FVC &#60;0.7) might be observed at a single time point in some individuals for no discernable reason. Therefore, we considered COPD as lung function of FEV<sub>1</sub>/FVC &#60;0.7 on two consecutive occasions. In terms of differentiation between asthma and COPD, we cannot exclude the possibility of misclassification of asthma as COPD in some patients since reversibility tests were not performed in the annual medical check-up, but participants with a medical history of asthma were excluded. Additionally, a database from a single organization was analyzed in this study; thus, the results might include bias based on the type of industry or the organizational structure of the company, limiting the generalizability of the findings. To obtain more generalizable findings, studies using other databases are necessary. Finally, some unknown confounders may have remained; therefore, we plan to perform model validation by analyzing other databases. Well-controlled prospective studies should be conducted to confirm the predictive factors for COPD diagnosis.</p>
      <p>In conclusion, our machine learning method applied to longitudinal medical check-up data, including general questionnaires and laboratory parameters, identified hematological, nutritional, and inflammatory parameters as potential risk factors for COPD. These parameters, along with lung function and smoking status, may be useful in identifying at-risk individuals and may lead to an earlier diagnosis.</p>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Clinical assessments and questions used in the analysis, and list of variables.</p>
        <media xlink:href="medinform_v9i7e24796_app1.docx" xlink:title="DOCX File , 56 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>Numbers of records and individuals included in the machine learning model.</p>
        <media xlink:href="medinform_v9i7e24796_app2.docx" xlink:title="DOCX File , 42 KB"/>
      </supplementary-material>
      <supplementary-material id="app3">
        <label>Multimedia Appendix 3</label>
        <p>Association between chronic obstructive pulmonary disease and the top 30 variables of importance based on logistic regression.</p>
        <media xlink:href="medinform_v9i7e24796_app3.docx" xlink:title="DOCX File , 45 KB"/>
      </supplementary-material>
      <supplementary-material id="app4">
        <label>Multimedia Appendix 4</label>
        <p>Importance of each predictor in the XGBoost model (including questionnaire items).</p>
        <media xlink:href="medinform_v9i7e24796_app4.docx" xlink:title="DOCX File , 44 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">5-CV</term>
          <def>
            <p>five times for cross-validation</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">AUC</term>
          <def>
            <p>area under the receiver operating characteristic curve</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">BD</term>
          <def>
            <p>bronchodilator</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">COPD</term>
          <def>
            <p>chronic obstructive pulmonary disease</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">EOS</term>
          <def>
            <p>eosinophil count</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">FEV1</term>
          <def>
            <p>forced expiratory volume in 1 second</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">FVC</term>
          <def>
            <p>forced vital capacity</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">Hb</term>
          <def>
            <p>hemoglobin</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">HT</term>
          <def>
            <p>hematocrit</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">MCHC</term>
          <def>
            <p>mean corpuscular hemoglobin concentration</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">MCV</term>
          <def>
            <p>mean corpuscular volume</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb12">WBC</term>
          <def>
            <p>white blood cell</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb13">XGBoost</term>
          <def>
            <p>Gradient Boosting Decision Tree machine learning method</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>The authors thank ND Smith, Y Baba, and K Dohi of EMC Japan (Osaka, Japan) for critical reading and native checking of the manuscript. We also thank Tricia Newell and Clare Cox of Edanz Evidence Generation for providing editing support. This study was funded by AstraZeneca KK.</p>
    </ack>
    <fn-group>
      <fn fn-type="con">
        <p>SM and TK contributed to data interpretation and reviewed the manuscript. YH planned the analyses, contributed to data interpretation, and drafted the manuscript. MI designed the study and drafted the manuscript. SN, WT, and HB conducted the analyses. TN corrected and provided the data, and reviewed the analysis including data cleansing and preprocessing. All authors take full responsibility for the content and editorial decisions, and approved the final version.</p>
      </fn>
      <fn fn-type="conflict">
        <p>SM has received honoraria from AstraZeneca KK, Boehringer Ingelheim Japan, GlaxoSmithKline KK, Novartis Pharma KK, Meiji Seika Pharma Co, Ltd, Kyorin Pharmaceutical Co, Ltd, Otsuka Pharmaceutical Co, Ltd, Teijin Pharma Ltd, CHEST MI, Inc, Daiichi Sankyo Co, Ltd, Chugai Pharmaceutical Co, Ltd, Sanofi KK, Actelion Pharmaceuticals Japan Ltd, and Olympus Corporation. MI and YH are employees of AstraZeneca KK. WT, SN, HB, and TN are employees of Hitachi, Ltd.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vogelmeier</surname>
              <given-names>CF</given-names>
            </name>
            <name name-style="western">
              <surname>Criner</surname>
              <given-names>GJ</given-names>
            </name>
            <name name-style="western">
              <surname>Martinez</surname>
              <given-names>FJ</given-names>
            </name>
            <name name-style="western">
              <surname>Anzueto</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Barnes</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Bourbeau</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Celli</surname>
              <given-names>BR</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Decramer</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Fabbri</surname>
              <given-names>LM</given-names>
            </name>
            <name name-style="western">
              <surname>Frith</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Halpin</surname>
              <given-names>DMG</given-names>
            </name>
            <name name-style="western">
              <surname>López Varela</surname>
              <given-names>MV</given-names>
            </name>
            <name name-style="western">
              <surname>Nishimura</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Roche</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Rodriguez-Roisin</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Sin</surname>
              <given-names>DD</given-names>
            </name>
            <name name-style="western">
              <surname>Singh</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Stockley</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Vestbo</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wedzicha</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Agustí</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Global Strategy for the Diagnosis, Management, and Prevention of Chronic Obstructive Lung Disease 2017 Report. GOLD Executive Summary</article-title>
          <source>Am J Respir Crit Care Med</source>
          <year>2017</year>
          <month>03</month>
          <day>01</day>
          <volume>195</volume>
          <issue>5</issue>
          <fpage>557</fpage>
          <lpage>582</lpage>
          <pub-id pub-id-type="doi">10.1164/rccm.201701-0218PP</pub-id>
          <pub-id pub-id-type="medline">28128970</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>de Marco</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Accordini</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Marcon</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Cerveri</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Antó</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Gislason</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Heinrich</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Janson</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Jarvis</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Kuenzli</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Leynaert</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Sunyer</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Svanes</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wjst</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Burney</surname>
              <given-names>P</given-names>
            </name>
            <collab>European Community Respiratory Health Survey (ECRHS)</collab>
          </person-group>
          <article-title>Risk factors for chronic obstructive pulmonary disease in a European cohort of young adults</article-title>
          <source>Am J Respir Crit Care Med</source>
          <year>2011</year>
          <month>04</month>
          <day>01</day>
          <volume>183</volume>
          <issue>7</issue>
          <fpage>891</fpage>
          <lpage>7</lpage>
          <pub-id pub-id-type="doi">10.1164/rccm.201007-1125OC</pub-id>
          <pub-id pub-id-type="medline">20935112</pub-id>
          <pub-id pub-id-type="pii">201007-1125OC</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fletcher</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Peto</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>The natural history of chronic airflow obstruction</article-title>
          <source>Br Med J</source>
          <year>1977</year>
          <month>06</month>
          <day>25</day>
          <volume>1</volume>
          <issue>6077</issue>
          <fpage>1645</fpage>
          <lpage>8</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/871704"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmj.1.6077.1645</pub-id>
          <pub-id pub-id-type="medline">871704</pub-id>
          <pub-id pub-id-type="pmcid">PMC1607732</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Stang</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Lydick</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Silberman</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Kempel</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Keating</surname>
              <given-names>ET</given-names>
            </name>
          </person-group>
          <article-title>The prevalence of COPD: using smoking rates to estimate disease frequency in the general population</article-title>
          <source>Chest</source>
          <year>2000</year>
          <month>05</month>
          <volume>117</volume>
          <issue>5 Suppl 2</issue>
          <fpage>354S</fpage>
          <lpage>9S</lpage>
          <pub-id pub-id-type="doi">10.1378/chest.117.5_suppl_2.354s</pub-id>
          <pub-id pub-id-type="medline">10843976</pub-id>
          <pub-id pub-id-type="pii">S0012-3692(15)32851-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fukuchi</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Nishimura</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ichinose</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Adachi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Nagai</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kuriyama</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Takahashi</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Nishimura</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Ishioka</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Aizawa</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Zaher</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>COPD in Japan: the Nippon COPD Epidemiology study</article-title>
          <source>Respirology</source>
          <year>2004</year>
          <month>11</month>
          <volume>9</volume>
          <issue>4</issue>
          <fpage>458</fpage>
          <lpage>65</lpage>
          <pub-id pub-id-type="doi">10.1111/j.1440-1843.2004.00637.x</pub-id>
          <pub-id pub-id-type="medline">15612956</pub-id>
          <pub-id pub-id-type="pii">RES637</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Soriano</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Zielinski</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Price</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Screening for and early detection of chronic obstructive pulmonary disease</article-title>
          <source>The Lancet</source>
          <year>2009</year>
          <month>08</month>
          <day>29</day>
          <volume>374</volume>
          <issue>9691</issue>
          <fpage>721</fpage>
          <lpage>732</lpage>
          <pub-id pub-id-type="doi">10.1016/S0140-6736(09)61290-3</pub-id>
          <pub-id pub-id-type="medline">19716965</pub-id>
          <pub-id pub-id-type="pii">S0140-6736(09)61290-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Larsson</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Janson</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Ställberg</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Lisspers</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Olsson</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Kostikas</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Gruenberger</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Gutzwiller</surname>
              <given-names>FS</given-names>
            </name>
            <name name-style="western">
              <surname>Uhde</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Jorgensen</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Johansson</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Impact of COPD diagnosis timing on clinical and economic outcomes: the ARCTIC observational cohort study</article-title>
          <source>Int J Chron Obstruct Pulmon Dis</source>
          <year>2019</year>
          <volume>14</volume>
          <fpage>995</fpage>
          <lpage>1008</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.doi.org/10.2147/COPD.S195382"/>
          </comment>
          <pub-id pub-id-type="doi">10.2147/COPD.S195382</pub-id>
          <pub-id pub-id-type="medline">31190785</pub-id>
          <pub-id pub-id-type="pii">195382</pub-id>
          <pub-id pub-id-type="pmcid">PMC6526023</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Muro</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tabara</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Matsumoto</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Setoh</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kawaguchi</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Takahashi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ito</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Ito</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Murase</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Terao</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Kosugi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Yamada</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Sekine</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Nakayama</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Chin</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Mishima</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Matsuda</surname>
              <given-names>F</given-names>
            </name>
            <collab>Nagahama Study Group</collab>
          </person-group>
          <article-title>Relationship Among Chlamydia and Mycoplasma Pneumoniae Seropositivity, IKZF1 Genotype and Chronic Obstructive Pulmonary Disease in A General Japanese Population: The Nagahama Study</article-title>
          <source>Medicine (Baltimore)</source>
          <year>2016</year>
          <month>04</month>
          <volume>95</volume>
          <issue>15</issue>
          <fpage>e3371</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1097/MD.0000000000003371"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/MD.0000000000003371</pub-id>
          <pub-id pub-id-type="medline">27082601</pub-id>
          <pub-id pub-id-type="pii">00005792-201604120-00064</pub-id>
          <pub-id pub-id-type="pmcid">PMC4839845</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sato</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Shibata</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Inoue</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Igarashi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Tokairin</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Yamauchi</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kimura</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Nemoto</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Sato</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Nakano</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Machida</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Nishiwaki</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kobayashi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Minegishi</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Furuyama</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Yamamoto</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Watanabe</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Konta</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ueno</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Kato</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Kayama</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Kubota</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Impact of cigarette smoking on decline in forced expiratory volume in 1s relative to severity of airflow obstruction in a Japanese general population: The Yamagata-Takahata study</article-title>
          <source>Respir Investig</source>
          <year>2018</year>
          <month>03</month>
          <volume>56</volume>
          <issue>2</issue>
          <fpage>120</fpage>
          <lpage>127</lpage>
          <pub-id pub-id-type="doi">10.1016/j.resinv.2017.11.011</pub-id>
          <pub-id pub-id-type="medline">29548649</pub-id>
          <pub-id pub-id-type="pii">S2212-5345(17)30157-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jordan</surname>
              <given-names>RE</given-names>
            </name>
            <name name-style="western">
              <surname>Adab</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Sitch</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Enocson</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Blissett</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Jowett</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Marsh</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Riley</surname>
              <given-names>RD</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Cooper</surname>
              <given-names>BG</given-names>
            </name>
            <name name-style="western">
              <surname>Turner</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Jolly</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Ayres</surname>
              <given-names>JG</given-names>
            </name>
            <name name-style="western">
              <surname>Haroon</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Stockley</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Greenfield</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Siebert</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Daley</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Cheng</surname>
              <given-names>KK</given-names>
            </name>
            <name name-style="western">
              <surname>Fitzmaurice</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Targeted case finding for chronic obstructive pulmonary disease versus routine practice in primary care (TargetCOPD): a cluster-randomised controlled trial</article-title>
          <source>The Lancet Respiratory Medicine</source>
          <year>2016</year>
          <month>09</month>
          <volume>4</volume>
          <issue>9</issue>
          <fpage>720</fpage>
          <lpage>730</lpage>
          <pub-id pub-id-type="doi">10.1016/S2213-2600(16)30149-7</pub-id>
          <pub-id pub-id-type="medline">27444687</pub-id>
          <pub-id pub-id-type="pii">S2213-2600(16)30149-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Young</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Bragman</surname>
              <given-names>FJS</given-names>
            </name>
            <name name-style="western">
              <surname>Rangelov</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Han</surname>
              <given-names>MK</given-names>
            </name>
            <name name-style="western">
              <surname>Galbán</surname>
              <given-names>CJ</given-names>
            </name>
            <name name-style="western">
              <surname>Lynch</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Hawkes</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Alexander</surname>
              <given-names>DC</given-names>
            </name>
            <name name-style="western">
              <surname>Hurst</surname>
              <given-names>JR</given-names>
            </name>
            <collab>COPDGene Investigators</collab>
          </person-group>
          <article-title>Disease Progression Modeling in Chronic Obstructive Pulmonary Disease</article-title>
          <source>Am J Respir Crit Care Med</source>
          <year>2020</year>
          <month>02</month>
          <day>01</day>
          <volume>201</volume>
          <issue>3</issue>
          <fpage>294</fpage>
          <lpage>302</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/31657634"/>
          </comment>
          <pub-id pub-id-type="doi">10.1164/rccm.201908-1600OC</pub-id>
          <pub-id pub-id-type="medline">31657634</pub-id>
          <pub-id pub-id-type="pmcid">PMC6999095</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Collins</surname>
              <given-names>GS</given-names>
            </name>
            <name name-style="western">
              <surname>Reitsma</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Altman</surname>
              <given-names>DG</given-names>
            </name>
            <name name-style="western">
              <surname>Moons</surname>
              <given-names>KG</given-names>
            </name>
          </person-group>
          <article-title>Transparent Reporting of a multivariable prediction model for Individual Prognosis or Diagnosis (TRIPOD): the TRIPOD statement</article-title>
          <source>Ann Intern Med</source>
          <year>2015</year>
          <month>01</month>
          <day>06</day>
          <volume>162</volume>
          <issue>1</issue>
          <fpage>55</fpage>
          <lpage>63</lpage>
          <pub-id pub-id-type="doi">10.7326/M14-0697</pub-id>
          <pub-id pub-id-type="medline">25560714</pub-id>
          <pub-id pub-id-type="pii">2088549</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sugiyama</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Tomata</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Takemi</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Tsushita</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Nakamura</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hashimoto</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Miyachi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Yamagata</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Yokoyama</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Tsuji</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Awareness and health consciousness regarding the national health plan "Health Japan 21" (2nd edition) among the Japanese population in 2013 and 2014</article-title>
          <source>Nihon Koshu Eisei Zasshi</source>
          <year>2016</year>
          <volume>63</volume>
          <issue>8</issue>
          <fpage>424</fpage>
          <lpage>31</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.doi.org/10.11236/jph.63.8_424"/>
          </comment>
          <pub-id pub-id-type="doi">10.11236/jph.63.8_424</pub-id>
          <pub-id pub-id-type="medline">27681283</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Terzikhan</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Verhamme</surname>
              <given-names>KMC</given-names>
            </name>
            <name name-style="western">
              <surname>Hofman</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Stricker</surname>
              <given-names>BH</given-names>
            </name>
            <name name-style="western">
              <surname>Brusselle</surname>
              <given-names>GG</given-names>
            </name>
            <name name-style="western">
              <surname>Lahousse</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Prevalence and incidence of COPD in smokers and non-smokers: the Rotterdam Study</article-title>
          <source>Eur J Epidemiol</source>
          <year>2016</year>
          <month>08</month>
          <volume>31</volume>
          <issue>8</issue>
          <fpage>785</fpage>
          <lpage>92</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/26946425"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s10654-016-0132-z</pub-id>
          <pub-id pub-id-type="medline">26946425</pub-id>
          <pub-id pub-id-type="pii">10.1007/s10654-016-0132-z</pub-id>
          <pub-id pub-id-type="pmcid">PMC5005388</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Hankinson</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Brusasco</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Burgos</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Casaburi</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Coates</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Crapo</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Enright</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>van der Grinten</surname>
              <given-names>CPM</given-names>
            </name>
            <name name-style="western">
              <surname>Gustafsson</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Jensen</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>DC</given-names>
            </name>
            <name name-style="western">
              <surname>MacIntyre</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>McKay</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Navajas</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Pedersen</surname>
              <given-names>OF</given-names>
            </name>
            <name name-style="western">
              <surname>Pellegrino</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Viegi</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Wanger</surname>
              <given-names>J</given-names>
            </name>
            <collab>ATS/ERS Task Force</collab>
          </person-group>
          <article-title>Standardisation of spirometry</article-title>
          <source>Eur Respir J</source>
          <year>2005</year>
          <month>08</month>
          <volume>26</volume>
          <issue>2</issue>
          <fpage>319</fpage>
          <lpage>38</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://erj.ersjournals.com/cgi/pmidlookup?view=long&#38;pmid=16055882"/>
          </comment>
          <pub-id pub-id-type="doi">10.1183/09031936.05.00034805</pub-id>
          <pub-id pub-id-type="medline">16055882</pub-id>
          <pub-id pub-id-type="pii">26/2/319</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Celli</surname>
              <given-names>BR</given-names>
            </name>
            <name name-style="western">
              <surname>MacNee</surname>
              <given-names>W</given-names>
            </name>
            <collab>ATS/ERS Task Force</collab>
          </person-group>
          <article-title>Standards for the diagnosis and treatment of patients with COPD: a summary of the ATS/ERS position paper</article-title>
          <source>Eur Respir J</source>
          <year>2004</year>
          <month>06</month>
          <volume>23</volume>
          <issue>6</issue>
          <fpage>932</fpage>
          <lpage>46</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://erj.ersjournals.com/cgi/pmidlookup?view=long&#38;pmid=15219010"/>
          </comment>
          <pub-id pub-id-type="doi">10.1183/09031936.04.00014304</pub-id>
          <pub-id pub-id-type="medline">15219010</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Guestrin</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>XGBoost : A Scalable Tree Boosting System</article-title>
          <source>KDD '16: Proceedings of the 22nd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining</source>
          <year>2016</year>
          <conf-name>22nd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining</conf-name>
          <conf-date>August 13-17, 2016</conf-date>
          <conf-loc>San Francisco, CA</conf-loc>
          <fpage>785</fpage>
          <lpage>794</lpage>
          <pub-id pub-id-type="doi">10.1145/2939672.2939785</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tibshirani</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Bien</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Friedman</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hastie</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Simon</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Taylor</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Tibshirani</surname>
              <given-names>RJ</given-names>
            </name>
          </person-group>
          <article-title>Strong rules for discarding predictors in lasso-type problems</article-title>
          <source>J R Stat Soc Series B Stat Methodol</source>
          <year>2012</year>
          <month>03</month>
          <volume>74</volume>
          <issue>2</issue>
          <fpage>245</fpage>
          <lpage>266</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/25506256"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/j.1467-9868.2011.01004.x</pub-id>
          <pub-id pub-id-type="medline">25506256</pub-id>
          <pub-id pub-id-type="pmcid">PMC4262615</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>James</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Witten</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Hastie</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Tibshirani</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Introduction</article-title>
          <source>An Introduction to Statistical Learning. Springer Texts in Statistics, vol 103</source>
          <year>2013</year>
          <publisher-loc>New York, USA</publisher-loc>
          <publisher-name>Springer</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>DeLong</surname>
              <given-names>ER</given-names>
            </name>
            <name name-style="western">
              <surname>DeLong</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Clarke-Pearson</surname>
              <given-names>DL</given-names>
            </name>
          </person-group>
          <article-title>Comparing the areas under two or more correlated receiver operating characteristic curves: a nonparametric approach</article-title>
          <source>Biometrics</source>
          <year>1988</year>
          <month>09</month>
          <volume>44</volume>
          <issue>3</issue>
          <fpage>837</fpage>
          <lpage>45</lpage>
          <pub-id pub-id-type="medline">3203132</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Martinez</surname>
              <given-names>FJ</given-names>
            </name>
            <name name-style="western">
              <surname>Han</surname>
              <given-names>MK</given-names>
            </name>
            <name name-style="western">
              <surname>Allinson</surname>
              <given-names>JP</given-names>
            </name>
            <name name-style="western">
              <surname>Barr</surname>
              <given-names>RG</given-names>
            </name>
            <name name-style="western">
              <surname>Boucher</surname>
              <given-names>RC</given-names>
            </name>
            <name name-style="western">
              <surname>Calverley</surname>
              <given-names>PMA</given-names>
            </name>
            <name name-style="western">
              <surname>Celli</surname>
              <given-names>BR</given-names>
            </name>
            <name name-style="western">
              <surname>Christenson</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Crystal</surname>
              <given-names>RG</given-names>
            </name>
            <name name-style="western">
              <surname>Fagerås</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Freeman</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Groenke</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Hoffman</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Kesimer</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kostikas</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Paine</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Rafii</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Rennard</surname>
              <given-names>SI</given-names>
            </name>
            <name name-style="western">
              <surname>Segal</surname>
              <given-names>LN</given-names>
            </name>
            <name name-style="western">
              <surname>Shaykhiev</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Stevenson</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Tal-Singer</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Vestbo</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Woodruff</surname>
              <given-names>PG</given-names>
            </name>
            <name name-style="western">
              <surname>Curtis</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Wedzicha</surname>
              <given-names>JA</given-names>
            </name>
          </person-group>
          <article-title>At the Root: Defining and Halting Progression of Early Chronic Obstructive Pulmonary Disease</article-title>
          <source>Am J Respir Crit Care Med</source>
          <year>2018</year>
          <month>06</month>
          <day>15</day>
          <volume>197</volume>
          <issue>12</issue>
          <fpage>1540</fpage>
          <lpage>1551</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29406779"/>
          </comment>
          <pub-id pub-id-type="doi">10.1164/rccm.201710-2028PP</pub-id>
          <pub-id pub-id-type="medline">29406779</pub-id>
          <pub-id pub-id-type="pmcid">PMC6006401</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bai</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Smoking cessation affects the natural history of COPD</article-title>
          <source>Int J Chron Obstruct Pulmon Dis</source>
          <year>2017</year>
          <volume>12</volume>
          <fpage>3323</fpage>
          <lpage>3328</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.doi.org/10.2147/COPD.S150243"/>
          </comment>
          <pub-id pub-id-type="doi">10.2147/COPD.S150243</pub-id>
          <pub-id pub-id-type="medline">29180862</pub-id>
          <pub-id pub-id-type="pii">copd-12-3323</pub-id>
          <pub-id pub-id-type="pmcid">PMC5695262</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Malenica</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Prnjavorac</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Bego</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Dujic</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Semiz</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Skrbo</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Gusic</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hadzic</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Causevic</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Effect of Cigarette Smoking on Haematological Parameters in Healthy Population</article-title>
          <source>Med Arch</source>
          <year>2017</year>
          <month>04</month>
          <volume>71</volume>
          <issue>2</issue>
          <fpage>132</fpage>
          <lpage>136</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/28790546"/>
          </comment>
          <pub-id pub-id-type="doi">10.5455/medarh.2017.71.132-136</pub-id>
          <pub-id pub-id-type="medline">28790546</pub-id>
          <pub-id pub-id-type="pii">MA-71-132</pub-id>
          <pub-id pub-id-type="pmcid">PMC5511531</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Eriksson</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Lindberg</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Müllerova</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Rönmark</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Lundbäck</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Association of heart diseases with COPD and restrictive lung function--results from a population survey</article-title>
          <source>Respir Med</source>
          <year>2013</year>
          <month>01</month>
          <volume>107</volume>
          <issue>1</issue>
          <fpage>98</fpage>
          <lpage>106</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0954-6111(12)00352-6"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.rmed.2012.09.011</pub-id>
          <pub-id pub-id-type="medline">23127573</pub-id>
          <pub-id pub-id-type="pii">S0954-6111(12)00352-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bui</surname>
              <given-names>DS</given-names>
            </name>
            <name name-style="western">
              <surname>Lodge</surname>
              <given-names>CJ</given-names>
            </name>
            <name name-style="western">
              <surname>Burgess</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Lowe</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Perret</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bui</surname>
              <given-names>MQ</given-names>
            </name>
            <name name-style="western">
              <surname>Bowatte</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Gurrin</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Johns</surname>
              <given-names>DP</given-names>
            </name>
            <name name-style="western">
              <surname>Thompson</surname>
              <given-names>BR</given-names>
            </name>
            <name name-style="western">
              <surname>Hamilton</surname>
              <given-names>GS</given-names>
            </name>
            <name name-style="western">
              <surname>Frith</surname>
              <given-names>PA</given-names>
            </name>
            <name name-style="western">
              <surname>James</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Thomas</surname>
              <given-names>PS</given-names>
            </name>
            <name name-style="western">
              <surname>Jarvis</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Svanes</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Russell</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Morrison</surname>
              <given-names>SC</given-names>
            </name>
            <name name-style="western">
              <surname>Feather</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Allen</surname>
              <given-names>KJ</given-names>
            </name>
            <name name-style="western">
              <surname>Wood-Baker</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Hopper</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Giles</surname>
              <given-names>GG</given-names>
            </name>
            <name name-style="western">
              <surname>Abramson</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Walters</surname>
              <given-names>EH</given-names>
            </name>
            <name name-style="western">
              <surname>Matheson</surname>
              <given-names>MC</given-names>
            </name>
            <name name-style="western">
              <surname>Dharmage</surname>
              <given-names>SC</given-names>
            </name>
          </person-group>
          <article-title>Childhood predictors of lung function trajectories and future COPD risk: a prospective cohort study from the first to the sixth decade of life</article-title>
          <source>Lancet Respir Med</source>
          <year>2018</year>
          <month>07</month>
          <volume>6</volume>
          <issue>7</issue>
          <fpage>535</fpage>
          <lpage>544</lpage>
          <pub-id pub-id-type="doi">10.1016/S2213-2600(18)30100-0</pub-id>
          <pub-id pub-id-type="medline">29628376</pub-id>
          <pub-id pub-id-type="pii">S2213-2600(18)30100-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Suzuki</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Makita</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Konno</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Shimizu</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kimura</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Kimura</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Nishimura</surname>
              <given-names>M</given-names>
            </name>
            <collab>Hokkaido COPD Cohort Study Investigators</collab>
          </person-group>
          <article-title>Asthma-like Features and Clinical Course of Chronic Obstructive Pulmonary Disease. An Analysis from the Hokkaido COPD Cohort Study</article-title>
          <source>Am J Respir Crit Care Med</source>
          <year>2016</year>
          <month>12</month>
          <day>01</day>
          <volume>194</volume>
          <issue>11</issue>
          <fpage>1358</fpage>
          <lpage>1365</lpage>
          <pub-id pub-id-type="doi">10.1164/rccm.201602-0353OC</pub-id>
          <pub-id pub-id-type="medline">27224255</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>von Haehling</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Anker</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Anker</surname>
              <given-names>SD</given-names>
            </name>
          </person-group>
          <article-title>Prevalence and clinical impact of cachexia in chronic illness in Europe, USA, and Japan: facts and numbers update 2016</article-title>
          <source>J Cachexia Sarcopenia Muscle</source>
          <year>2016</year>
          <month>12</month>
          <volume>7</volume>
          <issue>5</issue>
          <fpage>507</fpage>
          <lpage>509</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1002/jcsm.12167"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/jcsm.12167</pub-id>
          <pub-id pub-id-type="medline">27891294</pub-id>
          <pub-id pub-id-type="pii">JCSM12167</pub-id>
          <pub-id pub-id-type="pmcid">PMC5114624</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Cheng</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hsu</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>The association between airflow limitation and blood eosinophil levels with treatment outcomes in patients with chronic obstructive pulmonary disease and prolonged mechanical ventilation</article-title>
          <source>Sci Rep</source>
          <year>2019</year>
          <month>09</month>
          <day>17</day>
          <volume>9</volume>
          <issue>1</issue>
          <fpage>13420</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41598-019-49918-z"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-019-49918-z</pub-id>
          <pub-id pub-id-type="medline">31530874</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-019-49918-z</pub-id>
          <pub-id pub-id-type="pmcid">PMC6748958</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chin</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Nakamura</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Takahashi</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Sumi</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Ogawa</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Masuzaki</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Muro</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hattori</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Matsumoto</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Niimi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Chiba</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Nakao</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Mishima</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ohi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Nakamura</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Effects of obstructive sleep apnea syndrome on serum aminotransferase levels in obese patients</article-title>
          <source>Am J Med</source>
          <year>2003</year>
          <month>04</month>
          <day>01</day>
          <volume>114</volume>
          <issue>5</issue>
          <fpage>370</fpage>
          <lpage>6</lpage>
          <pub-id pub-id-type="doi">10.1016/s0002-9343(02)01570-x</pub-id>
          <pub-id pub-id-type="medline">12714126</pub-id>
          <pub-id pub-id-type="pii">S000293430201570X</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>de Miguel-Díez</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>López-de-Andrés</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hernandez-Barrera</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Jimenez-Trujillo</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Del Barrio</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Puente-Maestu</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Martinez-Huedo</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Jimenez-García</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Prevalence of Pain in COPD Patients and Associated Factors: Report From a Population-based Study</article-title>
          <source>Clin J Pain</source>
          <year>2018</year>
          <month>09</month>
          <volume>34</volume>
          <issue>9</issue>
          <fpage>787</fpage>
          <lpage>794</lpage>
          <pub-id pub-id-type="doi">10.1097/AJP.0000000000000598</pub-id>
          <pub-id pub-id-type="medline">29485534</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Biljak</surname>
              <given-names>VR</given-names>
            </name>
            <name name-style="western">
              <surname>Pancirov</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Cepelak</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Popović-Grle</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Stjepanović</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Grubišić</surname>
              <given-names>TŽ</given-names>
            </name>
          </person-group>
          <article-title>Platelet count, mean platelet volume and smoking status in stable chronic obstructive pulmonary disease</article-title>
          <source>Platelets</source>
          <year>2011</year>
          <volume>22</volume>
          <issue>6</issue>
          <fpage>466</fpage>
          <lpage>70</lpage>
          <pub-id pub-id-type="doi">10.3109/09537104.2011.573887</pub-id>
          <pub-id pub-id-type="medline">21506665</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Agustí</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Edwards</surname>
              <given-names>LD</given-names>
            </name>
            <name name-style="western">
              <surname>Rennard</surname>
              <given-names>SI</given-names>
            </name>
            <name name-style="western">
              <surname>MacNee</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Tal-Singer</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>BE</given-names>
            </name>
            <name name-style="western">
              <surname>Vestbo</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lomas</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Calverley</surname>
              <given-names>PMA</given-names>
            </name>
            <name name-style="western">
              <surname>Wouters</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Crim</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Yates</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Silverman</surname>
              <given-names>EK</given-names>
            </name>
            <name name-style="western">
              <surname>Coxson</surname>
              <given-names>HO</given-names>
            </name>
            <name name-style="western">
              <surname>Bakke</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Mayer</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Celli</surname>
              <given-names>B</given-names>
            </name>
            <collab>Evaluation of COPD Longitudinally to Identify Predictive Surrogate Endpoints (ECLIPSE) Investigators</collab>
          </person-group>
          <article-title>Persistent systemic inflammation is associated with poor clinical outcomes in COPD: a novel phenotype</article-title>
          <source>PLoS One</source>
          <year>2012</year>
          <volume>7</volume>
          <issue>5</issue>
          <fpage>e37483</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0037483"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0037483</pub-id>
          <pub-id pub-id-type="medline">22624038</pub-id>
          <pub-id pub-id-type="pii">PONE-D-12-05051</pub-id>
          <pub-id pub-id-type="pmcid">PMC3356313</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Samukawa</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Matsumoto</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Tsukuya</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Koriyama</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Fukuyama</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Uchida</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mizuno</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Miyahara</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Kiyohara</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Ninomiya</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Inoue</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Development of a self-scored persistent airflow obstruction screening questionnaire in a general Japanese population: the Hisayama study</article-title>
          <source>Int J Chron Obstruct Pulmon Dis</source>
          <year>2017</year>
          <volume>12</volume>
          <fpage>1469</fpage>
          <lpage>1481</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.doi.org/10.2147/COPD.S130453"/>
          </comment>
          <pub-id pub-id-type="doi">10.2147/COPD.S130453</pub-id>
          <pub-id pub-id-type="medline">28553099</pub-id>
          <pub-id pub-id-type="pii">copd-12-1469</pub-id>
          <pub-id pub-id-type="pmcid">PMC5439935</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kuhn</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Egert</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Neumann</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Steinbeck</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Building blocks for automated elucidation of metabolites: machine learning methods for NMR prediction</article-title>
          <source>BMC Bioinformatics</source>
          <year>2008</year>
          <month>09</month>
          <day>25</day>
          <volume>9</volume>
          <fpage>400</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcbioinformatics.biomedcentral.com/articles/10.1186/1471-2105-9-400"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1471-2105-9-400</pub-id>
          <pub-id pub-id-type="medline">18817546</pub-id>
          <pub-id pub-id-type="pii">1471-2105-9-400</pub-id>
          <pub-id pub-id-type="pmcid">PMC2605476</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Akkermans</surname>
              <given-names>RP</given-names>
            </name>
            <name name-style="western">
              <surname>Biermans</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Robberts</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>ter Riet</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Jacobs</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>van Weel</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wensing</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Schermer</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>COPD prognosis in relation to diagnostic criteria for airflow obstruction in smokers</article-title>
          <source>Eur Respir J</source>
          <year>2014</year>
          <month>01</month>
          <volume>43</volume>
          <issue>1</issue>
          <fpage>54</fpage>
          <lpage>63</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://erj.ersjournals.com/cgi/pmidlookup?view=long&#38;pmid=23563262"/>
          </comment>
          <pub-id pub-id-type="doi">10.1183/09031936.00158212</pub-id>
          <pub-id pub-id-type="medline">23563262</pub-id>
          <pub-id pub-id-type="pii">09031936.00158212</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
