<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id>
      <journal-title>JMIR Medical Informatics</journal-title>
      <issn pub-type="epub">2291-9694</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v10i4e34274</article-id>
      <article-id pub-id-type="pmid">35377334</article-id>
      <article-id pub-id-type="doi">10.2196/34274</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Exploring Patient Multimorbidity and Complexity Using Health Insurance Claims Data: A Cluster Analysis Approach</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Lovis</surname>
            <given-names>Christian</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Zhang</surname>
            <given-names>Wenhui</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Ioakeim-Skoufa</surname>
            <given-names>Ignatios</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes" equal-contrib="yes">
          <name name-style="western">
            <surname>Nicolet</surname>
            <given-names>Anna</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Center for Primary Care and Public Health (Unisanté)</institution>
            <institution>University of Lausanne</institution>
            <addr-line>Route de la Corniche</addr-line>
            <addr-line>Lausanne, 1010</addr-line>
            <country>Switzerland</country>
            <phone>41 21 314 23 4</phone>
            <email>anna.nicolet@unisante.ch</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9125-1697</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Assouline</surname>
            <given-names>Dan</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2394-6571</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Le Pogam</surname>
            <given-names>Marie-Annick</given-names>
          </name>
          <degrees>MD, MPH</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-1672-3644</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Perraudin</surname>
            <given-names>Clémence</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-3533-2764</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Bagnoud</surname>
            <given-names>Christophe</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6427-8031</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Wagner</surname>
            <given-names>Joël</given-names>
          </name>
          <degrees>PhD, Prof Dr</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-3712-5494</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Marti</surname>
            <given-names>Joachim</given-names>
          </name>
          <degrees>PhD, Prof Dr</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-5763-3704</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Peytremann-Bridevaux</surname>
            <given-names>Isabelle</given-names>
          </name>
          <degrees>MD, MPH, DSc, Prof Dr</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6514-8781</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Center for Primary Care and Public Health (Unisanté)</institution>
        <institution>University of Lausanne</institution>
        <addr-line>Lausanne</addr-line>
        <country>Switzerland</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Groupe Mutuel</institution>
        <addr-line>Martigny</addr-line>
        <country>Switzerland</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Department of Actuarial Science</institution>
        <institution>Faculty of Business and Economics, and Swiss Finance Institute</institution>
        <institution>University of Lausanne</institution>
        <addr-line>Lausanne</addr-line>
        <country>Switzerland</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Anna Nicolet <email>anna.nicolet@unisante.ch</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>4</month>
        <year>2022</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>4</day>
        <month>4</month>
        <year>2022</year>
      </pub-date>
      <volume>10</volume>
      <issue>4</issue>
      <elocation-id>e34274</elocation-id>
      <history>
        <date date-type="received">
          <day>14</day>
          <month>10</month>
          <year>2021</year>
        </date>
        <date date-type="rev-request">
          <day>20</day>
          <month>12</month>
          <year>2021</year>
        </date>
        <date date-type="rev-recd">
          <day>4</day>
          <month>2</month>
          <year>2022</year>
        </date>
        <date date-type="accepted">
          <day>6</day>
          <month>2</month>
          <year>2022</year>
        </date>
      </history>
      <copyright-statement>©Anna Nicolet, Dan Assouline, Marie-Annick Le Pogam, Clémence Perraudin, Christophe Bagnoud, Joël Wagner, Joachim Marti, Isabelle Peytremann-Bridevaux. Originally published in JMIR Medical Informatics (https://medinform.jmir.org), 04.04.2022.</copyright-statement>
      <copyright-year>2022</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on https://medinform.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://medinform.jmir.org/2022/4/e34274" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Although the trend of progressing morbidity is widely recognized, there are numerous challenges when studying multimorbidity and patient complexity. For multimorbid or complex patients, prone to fragmented care and high health care use, novel estimation approaches need to be developed.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study aims to investigate the patient multimorbidity and complexity of Swiss residents aged ≥50 years using clustering methodology in claims data.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We adopted a clustering methodology based on random forests and used 34 pharmacy-based cost groups as the only input feature for the procedure. To detect clusters, we applied hierarchical density-based spatial clustering of applications with noise. The reasonable hyperparameters were chosen based on various metrics embedded in the algorithms (out-of-bag misclassification error, normalized stress, and cluster persistence) and the clinical relevance of the obtained clusters.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Based on cluster analysis output for 18,732 individuals, we identified an outlier group and 7 clusters: individuals without diseases, patients with only hypertension-related diseases, patients with only mental diseases, complex high-cost high-need patients, slightly complex patients with inexpensive low-severity pharmacy-based cost groups, patients with 1 costly disease, and older high-risk patients.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Our study demonstrated that cluster analysis based on pharmacy-based cost group information from claims-based data is feasible and highlights clinically relevant clusters. Such an approach allows expanding the understanding of multimorbidity beyond simple disease counts and can identify the population profiles with increased health care use and costs. This study may foster the development of integrated and coordinated care, which is high on the agenda in policy making, care planning, and delivery.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>multimorbidity</kwd>
        <kwd>pharmacy cost groups</kwd>
        <kwd>cluster analysis</kwd>
        <kwd>claims data</kwd>
        <kwd>patient complexity</kwd>
        <kwd>health claims</kwd>
        <kwd>informatics</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Health care systems worldwide are facing considerable challenges from the increasing number of chronic and multimorbid patients, characterized by complex needs and frequent transitions between care settings [<xref ref-type="bibr" rid="ref1">1</xref>]. In Switzerland, 2.2 million people report a chronic disease and nearly 20% of the population older than 50 years have multiple chronic diseases (multimorbidity) [<xref ref-type="bibr" rid="ref2">2</xref>]. Although the trend of progressing multimorbidity is widely recognized [<xref ref-type="bibr" rid="ref3">3</xref>-<xref ref-type="bibr" rid="ref6">6</xref>], it is still unclear how best to take care of patients with multimorbidity and which interventions would be effective. For more than two decades, integrated and coordinated care have been developed worldwide [<xref ref-type="bibr" rid="ref7">7</xref>]. Nevertheless, integrated and coordinated care faces continuing challenges such as scaling-up, implementation, and sustainability difficulties. Additionally, integrated and coordinated care requires development of novel approaches to evaluate and measure patients multimorbidity and complexity. This is key to stratify the targeted population and adapt the intervention to the needs of the patients. Often, such evaluations and measures rely on morbidity indices (eg, Charlson and Elixhauser) or on the number of (self-reported) chronic conditions or comorbidities [<xref ref-type="bibr" rid="ref8">8</xref>]. Whereas the former were developed in an inpatient setting as predictors of mortality, the latter may not comprehensively reflect the patient’s disease burden and complexity. Despite these limitations, they remain often used because of their relative accessibility and simplicity. In settings where electronic medical (health) records, national disease registries, or data on chronic conditions are unavailable, administrative health insurance claims data represent a potentially useful source of information. In fact, they are increasingly used in health services research, especially to express multimorbidity using pharmacy-based cost groups (PCGs) [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>]. PCGs, based on use of prescribed drugs rather than on clinical information, were developed as a proxy for morbidity measure [<xref ref-type="bibr" rid="ref11">11</xref>]. Although the approach has limitations related to underestimation of medicines used, unclaimed, or paid out-of-pocket and thus not present in the data or the assumption that the drug is used exclusively for treating the particular condition [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref12">12</xref>], it allows mapping patient profiles to reflect their morbidity status. As such mapping approaches and comorbidity counts are considered simplistic [<xref ref-type="bibr" rid="ref13">13</xref>], researchers may consider alternative methods to investigate patient complexity more exhaustively. One such method is cluster analysis, which relies on the idea that many common conditions cluster together in the population in predictable patterns [<xref ref-type="bibr" rid="ref13">13</xref>]. It has been shown that cluster analysis of real-world data for drug use research can be used for detecting clinically plausible subgroups [<xref ref-type="bibr" rid="ref14">14</xref>]. Similar approaches of classifications based on multimorbidity patterns have been applied in the literature [<xref ref-type="bibr" rid="ref14">14</xref>-<xref ref-type="bibr" rid="ref16">16</xref>], but using PCGs as the multimorbidity indicator for cluster analysis is novel. In that context, the aim of our study is to investigate patient multimorbidity and complexity beyond simple mapping and counts of PCGs, using clustering methodology in claims data of Swiss residents aged ≥50 years.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Data Source and Sample</title>
        <p>We included data of 240,511 insured people aged ≥50 years continuously enrolled in one of the largest health insurance companies in Switzerland, Groupe Mutuel, for the 2015-2018 period. In addition to demographic information (age and gender), data contained PCGs for each individual, costs covered by the patient (cost sharing), type of health insurance model (with or without gatekeeping), and reimbursed health care services: number of visits to various physicians with associated costs and physicians’ specialization and hospitalizations. To identify insured persons with cost-intensive, chronic diseases and correspondingly high health care use based on their drug consumption, health insurance companies are translating the drug use data reflecting active ingredient and quantity, based on Anatomical Therapeutic Chemical and defined daily dose, into the PCGs. This procedure was developed and officially accepted by the Federal Office of Public Health in Switzerland [<xref ref-type="bibr" rid="ref17">17</xref>]. In our study, the patients were classified as multimorbid when they were assigned two or more PCGs, based on their yearly drug use.</p>
      </sec>
      <sec>
        <title>Ethical Considerations</title>
        <p>Data were deidentified by the insurance company to guarantee anonymization, and ethical approval for this study was waived by the Cantonal Commission for the Ethics of Research on Human Beings (Lausanne, Switzerland).</p>
      </sec>
      <sec>
        <title>Cluster Analysis</title>
        <p>We adopted a clustering methodology based on random forests (RFs) [<xref ref-type="bibr" rid="ref18">18</xref>]—a popular classification and regression tree-based method—that includes several steps and machine learning algorithms [<xref ref-type="bibr" rid="ref19">19</xref>-<xref ref-type="bibr" rid="ref21">21</xref>]. The methodology is inspired by a clustering methodology designed by Breiman and Cutler [<xref ref-type="bibr" rid="ref19">19</xref>], the creators of RFs [<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref21">21</xref>].</p>
        <p>In a preprocessing step, we extracted 34 PCGs as the only input feature for the clustering procedure. We grouped the 34 PCGs into 15 disease categories, which were valued meaningful from a clinical perspective (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). We then considered the first year of information only, and extracted a 10% random sample, to allow for effective processing for the computationally expensive steps. To confirm the results, the random sampling was performed multiple times, which led to similar clusters. Finally, we discarded points showing no PCG or only one type of PCG. Since we ultimately use an algorithm to detect clusters based on density given by the distances between points, the presence of many identical points at the same positions may perturb the algorithm and unnecessarily make the computation more expensive. Keeping a small random sample of these points would reduce the perturbation but not change the results while adding a dispensable complication, notably for the hyperparameter selection needed to detect these additional clusters.</p>
        <p>To initiate the clustering procedure, we created a synthetic data set of the same size as the original data, by random sampling from the distributions of each input variable within the data. The idea is then to train an RF model to classify synthetic and original points, with the aim of taking advantage of the <italic>proximity</italic> measure, an embedded RF metric of similarity between points. An RF aggregates the prediction of multiple decision trees (DTs) by considering the class they predict in majority. DTs are classification models that separate the data points into subspaces (leaves) by imposing thresholds on the input variables and predicting the class within each subspace as the majority class. The proximity between two points is then computed as the number of times they fall in the same leaf across the trees in the forest. To stabilize the random effects of RFs, we trained 10 RF models, computed the proximities for all pairs of points for each model, and averaged them to obtain a mean proximity matrix characterizing the data. We then used multidimensional scaling (MDS) [<xref ref-type="bibr" rid="ref22">22</xref>] to project the corresponding distance matrix (1 – proximity matrix / (number of trees)) in 2D while preserving the distances and allow for visualization of the resulting clusters. Finally, we applied hierarchical density-based spatial clustering of applications with noise (HDBSCAN) [<xref ref-type="bibr" rid="ref23">23</xref>] to detect clusters within the obtained 2D data, after discarding the synthetic points from the data. HDBSCAN extracts clusters as dense gatherings of points separated by sparse regions with few points. Given that no cross-validation is possible with clustering methodologies, reasonable hyperparameters were chosen for the RF, MDS, and HDBSCAN steps based on various metrics embedded in the algorithms and the clinical relevance of the obtained clusters. The metrics includes the <italic>out-of-bag</italic> (<italic>OOB</italic>) misclassification error, which shows how well RF differentiates the original data from the synthetic one. The outcome reflects how much structure there is in the data [<xref ref-type="bibr" rid="ref19">19</xref>]. Another metric was <italic>normalized stress</italic>, measuring whether the distances between points are reasonably preserved after projection [<xref ref-type="bibr" rid="ref22">22</xref>], and the <italic>cluster persistence</italic>, HDBSCAN embedded metrics indicating how well the clusters are defined and separated from each other [<xref ref-type="bibr" rid="ref23">23</xref>]. In practice, we used the HDBSCAN and Scikit-learn libraries (in Python) for the final clustering and all previous steps.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <p>After discarding individuals with missing information, our data set comprised 18,732 individuals (<italic>points</italic>). An initial examination of the data set exhibited three large “single” clusters that we extracted prior to the clustering procedure, showing no PCGs, only hypertension PCGs, and only mental disease PCGs, representing 67.9% (n=12,720), 9.7% (n=1813), and 4.1% (n=765) of the population, respectively. Clustering analyses, performed on the remaining 3434 patients not included in the latter “single” clusters, identified four distinct clusters: Cluster 0 to Cluster 3, numbered in the order in which they are detected while applying HDBSCAN (<xref rid="figure1" ref-type="fig">Figure 1</xref>). The clusters can be clearly visualized from this tree (<xref rid="figure2" ref-type="fig">Figure 2</xref>); and a good persistence of 0.29, 0.24, 0.15, and 0.24, respectively, was found. The average OOB misclassification error from the 10 RFs was 0.51, which is quite high, showing that RF does not differentiate well between the original and the synthetic data, and there is not much structure in the data. Regarding the performed MDS, the normalized stress was 0.31, indicating reasonable preserving of the distances between points.</p>
      <p>The 4 detected clusters encompass different mixes of PCGs (<xref ref-type="table" rid="table1">Table 1</xref> and <xref rid="figure3" ref-type="fig">Figure 3</xref>): Cluster 0 comprises a large mix of PCGs (mental + hypertension + pain + asthma [chronic obstructive pulmonary disease]) often appearing jointly; Cluster 1 comprises PCGs (thyroid, hypertension, glaucoma, and mix of others) appearing jointly less often; Cluster 2 comprises asthma, Parkinson, cardiac diseases, and pain rarely appearing jointly; and Cluster 3 comprises a large mix of PCGs almost never appearing jointly (single diseases).</p>
      <p>The following description and interpretation of clusters is based on the descriptive statistics of health care use and costs data (<xref ref-type="table" rid="table1">Table 1</xref>), which help to understand the underlying principle of grouping individuals into PCG clusters. First, the members of Cluster 0 (n=817, 4.4%) had the highest number of PCGs and highest costs and health care use, and were referred to as “complex high-cost high-need patients” (for a detailed description, see <xref ref-type="table" rid="table1">Table 1</xref>). The degree of complexity in these settings was reflected as the combination of the following characteristics interpreted from descriptive statistics (<xref ref-type="table" rid="table1">Table 1</xref>): average number of PCGs, percentage of multimorbid patients, levels of health care use (eg, number of doctor consultations and hospital stays), and costs in the population subgroup. The members of Cluster 1 (n=709, 3.8%), although having multiple PCGs, had health care costs and use lower than in Cluster 0; thus, they were referred to as “slightly complex with inexpensive low-severity PCGs.” The members of Cluster 2 (n=531, 2.8%) were of the oldest age and presented especially high use of hospitalizations and visits to the generalist doctor and, thus, were referred to as “oldest at high risk.” High risk, interpreted in these settings from the descriptive statistics, was reflected by relatively high use of hospital care, yet lower than in the most complex cluster: long length of stay (5.6 and 6.6 nights for clusters “Oldest at risk” and “Complex high-cost high-need,” respectively) and high inpatient costs (CHF 2749 [US $2950] and CHF 3109 [US $3333], respectively). The members of Cluster 3 (n=1056, 5.6%) were characterized by a relatively small number of PCGs (close to 1) and the highest costs of medications and, thus, were referred to as “patients with 1 costly disease.”</p>
      <fig id="figure1" position="float">
        <label>Figure 1</label>
        <caption>
          <p>MDS projection of the data in two dimensions. The four clusters found by HDBSCAN are marked by the different colors and coded with the labels 0, 1, 2, and 3. The code –1 refers to the outliers. HDBSCAN: hierarchical density-based spatial clustering of applications with noise; MDS: multidimensional scaling.</p>
        </caption>
        <graphic xlink:href="medinform_v10i4e34274_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
      <fig id="figure2" position="float">
        <label>Figure 2</label>
        <caption>
          <p>Condensed tree resulting from the hierarchical density-based spatial clustering of applications with noise algorithm performed on the data. Note: similar to a classical dendogram in a hierarchical clustering setting, the first yellow rectangle represents the entire data, which is split into two parts (called “branches”) when we reduce the maximum distance allowed between points within each branch (λ value = 1 / distance). Each rectangle represents a subpart of the data after a split and with a size proportional to the number of data points in the subpart. The entire data splits into cluster 0 and the green rectangle, which further splits into cluster 1 and a turquoise rectangle, when we reduce the distance allowed. The 4 detected clusters (signified by a circle and their number) are the branches that persist the most (do not split further, according to various rules of the algorithm) when the imposed maximum distance between points decreases while keeping a minimum size. The persistence is proportional to the length of the rectangles across the vertical axis. The tree can be interpreted as a probability distribution function upside down, with each cluster being a peak in the distribution.</p>
        </caption>
        <graphic xlink:href="medinform_v10i4e34274_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
      <table-wrap position="float" id="table1">
        <label>Table 1</label>
        <caption>
          <p>Descriptive statistics of clusters.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="30"/>
          <col width="120"/>
          <col width="0"/>
          <col width="70"/>
          <col width="0"/>
          <col width="80"/>
          <col width="0"/>
          <col width="100"/>
          <col width="0"/>
          <col width="100"/>
          <col width="0"/>
          <col width="100"/>
          <col width="0"/>
          <col width="110"/>
          <col width="0"/>
          <col width="90"/>
          <col width="0"/>
          <col width="90"/>
          <col width="0"/>
          <col width="110"/>
          <thead>
            <tr valign="top">
              <td colspan="3">Statistics</td>
              <td colspan="2">All data</td>
              <td colspan="2">Outliers</td>
              <td colspan="2">Cluster 0 “Complex high-cost high-need”</td>
              <td colspan="2">Cluster 1 “Slightly complex with inexpensive low-severity PCGs<sup>a</sup>”</td>
              <td colspan="2">Cluster 2 “Oldest at high risk”</td>
              <td colspan="2">Cluster 3 “Patients with 1 costly disease”</td>
              <td colspan="2">No PCGs</td>
              <td colspan="2">Hypertension “Only hypertension”</td>
              <td>Mental health “Only mental diseases”</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td colspan="3">Patients, n (%)</td>
              <td colspan="2">18,732 <break/>(100.0)</td>
              <td colspan="2">321 <break/>(1.7)</td>
              <td colspan="2">817 <break/>(4.4)</td>
              <td colspan="2">709 <break/>(3.8)</td>
              <td colspan="2">531 <break/>(2.8)</td>
              <td colspan="2">1056 <break/>(5.6)</td>
              <td colspan="2">12,720 <break/>(67.9)</td>
              <td colspan="2">1813 <break/>(9.7)</td>
              <td>765 <break/>(4.1)</td>
            </tr>
            <tr valign="top">
              <td colspan="3">Age (years), mean (SD)</td>
              <td colspan="2">65.0 <break/>(10.6)</td>
              <td colspan="2">66.3 <break/>(10.8)</td>
              <td colspan="2">66.3 <break/>(10.6)</td>
              <td colspan="2">67.8 <break/>(10.2)</td>
              <td colspan="2">69.4 <break/>(10.9)</td>
              <td colspan="2">68.1 <break/>(11.2)</td>
              <td colspan="2">64.0 <break/>(10.4)</td>
              <td colspan="2">67.6 <break/>(9.7)</td>
              <td>63.2 <break/>(10.9)</td>
            </tr>
            <tr valign="top">
              <td colspan="20">
                <bold>Sex, n (%)</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Men</td>
              <td colspan="2">8626 <break/>(46)</td>
              <td colspan="2">130 <break/>(40)</td>
              <td colspan="2">325 <break/>(40)</td>
              <td colspan="2">205 <break/>(29)</td>
              <td colspan="2">279 <break/>(53)</td>
              <td colspan="2">536 <break/>(51)</td>
              <td colspan="2">5772 <break/>(45)</td>
              <td colspan="2">1158 <break/>(64)</td>
              <td colspan="2">221 <break/>(29)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Women</td>
              <td colspan="2">10,106 <break/>(54)</td>
              <td colspan="2">191 <break/>(60)</td>
              <td colspan="2">492 <break/>(60)</td>
              <td colspan="2">504 <break/>(71)</td>
              <td colspan="2">252 <break/>(47)</td>
              <td colspan="2">520 <break/>(49)</td>
              <td colspan="2">6948 <break/>(55)</td>
              <td colspan="2">655 <break/>(36)</td>
              <td colspan="2">544 <break/>(71)</td>
            </tr>
            <tr valign="top">
              <td colspan="3">Deductible (CHF; US $), mean</td>
              <td colspan="2">794 <break/>(852)</td>
              <td colspan="2">511 <break/>(548)</td>
              <td colspan="2">448 <break/>(481)</td>
              <td colspan="2">535 <break/>(574)</td>
              <td colspan="2">524 <break/>(562)</td>
              <td colspan="2">562 <break/>(603)</td>
              <td colspan="2">908 <break/>(974)</td>
              <td colspan="2">612 <break/>(657)</td>
              <td>558 <break/>(599)</td>
            </tr>
            <tr valign="top">
              <td colspan="3">Model with <break/>gatekeeper<sup>b</sup></td>
              <td colspan="2">0.5</td>
              <td colspan="2">0.4</td>
              <td colspan="2">0.4</td>
              <td colspan="2">0.4</td>
              <td colspan="2">0.4</td>
              <td colspan="2">0.4</td>
              <td colspan="2">0.5</td>
              <td colspan="2">0.5</td>
              <td>0.5</td>
            </tr>
            <tr valign="top">
              <td colspan="3">Number of PCGs, mean</td>
              <td colspan="2">0.4</td>
              <td colspan="2">1.2</td>
              <td colspan="2">2.1</td>
              <td colspan="2">1.7</td>
              <td colspan="2">1.3</td>
              <td colspan="2">1.1</td>
              <td colspan="2">0.0</td>
              <td colspan="2">1.0</td>
              <td>1.0</td>
            </tr>
            <tr valign="top">
              <td colspan="3">Multimorbid (yes)<sup>b</sup></td>
              <td colspan="2">0.1</td>
              <td colspan="2">0.1</td>
              <td colspan="2">0.8</td>
              <td colspan="2">0.6</td>
              <td colspan="2">0.3</td>
              <td colspan="2">0.1</td>
              <td colspan="2">0.0</td>
              <td colspan="2">0.0</td>
              <td>0.0</td>
            </tr>
            <tr valign="top">
              <td colspan="3">Ambulatory costs (CHF; US $), mean</td>
              <td colspan="2">5395 <break/>(5789)</td>
              <td colspan="2">7967 <break/>(8549)</td>
              <td colspan="2">11,731 <break/>(12,589)</td>
              <td colspan="2">7477 <break/>(8024)</td>
              <td colspan="2">9728 <break/>(10,439)</td>
              <td colspan="2">10,362 <break/>(11,120)</td>
              <td colspan="2">4074 <break/>(4372)</td>
              <td colspan="2">5462 <break/>(5861)</td>
              <td>7571 <break/>(8125)</td>
            </tr>
            <tr valign="top">
              <td colspan="3">Inpatient costs (CHF; US $), mean</td>
              <td colspan="2">1419 <break/>(1523)</td>
              <td colspan="2">2134 <break/>(2290)</td>
              <td colspan="2">3109 <break/>(3336)</td>
              <td colspan="2">1811 <break/>(1943)</td>
              <td colspan="2">2749 <break/>(2950)</td>
              <td colspan="2">1575 <break/>(1690)</td>
              <td colspan="2">1199 <break/>(1287)</td>
              <td colspan="2">1372 <break/>(1472)</td>
              <td>1585 <break/>(1701)</td>
            </tr>
            <tr valign="top">
              <td colspan="3">Costs of medications (CHF; US $), mean</td>
              <td colspan="2">1563 <break/>(1677)</td>
              <td colspan="2">2683 <break/>(2879)</td>
              <td colspan="2">4073 <break/>(4371)</td>
              <td colspan="2">2221 <break/>(2383)</td>
              <td colspan="2">3587 <break/>(3849)</td>
              <td colspan="2">4450 <break/>(4775)</td>
              <td colspan="2">965 <break/>(1036)</td>
              <td colspan="2">1732 <break/>(1859)</td>
              <td>1961 <break/>(2104)</td>
            </tr>
            <tr valign="top">
              <td colspan="3">Total cost (CHF; US $), mean</td>
              <td colspan="2">8929 <break/>(9582)</td>
              <td colspan="2">13,684 <break/>(14,684)</td>
              <td colspan="2">19,950 <break/>(21,409)</td>
              <td colspan="2">12,440 <break/>(13,349)</td>
              <td colspan="2">17,057 <break/>(18,304)</td>
              <td colspan="2">17,312 <break/>(18,578)</td>
              <td colspan="2">6611 <break/>(7094)</td>
              <td colspan="2">9439 <break/>(10,129)</td>
              <td>12,025 <break/>(12,904)</td>
            </tr>
            <tr valign="top">
              <td colspan="3">Number of days in the hospital, mean</td>
              <td colspan="2">2.6</td>
              <td colspan="2">4.3</td>
              <td colspan="2">6.6</td>
              <td colspan="2">3.6</td>
              <td colspan="2">5.6</td>
              <td colspan="2">3.4</td>
              <td colspan="2">2.0</td>
              <td colspan="2">2.4</td>
              <td>3.5</td>
            </tr>
            <tr valign="top">
              <td colspan="3">Number of hospitalizations in a year, mean</td>
              <td colspan="2">0.2</td>
              <td colspan="2">0.4</td>
              <td colspan="2">0.5</td>
              <td colspan="2">0.3</td>
              <td colspan="2">0.4</td>
              <td colspan="2">0.3</td>
              <td colspan="2">0.2</td>
              <td colspan="2">0.3</td>
              <td>0.3</td>
            </tr>
            <tr valign="top">
              <td colspan="3">Total number of consultations, mean</td>
              <td colspan="2">11.9</td>
              <td colspan="2">16.0</td>
              <td colspan="2">20.2</td>
              <td colspan="2">17.0</td>
              <td colspan="2">17.5</td>
              <td colspan="2">16.1</td>
              <td colspan="2">9.9</td>
              <td colspan="2">12.7</td>
              <td>18.5</td>
            </tr>
            <tr valign="top">
              <td colspan="3">Number of consultations with generalist, mean</td>
              <td colspan="2">7.2</td>
              <td colspan="2">10.0</td>
              <td colspan="2">11.6</td>
              <td colspan="2">9.8</td>
              <td colspan="2">11.3</td>
              <td colspan="2">9.4</td>
              <td colspan="2">6.0</td>
              <td colspan="2">8.3</td>
              <td>9.5</td>
            </tr>
            <tr valign="top">
              <td colspan="3">PCG groups in the cluster</td>
              <td colspan="2">All 34 PCGs</td>
              <td colspan="2">Mostly Pain</td>
              <td colspan="2">Mental + hypertension + pain + asthma (COPD<sup>c</sup>)</td>
              <td colspan="2">Thyroid + hypertension + glaucoma + mix of others</td>
              <td colspan="2">Asthma + Parkinson + cardiac diseases + pain</td>
              <td colspan="2">Cancer + diabetes + inflammatory + immune + other mental + glaucoma + HIV</td>
              <td colspan="2">N/A<sup>d</sup></td>
              <td colspan="2">Hypertension</td>
              <td>Mental diseases</td>
            </tr>
            <tr valign="top">
              <td colspan="3">Description of the clusters based on overall descriptive statistics</td>
              <td colspan="2">N/A</td>
              <td colspan="2">Average age, slightly fewer male patients, higher hospital costs and hospital stays</td>
              <td colspan="2">Average age, slightly fewer male patients, lowest deductibles, highest amount of PCGs and multimorbidity, highest health care use and costs (except for costs of medications)</td>
              <td colspan="2">Slightly older, more female patients, relatively low deductibles, high amount of PCGs (1.7) and multimorbidity (but less than cluster 0), relatively low health care use and costs</td>
              <td colspan="2">Oldest, relatively low deductibles, some complexity (more than 1 PCGs on average), very high use of doctor visits (especially generalist), many hospitalizations and high inpatient costs</td>
              <td colspan="2">Relatively old, on average 1 PCG, highest cost of medicaments, and high ambulatory costs, relatively low hospitalizations and doctor visits</td>
              <td colspan="2">Young, highest deductibles, low health care use and costs</td>
              <td colspan="2">Slightly older, more male patients, relatively low health care use and costs</td>
              <td>Youngest, more female patients, relatively low deductibles, low health care use and costs (but higher than for hypertension group), a lot of visits to doctors</td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn id="table1fn1">
            <p><sup>a</sup>PCG: pharmacy-based cost group.</p>
          </fn>
          <fn id="table1fn2">
            <p><sup>b</sup>Ratios rounded off to one decimal place.</p>
          </fn>
          <fn id="table1fn3">
            <p><sup>c</sup>COPD: chronic obstructive pulmonary disease.</p>
          </fn>
          <fn id="table1fn4">
            <p><sup>d</sup>N/A: not applicable.</p>
          </fn>
        </table-wrap-foot>
      </table-wrap>
      <fig id="figure3" position="float">
        <label>Figure 3</label>
        <caption>
          <p>Joint distributions of PCGs within the 4 clusters (group 0-3) and outliers (group –1). PCG: pharmacy-based cost group.</p>
        </caption>
        <graphic xlink:href="medinform_v10i4e34274_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <p>Our study shows that performing cluster analysis to explore patient multimorbidity and complexity is feasible. We demonstrated that individuals with single PCGs of mental diseases or hypertension, individuals with multiple PCGs, or individuals with a single high-cost PCG have different health care use patterns and represent different complexity groups.</p>
      <p>Earlier studies focusing on chronic conditions identified from electronic health records evidenced the existence of systematic associations between chronic diseases, whereby chronic diseases, often from dissimilar disease categories, coappeared within a multimorbidity pattern or cluster [<xref ref-type="bibr" rid="ref24">24</xref>-<xref ref-type="bibr" rid="ref26">26</xref>]. Importantly, though, these studies showed that the complexity of multimorbidity patterns in terms of diseases and associated drug use increased with age, which holds true for both genders. Moreover, in line with our findings, multiple earlier studies used cluster analysis for identifying clinically homogenous multimorbidity patterns in the population, where clusters were composed of diagnosis-related groups [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref27">27</xref>-<xref ref-type="bibr" rid="ref30">30</xref>]. However, these studies used measures of multimorbidity and comorbidity or clinical diagnosis data rather than PCGs from claims data. This makes direct comparison of results challenging, due to the differences in methodologies and level of diagnosis details. A recent systematic review confirmed that analytical methods used to identify patient profiles with multimorbid conditions are heterogeneous (including factor analysis, multiple correspondence analysis, hierarchical clustering, and three-step unified-clustering method), which may explain the variation in the multimorbidity patterns reported in various studies [<xref ref-type="bibr" rid="ref31">31</xref>]. Despite those differences, the observed most prevalent clusters or groups are similar across studies and included hypertensive or metabolic diseases [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref29">29</xref>] and mental and behavioral diseases [<xref ref-type="bibr" rid="ref16">16</xref>]. The greater prevalence of and similarities in metabolic and mental clusters were confirmed by a systematic review of multimorbidity patterns, whereby these clusters were identified in 9 and 10 of 14 reviewed articles, respectively [<xref ref-type="bibr" rid="ref32">32</xref>]. One study compared multimorbidity patterns between populations of two European countries (Spain and the Netherlands) and found that, indeed, the highest similarities were observed in the cardio metabolic cluster, even though the populations are likely to differ across countries [<xref ref-type="bibr" rid="ref26">26</xref>].</p>
      <p>The existing literature on the use of cluster analysis to identify homogenous segments based on health care use and expenditures is limited [<xref ref-type="bibr" rid="ref33">33</xref>-<xref ref-type="bibr" rid="ref37">37</xref>]. Specifically, the study by Nnoaham and Cann [<xref ref-type="bibr" rid="ref33">33</xref>] identified segments (or clusters), similar to ours, based on health care use (expressed by visits to the physicians, medications, and admissions) and complexity (expressed by long-term conditions). Other studies used cluster analysis to identify groups with high expenditures and deduced that, despite having a lot of heterogeneity, the high expenditures cluster typically exhibited fair or poor health with more medical conditions or comorbidities [<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref35">35</xref>]. These findings confirm ours; they nevertheless need to be interpreted with caution due to differences in methodologies, age of the population, and level of details available for background individual characteristics and diagnoses. There is evidence that cluster analysis may provide more information to decision makers than a list of possible statistically significant variables or a list of individuals who are the highest users [<xref ref-type="bibr" rid="ref35">35</xref>].</p>
      <p>To our knowledge, this is the first study using cluster analysis to explore patients’ multimorbidity and complexity, reflected by the mix of PCGs and health care use patterns. In addition, it benefits from the richness of health care use data, a large sample size, and advanced clustering methods. However, the study has certain limitations. The first limitation stems from the process of multiple parameters configuration, which increases complexity while not allowing results validation. Thus, the cluster interpretation has to rely on metrics from the algorithms, descriptive statistics, and clinical relevance. Second, as the data were lacking clinical information, we only relied on PCGs mapping, which may give an incomplete picture of drug data [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref12">12</xref>].</p>
      <p>Our study shows that PCG-based cluster analysis of health care use claims data allows diverting from an approach of simple comorbidity counts and can identify the population profiles with increased health care use and costs. Such results may provide insightful information for policy making, care planning, and care delivery to facilitate the transformation from procedures and guidelines focusing on a single disease toward development of integrated and better coordinated care.</p>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Lists of pharmacy-based cost groups used to identify chronic diseases in insurance claims data.</p>
        <media xlink:href="medinform_v10i4e34274_app1.docx" xlink:title="DOCX File , 15 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">DT</term>
          <def>
            <p>decision tree</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">HDBSCAN</term>
          <def>
            <p>hierarchical density-based spatial clustering of applications with noise</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">MDS</term>
          <def>
            <p>multidimensional scaling</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">OOB</term>
          <def>
            <p>out-of-bag</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">PCG</term>
          <def>
            <p>pharmacy-based cost group</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">RF</term>
          <def>
            <p>random forest</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This work was supported by the Swiss National Science Foundation within the Smarter health care—National Research Programme (NRP 74) and grant 407440_183447.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Prince</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Gutierrez Robledo</surname>
              <given-names>LM</given-names>
            </name>
            <name name-style="western">
              <surname>O'Donnell</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Sullivan</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Yusuf</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>The burden of disease in older people and implications for health policy and practice</article-title>
          <source>Lancet</source>
          <year>2015</year>
          <month>02</month>
          <day>07</day>
          <volume>385</volume>
          <issue>9967</issue>
          <fpage>549</fpage>
          <lpage>62</lpage>
          <pub-id pub-id-type="doi">10.1016/S0140-6736(14)61347-7</pub-id>
          <pub-id pub-id-type="medline">25468153</pub-id>
          <pub-id pub-id-type="pii">S0140-6736(14)61347-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bachmann</surname>
              <given-names>N.</given-names>
            </name>
            <name name-style="western">
              <surname>Burla</surname>
              <given-names>L.</given-names>
            </name>
            <name name-style="western">
              <surname>Kohler</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>La santé en Suisse – Le point sur les maladies chroniques: Rapport national sur la santé 2015</article-title>
          <source>OBSAN</source>
          <year>2015</year>
          <access-date>2022-03-16</access-date>
          <publisher-loc>Berne</publisher-loc>
          <publisher-name>Hogrefe Verlag</publisher-name>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.obsan.admin.ch/sites/default/files/2021-08/rapportsante_2015_f_0.pdf">https://www.obsan.admin.ch/sites/default/files/2021-08/rapportsante_2015_f_0.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Wallace</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>O'Dowd</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Fortin</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Interventions for improving outcomes in patients with multimorbidity in primary care and community settings</article-title>
          <source>Cochrane Database Syst Rev</source>
          <year>2021</year>
          <month>01</month>
          <day>15</day>
          <volume>1</volume>
          <fpage>CD006560</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/33448337"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/14651858.CD006560.pub4</pub-id>
          <pub-id pub-id-type="medline">33448337</pub-id>
          <pub-id pub-id-type="pmcid">PMC8092473</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Wallace</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>O'Dowd</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Fortin</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Interventions for improving outcomes in patients with multimorbidity in primary care and community settings</article-title>
          <source>Cochrane Database Syst Rev</source>
          <year>2016</year>
          <month>03</month>
          <day>14</day>
          <volume>3</volume>
          <fpage>CD006560</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/26976529"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/14651858.CD006560.pub3</pub-id>
          <pub-id pub-id-type="medline">26976529</pub-id>
          <pub-id pub-id-type="pmcid">PMC6703144</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Souza</surname>
              <given-names>DLB</given-names>
            </name>
            <name name-style="western">
              <surname>Oliveras-Fabregas</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Minobes-Molina</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>de Camargo Cancela</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Galbany-Estragués</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Jerez-Roig</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Trends of multimorbidity in 15 European countries: a population-based study in community-dwelling adults aged 50 and over</article-title>
          <source>BMC Public Health</source>
          <year>2021</year>
          <month>01</month>
          <day>07</day>
          <volume>21</volume>
          <issue>1</issue>
          <fpage>76</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcpublichealth.biomedcentral.com/articles/10.1186/s12889-020-10084-x"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12889-020-10084-x</pub-id>
          <pub-id pub-id-type="medline">33413239</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12889-020-10084-x</pub-id>
          <pub-id pub-id-type="pmcid">PMC7792098</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pefoyo</surname>
              <given-names>AJK</given-names>
            </name>
            <name name-style="western">
              <surname>Bronskill</surname>
              <given-names>SE</given-names>
            </name>
            <name name-style="western">
              <surname>Gruneir</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Calzavara</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Thavorn</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Petrosyan</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Maxwell</surname>
              <given-names>CJ</given-names>
            </name>
            <name name-style="western">
              <surname>Bai</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wodchis</surname>
              <given-names>WP</given-names>
            </name>
          </person-group>
          <article-title>The increasing burden and complexity of multimorbidity</article-title>
          <source>BMC Public Health</source>
          <year>2015</year>
          <month>04</month>
          <day>23</day>
          <volume>15</volume>
          <fpage>415</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcpublichealth.biomedcentral.com/articles/10.1186/s12889-015-1733-2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12889-015-1733-2</pub-id>
          <pub-id pub-id-type="medline">25903064</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12889-015-1733-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC4415224</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Amelung</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Stein</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Suter</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Goodwin</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Nolte</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Balicer</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <source>Handbook Integrated Care</source>
          <year>2017</year>
          <publisher-loc>Cham</publisher-loc>
          <publisher-name>Springer</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sharabiani</surname>
              <given-names>MTA</given-names>
            </name>
            <name name-style="western">
              <surname>Aylin</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Bottle</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Systematic review of comorbidity indices for administrative data</article-title>
          <source>Med Care</source>
          <year>2012</year>
          <month>12</month>
          <volume>50</volume>
          <issue>12</issue>
          <fpage>1109</fpage>
          <lpage>18</lpage>
          <pub-id pub-id-type="doi">10.1097/MLR.0b013e31825f64d0</pub-id>
          <pub-id pub-id-type="medline">22929993</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Huber</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Szucs</surname>
              <given-names>TD</given-names>
            </name>
            <name name-style="western">
              <surname>Rapold</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Reich</surname>
              <given-names>O</given-names>
            </name>
          </person-group>
          <article-title>Identifying patients with chronic conditions using pharmacy data in Switzerland: an updated mapping approach to the classification of medications</article-title>
          <source>BMC Public Health</source>
          <year>2013</year>
          <month>10</month>
          <day>30</day>
          <volume>13</volume>
          <fpage>1030</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcpublichealth.biomedcentral.com/articles/10.1186/1471-2458-13-1030"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1471-2458-13-1030</pub-id>
          <pub-id pub-id-type="medline">24172142</pub-id>
          <pub-id pub-id-type="pii">1471-2458-13-1030</pub-id>
          <pub-id pub-id-type="pmcid">PMC3840632</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Huber</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Schneeweiss</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Signorell</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Reich</surname>
              <given-names>O</given-names>
            </name>
          </person-group>
          <article-title>Improved prediction of medical expenditures and health care utilization using an updated chronic disease score and claims data</article-title>
          <source>J Clin Epidemiol</source>
          <year>2013</year>
          <month>10</month>
          <volume>66</volume>
          <issue>10</issue>
          <fpage>1118</fpage>
          <lpage>27</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jclinepi.2013.04.011</pub-id>
          <pub-id pub-id-type="medline">23845184</pub-id>
          <pub-id pub-id-type="pii">S0895-4356(13)00172-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lamers</surname>
              <given-names>LM</given-names>
            </name>
            <name name-style="western">
              <surname>van Vliet</surname>
              <given-names>RCJA</given-names>
            </name>
          </person-group>
          <article-title>The Pharmacy-based Cost Group model: validating and adjusting the classification of medications for chronic conditions to the Dutch situation</article-title>
          <source>Health Policy</source>
          <year>2004</year>
          <month>04</month>
          <volume>68</volume>
          <issue>1</issue>
          <fpage>113</fpage>
          <lpage>21</lpage>
          <pub-id pub-id-type="doi">10.1016/j.healthpol.2003.09.001</pub-id>
          <pub-id pub-id-type="medline">15033558</pub-id>
          <pub-id pub-id-type="pii">S0168851003001623</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chini</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Pezzotti</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Orzella</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Borgia</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Guasticchi</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Can we use the pharmacy data to estimate the prevalence of chronic conditions? a comparison of multiple data sources</article-title>
          <source>BMC Public Health</source>
          <year>2011</year>
          <month>09</month>
          <day>05</day>
          <volume>11</volume>
          <fpage>688</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcpublichealth.biomedcentral.com/articles/10.1186/1471-2458-11-688"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1471-2458-11-688</pub-id>
          <pub-id pub-id-type="medline">21892946</pub-id>
          <pub-id pub-id-type="pii">1471-2458-11-688</pub-id>
          <pub-id pub-id-type="pmcid">PMC3223740</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Whitson</surname>
              <given-names>HE</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>KS</given-names>
            </name>
            <name name-style="western">
              <surname>Sloane</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Cigolle</surname>
              <given-names>CT</given-names>
            </name>
            <name name-style="western">
              <surname>Pieper</surname>
              <given-names>CF</given-names>
            </name>
            <name name-style="western">
              <surname>Landerman</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Hastings</surname>
              <given-names>SN</given-names>
            </name>
          </person-group>
          <article-title>Identifying patterns of multimorbidity in older Americans: application of latent class analysis</article-title>
          <source>J Am Geriatr Soc</source>
          <year>2016</year>
          <month>08</month>
          <volume>64</volume>
          <issue>8</issue>
          <fpage>1668</fpage>
          <lpage>73</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/27309908"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/jgs.14201</pub-id>
          <pub-id pub-id-type="medline">27309908</pub-id>
          <pub-id pub-id-type="pmcid">PMC4988894</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Khalid</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Prieto-Alhambra</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Machine learning for feature selection and cluster analysis in drug utilisation research</article-title>
          <source>Curr Epidemiol Rep</source>
          <year>2019</year>
          <month>7</month>
          <day>27</day>
          <volume>6</volume>
          <issue>3</issue>
          <fpage>364</fpage>
          <lpage>372</lpage>
          <pub-id pub-id-type="doi">10.1007/s40471-019-00211-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wartelle</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mourad-Chehade</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Yalaoui</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Chrusciel</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Laplanche</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Sanchez</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Clustering of a health dataset using diagnosis co-occurrences</article-title>
          <source>Appl Sci</source>
          <year>2021</year>
          <month>03</month>
          <day>07</day>
          <volume>11</volume>
          <issue>5</issue>
          <fpage>2373</fpage>
          <pub-id pub-id-type="doi">10.3390/app11052373</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Violán</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Roso-Llorach</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Foguet-Boreu</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Guisado-Clavero</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Pons-Vigués</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Pujol-Ribera</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Valderas</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>Multimorbidity patterns with K-means nonhierarchical cluster analysis</article-title>
          <source>BMC Fam Pract</source>
          <year>2018</year>
          <month>07</month>
          <day>03</day>
          <volume>19</volume>
          <issue>1</issue>
          <fpage>108</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcfampract.biomedcentral.com/articles/10.1186/s12875-018-0790-x"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12875-018-0790-x</pub-id>
          <pub-id pub-id-type="medline">29969997</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12875-018-0790-x</pub-id>
          <pub-id pub-id-type="pmcid">PMC6031109</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <collab>Polynomics AG</collab>
          </person-group>
          <article-title>Aktualisierung der PCG-Liste für den Schweizer Risikoausgleich</article-title>
          <source>Studie im Auftrag des Bundesamts für Gesundheit BAG - Schlussbericht</source>
          <year>2019</year>
          <access-date>2020-03-09</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.bag.admin.ch/dam/bag/en/dokumente/kuv-aufsicht/pus/risikoausgleich/corrigendun.pdf.download.pdf/Polynomics_Uni_Basel_Aktualisierung_PCG_Schlussbericht_2019-01-22.pdf">https://www.bag.admin.ch/dam/bag/en/dokumente/kuv-aufsicht/pus/risikoausgleich/corrigendun.pdf.download.pdf/Polynomics_Uni_Basel_Aktualisierung_PCG_Schlussbericht_2019-01-22.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Breiman</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Random forests</article-title>
          <source>Machine Learning</source>
          <year>2001</year>
          <volume>45</volume>
          <issue>1</issue>
          <fpage>5</fpage>
          <lpage>32</lpage>
          <pub-id pub-id-type="doi">10.1023/A:1010933404324</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Breiman</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Cutler</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Random Forests Manual v4.0</article-title>
          <source>UC Berkeley</source>
          <year>2003</year>
          <access-date>2020-10-30</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.stat.berkeley.edu/~breiman/Using_random_forests_v4.0.pdf">https://www.stat.berkeley.edu/~breiman/Using_random_forests_v4.0.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shi</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Seligson</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Belldegrun</surname>
              <given-names>AS</given-names>
            </name>
            <name name-style="western">
              <surname>Palotie</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Horvath</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Tumor classification by tissue microarray profiling: random forest clustering applied to renal cell carcinoma</article-title>
          <source>Mod Pathol</source>
          <year>2005</year>
          <month>04</month>
          <volume>18</volume>
          <issue>4</issue>
          <fpage>547</fpage>
          <lpage>57</lpage>
          <pub-id pub-id-type="doi">10.1038/modpathol.3800322</pub-id>
          <pub-id pub-id-type="medline">15529185</pub-id>
          <pub-id pub-id-type="pii">3800322</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Allen</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Horvath</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tong</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Kraft</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Spiteri</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Riggs</surname>
              <given-names>AD</given-names>
            </name>
            <name name-style="western">
              <surname>Marahrens</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>High concentrations of long interspersed nuclear element sequence distinguish monoallelically expressed genes</article-title>
          <source>Proc Natl Acad Sci U S A</source>
          <year>2003</year>
          <month>08</month>
          <day>19</day>
          <volume>100</volume>
          <issue>17</issue>
          <fpage>9940</fpage>
          <lpage>5</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/12909712"/>
          </comment>
          <pub-id pub-id-type="doi">10.1073/pnas.1737401100</pub-id>
          <pub-id pub-id-type="medline">12909712</pub-id>
          <pub-id pub-id-type="pii">1737401100</pub-id>
          <pub-id pub-id-type="pmcid">PMC187893</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kruskal</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Wish</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Multidimensional scaling</article-title>
          <source>Multidimensional Scaling. Quantitative Applications in the Social Sciences, ed. I</source>
          <year>1978</year>
          <publisher-loc>Thousand Oaks, CA</publisher-loc>
          <publisher-name>SAGE Publications</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>McInnes</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Healy</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Astels</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>hdbscan: hierarchical density based clustering</article-title>
          <source>J Open Source Software</source>
          <year>2017</year>
          <month>03</month>
          <volume>2</volume>
          <issue>11</issue>
          <fpage>205</fpage>
          <pub-id pub-id-type="doi">10.21105/joss.00205</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ioakeim-Skoufa</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Poblador-Plou</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Carmona-Pírez</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Díez-Manglano</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Navickas</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Gimeno-Feliu</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>González-Rubio</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Jureviciene</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Dambrauskas</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Prados-Torres</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gimeno-Miguel</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Multimorbidity patterns in the general population: results from the EpiChron cohort study</article-title>
          <source>Int J Environ Res Public Health</source>
          <year>2020</year>
          <month>06</month>
          <day>14</day>
          <volume>17</volume>
          <issue>12</issue>
          <fpage>4242</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=ijerph17124242"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/ijerph17124242</pub-id>
          <pub-id pub-id-type="medline">32545876</pub-id>
          <pub-id pub-id-type="pii">ijerph17124242</pub-id>
          <pub-id pub-id-type="pmcid">PMC7345112</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mucherino</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Gimeno-Miguel</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Carmona-Pirez</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Gonzalez-Rubio</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Ioakeim-Skoufa</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Moreno-Juste</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Orlando</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Aza-Pascual-Salcedo</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Poblador-Plou</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Menditto</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Prados-Torres</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Changes in multimorbidity and polypharmacy patterns in young and adult population over a 4-year period: a 2011-2015 comparison using real-world data</article-title>
          <source>Int J Environ Res Public Health</source>
          <year>2021</year>
          <month>04</month>
          <day>21</day>
          <volume>18</volume>
          <issue>9</issue>
          <fpage>4422</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=ijerph18094422"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/ijerph18094422</pub-id>
          <pub-id pub-id-type="medline">33919351</pub-id>
          <pub-id pub-id-type="pii">ijerph18094422</pub-id>
          <pub-id pub-id-type="pmcid">PMC8122591</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Poblador-Plou</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>van den Akker</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Vos</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Calderón-Larrañaga</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Metsemakers</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Prados-Torres</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Similar multimorbidity patterns in primary care patients from two European regions: results of a factor analysis</article-title>
          <source>PLoS One</source>
          <year>2014</year>
          <volume>9</volume>
          <issue>6</issue>
          <fpage>e100375</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0100375"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0100375</pub-id>
          <pub-id pub-id-type="medline">24956475</pub-id>
          <pub-id pub-id-type="pii">PONE-D-13-45413</pub-id>
          <pub-id pub-id-type="pmcid">PMC4067297</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Déruaz-Luyet</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>N'Goran</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Senn</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Bodenmann</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Pasquier</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Widmer</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Tandjung</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Rosemann</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Frey</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Streit</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zeller</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Haller</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Excoffier</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Burnand</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Herzig</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Multimorbidity and patterns of chronic conditions in a primary care population in Switzerland: a cross-sectional study</article-title>
          <source>BMJ Open</source>
          <year>2017</year>
          <month>07</month>
          <day>02</day>
          <volume>7</volume>
          <issue>6</issue>
          <fpage>e013664</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmjopen.bmj.com/lookup/pmidlookup?view=long&#38;pmid=28674127"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmjopen-2016-013664</pub-id>
          <pub-id pub-id-type="medline">28674127</pub-id>
          <pub-id pub-id-type="pii">bmjopen-2016-013664</pub-id>
          <pub-id pub-id-type="pmcid">PMC5734197</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Marengoni</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Rizzuto</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Winblad</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Fratiglioni</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Patterns of chronic multimorbidity in the elderly population</article-title>
          <source>J Am Geriatr Soc</source>
          <year>2009</year>
          <month>02</month>
          <volume>57</volume>
          <issue>2</issue>
          <fpage>225</fpage>
          <lpage>30</lpage>
          <pub-id pub-id-type="doi">10.1111/j.1532-5415.2008.02109.x</pub-id>
          <pub-id pub-id-type="medline">19207138</pub-id>
          <pub-id pub-id-type="pii">JGS2109</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Guisado-Clavero</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Roso-Llorach</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>López-Jimenez</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Pons-Vigués</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Foguet-Boreu</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Muñoz</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Violán</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Multimorbidity patterns in the elderly: a prospective cohort study with cluster analysis</article-title>
          <source>BMC Geriatr</source>
          <year>2018</year>
          <month>01</month>
          <day>16</day>
          <volume>18</volume>
          <issue>1</issue>
          <fpage>16</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcgeriatr.biomedcentral.com/articles/10.1186/s12877-018-0705-7"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12877-018-0705-7</pub-id>
          <pub-id pub-id-type="medline">29338690</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12877-018-0705-7</pub-id>
          <pub-id pub-id-type="pmcid">PMC5771078</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Egan</surname>
              <given-names>BM</given-names>
            </name>
            <name name-style="western">
              <surname>Sutherland</surname>
              <given-names>SE</given-names>
            </name>
            <name name-style="western">
              <surname>Tilkemeier</surname>
              <given-names>PL</given-names>
            </name>
            <name name-style="western">
              <surname>Davis</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>Rutledge</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Sinopoli</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>A cluster-based approach for integrating clinical management of Medicare beneficiaries with multiple chronic conditions</article-title>
          <source>PLoS One</source>
          <year>2019</year>
          <volume>14</volume>
          <issue>6</issue>
          <fpage>e0217696</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0217696"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0217696</pub-id>
          <pub-id pub-id-type="medline">31216301</pub-id>
          <pub-id pub-id-type="pii">PONE-D-18-33018</pub-id>
          <pub-id pub-id-type="pmcid">PMC6584004</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ng</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Tawiah</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Sawyer</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Scuffham</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Patterns of multimorbid health conditions: a systematic review of analytical methods and comparison analysis</article-title>
          <source>Int J Epidemiol</source>
          <year>2018</year>
          <month>10</month>
          <day>01</day>
          <volume>47</volume>
          <issue>5</issue>
          <fpage>1687</fpage>
          <lpage>1704</lpage>
          <pub-id pub-id-type="doi">10.1093/ije/dyy134</pub-id>
          <pub-id pub-id-type="medline">30016472</pub-id>
          <pub-id pub-id-type="pii">5054718</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Prados-Torres</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Calderón-Larrañaga</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hancco-Saavedra</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Poblador-Plou</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>van den Akker</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Multimorbidity patterns: a systematic review</article-title>
          <source>J Clin Epidemiol</source>
          <year>2014</year>
          <month>03</month>
          <volume>67</volume>
          <issue>3</issue>
          <fpage>254</fpage>
          <lpage>66</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jclinepi.2013.09.021</pub-id>
          <pub-id pub-id-type="medline">24472295</pub-id>
          <pub-id pub-id-type="pii">S0895-4356(13)00436-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nnoaham</surname>
              <given-names>KE</given-names>
            </name>
            <name name-style="western">
              <surname>Cann</surname>
              <given-names>KF</given-names>
            </name>
          </person-group>
          <article-title>Can cluster analyses of linked healthcare data identify unique population segments in a general practice-registered population?</article-title>
          <source>BMC Public Health</source>
          <year>2020</year>
          <month>05</month>
          <day>27</day>
          <volume>20</volume>
          <issue>1</issue>
          <fpage>798</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcpublichealth.biomedcentral.com/articles/10.1186/s12889-020-08930-z"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12889-020-08930-z</pub-id>
          <pub-id pub-id-type="medline">32460753</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12889-020-08930-z</pub-id>
          <pub-id pub-id-type="pmcid">PMC7254635</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Powers</surname>
              <given-names>BW</given-names>
            </name>
            <name name-style="western">
              <surname>Yan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Linn</surname>
              <given-names>KA</given-names>
            </name>
            <name name-style="western">
              <surname>Jain</surname>
              <given-names>SH</given-names>
            </name>
            <name name-style="western">
              <surname>Kowalski</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Navathe</surname>
              <given-names>AS</given-names>
            </name>
          </person-group>
          <article-title>Subgroups of high-cost Medicare advantage patients: an observational study</article-title>
          <source>J Gen Intern Med</source>
          <year>2019</year>
          <month>02</month>
          <volume>34</volume>
          <issue>2</issue>
          <fpage>218</fpage>
          <lpage>225</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30511290"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s11606-018-4759-1</pub-id>
          <pub-id pub-id-type="medline">30511290</pub-id>
          <pub-id pub-id-type="pii">10.1007/s11606-018-4759-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC6374249</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Agterberg</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zhong</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Crabb</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Rosenberg</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Cluster analysis application to identify groups of individuals with high health expenditures</article-title>
          <source>Health Serv Outcomes Res Method</source>
          <year>2020</year>
          <month>08</month>
          <day>01</day>
          <volume>20</volume>
          <issue>2-3</issue>
          <fpage>140</fpage>
          <lpage>182</lpage>
          <pub-id pub-id-type="doi">10.1007/s10742-020-00214-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Copeland</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Zeber</surname>
              <given-names>JE</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Parchman</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Lawrence</surname>
              <given-names>VA</given-names>
            </name>
            <name name-style="western">
              <surname>Valenstein</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>AL</given-names>
            </name>
          </person-group>
          <article-title>Patterns of primary care and mortality among patients with schizophrenia or diabetes: a cluster analysis approach to the retrospective study of healthcare utilization</article-title>
          <source>BMC Health Serv Res</source>
          <year>2009</year>
          <month>07</month>
          <day>26</day>
          <volume>9</volume>
          <fpage>127</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmchealthservres.biomedcentral.com/articles/10.1186/1472-6963-9-127"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1472-6963-9-127</pub-id>
          <pub-id pub-id-type="medline">19630997</pub-id>
          <pub-id pub-id-type="pii">1472-6963-9-127</pub-id>
          <pub-id pub-id-type="pmcid">PMC2723108</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vuik</surname>
              <given-names>SI</given-names>
            </name>
            <name name-style="western">
              <surname>Mayer</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Darzi</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>A quantitative evidence base for population health: applying utilization-based cluster analysis to segment a patient population</article-title>
          <source>Popul Health Metr</source>
          <year>2016</year>
          <month>11</month>
          <day>25</day>
          <volume>14</volume>
          <fpage>44</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://pophealthmetrics.biomedcentral.com/articles/10.1186/s12963-016-0115-z"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12963-016-0115-z</pub-id>
          <pub-id pub-id-type="medline">27906004</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12963-016-0115-z</pub-id>
          <pub-id pub-id-type="pmcid">PMC5124281</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
