<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.0" xmlns:xlink="http://www.w3.org/1999/xlink">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id>
      <journal-title>JMIR Medical Informatics</journal-title>
      <issn pub-type="epub">2291-9694</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v13i1e73596</article-id>
      <article-id pub-id-type="pmid">41236789</article-id>
      <article-id pub-id-type="doi">10.2196/73596</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Multisource Coherence Analysis of the First European Multicenter Cohort Study for Cancer Prevention in People Experiencing Homelessness: Data Quality Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Benis</surname>
            <given-names>Arriel</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Estupiñán-Romero</surname>
            <given-names>Francisco</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Gejjegondanahalli Yogeshappa</surname>
            <given-names>Vedamurthy</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Blasco-Calafat</surname>
            <given-names>Antonio</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Biomedical Data Science Laboratory</institution>
            <institution>Institute of Information and Communication Technologies</institution>
            <institution>Universitat Politècnica de València</institution>
            <addr-line>Building 8G, 1st Floor, Camino de vera, sn</addr-line>
            <addr-line>Valencia, 46022</addr-line>
            <country>Spain</country>
            <phone>34 963877000 ext 75278</phone>
            <email>anblaca@upv.es</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0002-4959-2900</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Blanes-Selva</surname>
            <given-names>Vicent</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0056-0329</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Fragner</surname>
            <given-names>Tobias</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-1373-5279</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Doñate-Martínez</surname>
            <given-names>Ascensión</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2742-0219</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Alhambra-Borrás</surname>
            <given-names>Tamara</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-8595-1969</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Gawronska</surname>
            <given-names>Julia</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0008-1766-9719</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Smith</surname>
            <given-names>Lee</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-5340-9833</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author">
          <name name-style="western">
            <surname>Garcia-Gomez</surname>
            <given-names>Juan M</given-names>
          </name>
          <degrees>Prof Dr</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-3851-1557</ext-link>
        </contrib>
        <contrib id="contrib9" contrib-type="author">
          <name name-style="western">
            <surname>Grabovac</surname>
            <given-names>Igor</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9605-1467</ext-link>
        </contrib>
        <contrib id="contrib10" contrib-type="author">
          <name name-style="western">
            <surname>Sáez</surname>
            <given-names>Carlos</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2678-8249</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Biomedical Data Science Laboratory</institution>
        <institution>Institute of Information and Communication Technologies</institution>
        <institution>Universitat Politècnica de València</institution>
        <addr-line>Valencia</addr-line>
        <country>Spain</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Department of Social and Preventive Medicine</institution>
        <institution>Center for Public Health</institution>
        <institution>Medical University of Vienna</institution>
        <addr-line>Vienna</addr-line>
        <country>Austria</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Instituto de Investigación en Políticas de Bienestar Social</institution>
        <institution>Department of Social and Preventive Medicine</institution>
        <institution>Universitat de València</institution>
        <addr-line>Valencia</addr-line>
        <country>Spain</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Center for Health, Performance and Wellbeing</institution>
        <institution>Anglia Ruskin University</institution>
        <addr-line>Cambridge</addr-line>
        <country>United Kingdom</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Antonio Blasco-Calafat <email>anblaca@upv.es</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2025</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>14</day>
        <month>11</month>
        <year>2025</year>
      </pub-date>
      <volume>13</volume>
      <elocation-id>e73596</elocation-id>
      <history>
        <date date-type="received">
          <day>7</day>
          <month>3</month>
          <year>2025</year>
        </date>
        <date date-type="rev-request">
          <day>20</day>
          <month>4</month>
          <year>2025</year>
        </date>
        <date date-type="rev-recd">
          <day>12</day>
          <month>6</month>
          <year>2025</year>
        </date>
        <date date-type="accepted">
          <day>4</day>
          <month>8</month>
          <year>2025</year>
        </date>
      </history>
      <copyright-statement>©Antonio Blasco-Calafat, Vicent Blanes-Selva, Tobias Fragner, Ascensión Doñate-Martínez, Tamara Alhambra-Borrás, Julia Gawronska, Lee Smith, Juan M Garcia-Gomez, Igor Grabovac, Carlos Sáez. Originally published in JMIR Medical Informatics (https://medinform.jmir.org), 14.11.2025.</copyright-statement>
      <copyright-year>2025</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on https://medinform.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://medinform.jmir.org/2025/1/e73596" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Coherence across sites in multicenter datasets is one substantial data quality dimension for reliable health data reuse, as unexpected heterogeneity in data can lead to biases in data analyses and suboptimal generalization of results.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This work aims to characterize and label the data coherence across sites in the first European multicenter dataset for cancer prevention in people and early detection among the homeless population in Europe: coadapting and implementing the health navigator model. This dataset emerged to enable research to address disparities in health challenges and health care access due to barriers such as unstable housing, limited resources, and social stigma in people experiencing homelessness.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>The dataset comprises 652 cases: 142 from Austria, 158 from Greece, 197 from Spain, and 155 from the United Kingdom. All participants fit classifications from the European Typology of Homelessness and Housing Exclusion. This longitudinal study collected questionnaires at baseline, after 4 weeks, and at the end of the intervention. The 180-question survey covered sociodemographic data, overall health, mental health, empowerment, and interpersonal communication. Data variability was assessed using information theory and geometric methods to analyze discrepancies in distributions and completeness across the dataset.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Substantial variability was observed among the 4 pilot countries, both in the overall analysis and within specific domains. In particular, measures of health care empowerment, quality of life, and interpersonal communication demonstrated the greatest discrepancies among pilot sites, with the exception of the health domain. Notably, Spain exhibited the most pronounced differences, characterized by a high number of missing values related to interpersonal communication and the use of health care services.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Health data may be comparable across the 4 countries; however, substantial differences were observed in the other questionnaires, requiring independent, country-specific analyses. This study underscores the heterogeneity among people experiencing homelessness and the critical need for data quality assessments to inform future research and policymaking in this field.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>homelessness</kwd>
        <kwd>data quality</kwd>
        <kwd>data variability</kwd>
        <kwd>public health</kwd>
        <kwd>data analysis</kwd>
        <kwd>curated dataset</kwd>
        <kwd>multisource</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Homelessness is a complex and multifaceted phenomenon, encompassing more than the mere absence of a physical dwelling. It signifies a state of profound vulnerability and social exclusion, characterized by a lack of stable, safe, or adequate housing [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref3">3</xref>]. The experience of homelessness is deeply intertwined with a range of social, economic, and individual factors, including poverty, unemployment, mental health challenges, substance use, and domestic violence. People experiencing homelessness constitute a highly heterogeneous group with varying backgrounds, needs, and challenges, encompassing socioeconomic, cultural, physical, and mental health aspects, as well as historical and geographical contexts [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref5">5</xref>]. This inherent diversity within the group of people experiencing homelessness, coupled with inconsistent definitions and methodological variations in data collection across countries, makes it exceedingly challenging to accurately estimate the true prevalence of homelessness. Despite these complexities, it is estimated that at least 895,000 individuals in Europe are experiencing homelessness on any given night, living rough or in temporary or emergency accommodations [<xref ref-type="bibr" rid="ref6">6</xref>].</p>
      <p>Research consistently demonstrates substantial health disparities between people experiencing homelessness and the housed population. Homelessness is associated with poorer health outcomes, including premature mortality, partly due to barriers to accessing health care [<xref ref-type="bibr" rid="ref7">7</xref>-<xref ref-type="bibr" rid="ref9">9</xref>]. Furthermore, people experiencing homelessness experience higher cancer morbidity, lower cancer screening rates, later-stage cancer diagnoses, and poorer cancer-specific health outcomes compared to the housed population [<xref ref-type="bibr" rid="ref10">10</xref>], with cancer being the second most common cause of death among people experiencing homelessness [<xref ref-type="bibr" rid="ref11">11</xref>]. Among the most relevant factors, people experiencing homelessness usually report low health literacy, especially regarding cancer [<xref ref-type="bibr" rid="ref12">12</xref>], and they tend to experience barriers to accessing fragmented cancer prevention and community health services [<xref ref-type="bibr" rid="ref13">13</xref>].</p>
      <p>Research interest in improving the health status and cancer prevention efforts for people experiencing homelessness is growing, leading to the implementation and piloting of innovative health care strategies, such as the patient navigation model and the patient empowerment model [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref15">15</xref>]. In the patient navigation model, patient navigators, defined as health care professionals or peers specializing in care coordination, case management, and reducing barriers to care, play a crucial role in guiding individuals to overcome obstacles and access health care services in a timely manner [<xref ref-type="bibr" rid="ref16">16</xref>]. This includes facilitating access to preventive care and health promotion programs, which have been shown to improve their users’ health outcomes and care satisfaction [<xref ref-type="bibr" rid="ref17">17</xref>]. The patient empowerment model focuses on equipping individuals with the knowledge, skills, and confidence to take an active role in managing their health and navigating the health care system [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref19">19</xref>]. This approach emphasizes self-efficacy and shared decision-making, empowering patients to make informed choices about their health care and advocate for their needs.</p>
      <p>Within the CANCERLESS project, a multicenter study funded by the European Union, critical components of the patient navigation and patient empowerment models have converged into the novel health navigator model. This model was co-designed with input from both people experiencing homelessness and health and social care professionals working with them as well as those working in primary care settings. The project piloted this model in 4 European countries to assess its effectiveness in connecting people experiencing homelessness with cancer prevention services. To the authors’ knowledge, CANCERLESS is the first multicenter study involving people experiencing homelessness from different countries, marking substantial progress in research within this field. However, challenges such as data variability, missing data (missing completely at random and missing not at random), and fragmented in care may introduce biases in the results [<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref21">21</xref>].</p>
      <p>Building on the premise that various studies have highlighted the inherent heterogeneity within this population [<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref23">23</xref>], this diversity becomes even more pronounced when research conducted in different geographical and cultural contexts is considered. While such variability is evident, it should not be regarded solely as an intrinsic characteristic of the data but must be systematically quantified. This necessity arises because a portion of this heterogeneity may stem from biases introduced either by differences among the population subgroups studied or by external factors unrelated to the participants, such as variations in the conditions under which the interventions were conducted. If left unaddressed, this heterogeneity could lead to erroneous interpretations of the results and, consequently, to inaccurate conclusions that undermine the validity of the analysis [<xref ref-type="bibr" rid="ref24">24</xref>-<xref ref-type="bibr" rid="ref26">26</xref>]. Several techniques aim to detect variability among samples and approach the data quality (DQ) of datasets [<xref ref-type="bibr" rid="ref27">27</xref>]. Among them, spatial DQ techniques [<xref ref-type="bibr" rid="ref28">28</xref>] have been developed to evaluate the differences between the probability distribution function from multiple sources, and these techniques have been demonstrated to deal with sets of heterogeneous data, including multivariate and multitype. Additionally, these are valuable tools for dealing with DQ issues, such as missing values among the datasets, which provide metrics that quantify this heterogeneity and outliers.</p>
      <p>Given the above considerations, an exhaustive DQ analysis is needed for several reasons. First, this is key to extracting information about the participants’ characteristic distribution for each pilot site. Second, to examine the differences between these distributions and obtain knowledge about the status of homelessness in different European countries. Finally, these analyses allow us to understand if the information gathered can be used as a different pilot-specific dataset. Thus, this work aims to examine the heterogeneity between the people experiencing homelessness data in 4 different European countries and provide quality metadata while delivering a curated CANCERLESS dataset to extract common knowledge and conclusions.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Dataset Conformation</title>
        <p>Data collection was carried out between June 2022 and November 2023. A total sample of 652 people experiencing homelessness was collected: 142 from Austria, 158 from Greece, 197 from Spain, and 155 from the United Kingdom. Participants were included if they were at least 18 years of age and experiencing homelessness, fitting any classification of the European Typology of Homelessness and Housing Exclusion [<xref ref-type="bibr" rid="ref29">29</xref>]. Participants were excluded if they could not provide informed consent, had difficulties interpreting the aim of the research, did not accept to participate in the study, if they had a known cancer diagnosis or have had cancer previously, and the intervention or study would harm them.</p>
        <p>Data used in this study were collected as part of the CANCERLESS project. The study followed a pre- and postdesign, but in this specific analysis, we present only data collected at baseline (T0), that is, before each individual started the intervention. This approach allows us to see the characteristics of each pilot at the beginning of the intervention and, subsequently, to observe the initial differences that will serve to perform a correct analysis of the data.</p>
        <p>The questionnaires included in the database were the following: EQ-5D-5L to measure self-reported health-related quality of life [<xref ref-type="bibr" rid="ref30">30</xref>], Health Care Empowerment Questionnaire (HCEQ) to assess users’ empowerment related to health care [<xref ref-type="bibr" rid="ref31">31</xref>], Brief Symptom Inventory-18 to measure psychological distress [<xref ref-type="bibr" rid="ref32">32</xref>], and the Person-Centered Coordinated Care Experience Questionnaire to evaluate several domains of person-centered coordinated care from the perspective of the user [<xref ref-type="bibr" rid="ref33">33</xref>]. Additionally, specific-purpose questions were included regarding the following information: sociodemographics, health literacy, active diagnosis, medication taken, risk behaviors, healthy lifestyles, and previous use of health care services. <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> provides the complete list of the T0 questionnaires.</p>
        <p>The T0 questionnaire was administered to all pilot participants. A coordinator at each pilot site recorded the responses. Later, the information was uploaded by the research team of each pilot to a digital platform created by this research consortium called CANCERLESS Interventions Data Management Application, which stores the data in a digital format. This platform also provides feedback to the coordinator through metrics and aggregated information.</p>
      </sec>
      <sec>
        <title>Methods—Data Quality Workflow</title>
        <p><xref rid="figure1" ref-type="fig">Figure 1</xref> shows the methodology followed in this study. The workflow is divided into 2 blocks for assessing the intersite coherence, one across the information captured in the questionnaires and the other across their completeness patterns. The main difference lies in the preprocessing step: for the questionnaire, imputation is performed, whereas for completeness, a matrix of fault categories is used. Subsequently, a dimensional reduction technique was applied according to the analysis performed—see the specific details in the following subsections. The following steps were common to both analyses: calculating outlier filtering, histogram application to represent the probability density function of the dataset, followed by flattening, normalization, and column stacking, to be used as input for the information theory–based DQ metrics. The technique for evaluating DQ and response variability across the pilot studies involved transforming each dataset into a probability distribution, then applying comparative metrics to measure similarity and identify missing information and therefore the level of nonoverlapping between them. The technique relies on the calculus of a simplex, multidimensional generalization of a triangle, conserving the intersite dissimilarity where the centroid represents an informed average distribution of the sources. Subsequently, 2 metrics were computed, constrained to the Jensen-Shannon distance: the source probabilistic outlyingness (SPO), measuring the dissimilarity of each source to the average distribution; and the global probabilistic deviation (GPD), gauging the degree of global variability among the sources [<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref35">35</xref>]. The derived metrics, that is, GPD and SPO, are bounded between 0 and 1, so 0 means equal distributions and 1 means nonoverlapping. For the SPO, a value of 0 denotes the closest possible approach to the centroid, while for the GPD, it indicates the least data variability. Finally, visual plots of these metrics are shown to compare the variability results in a visual form between the different pilots. All these steps were later used to extract GPD, SPO, and multisource variability (MSV) for the global dataset and each section inside the questionnaire.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Overview of the methodology to obtain data quality metrics for the CANCERLESS dataset. Two types of analysis are conducted, with shared steps. For the complete dataset, missing values are imputed using iterative imputation techniques. In the missing data analysis, a matrix is built with values indicating 0=ordinary, 1=dependent, or 2=nonmissing. Dimensionality reduction is applied: PCA for complete data and MCA for missing data. After preprocessing, histograms for each country are normalized and combined to calculate distances from the centroid, yielding global probabilistic deviation, source probabilistic outlyingness, and multisource variability values. For specific dataset sections, the same process is applied to each subset. MCA: multiple correspondence analysis; PCA: principal component analysis.</p>
          </caption>
          <graphic xlink:href="medinform_v13i1e73596_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Questionnaire Information</title>
        <p>This approach has been used following a top-down methodology analyzing multivariate to univariate data, that is, to compare the whole T0 questionnaire and its sections. We excluded textual and multiple-choice options from the analysis since there was a high number of missing data and a much smaller number of category selections per question than the total number of choices, implying minimal variability with no final effect on the analysis. First, we preprocessed the data to transform categorical text into numerical variables along with an iterative imputation method [<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref37">37</xref>]. This method performs multivariate imputation through chained equations. Initially, all missing values are filled with simple univariate estimates (eg, the feature’s mean). Thereafter, each incomplete variable is regressed on the other features using a Bayesian ridge estimator to predict its missing entries. Predicted values replace the initial estimates, and this process cycles through all variables for a predefined number of iterations or until convergence of the imputed values is reached.</p>
        <p>Subsequently, to obtain a multivariate representation, we applied principal component analysis (PCA) [<xref ref-type="bibr" rid="ref38">38</xref>] to reduce the dimensionality of the original 130-variable space to 3 dimensions and select the top 20 variables with the highest explained variance. Following this, we segregated the data by pilot source and conducted outlier filtering using the local outlier factor method [<xref ref-type="bibr" rid="ref39">39</xref>], removing outliers specific to each pilot site. Finally, we computed a 3D histogram for each pilot, using 10 bins for each dimension, which were then used as the input in the method.</p>
      </sec>
      <sec>
        <title>Completeness Patterns</title>
        <p>Regarding the comparison of patterns related to blank responses or missing data, the T0 questionnaire comprises questions with varying levels of branching—specific queries are intended to be answered only if certain conditions from prior responses are met (eg, the question about the number of cigarettes smoked daily is only relevant if the participant declares themselves as a smoker in the preceding questions). Consequently, we distinguished between “not applicable missing” and ordinary missing data, which was applied using a predefined rule set. Once the rule was defined, it was applied to the dataset, obtaining a missing matrix and transforming the values into one of these categories. After the transformation, we applied the multiple correspondence analysis (MCA) [<xref ref-type="bibr" rid="ref40">40</xref>] technique to reduce the dimensionality of the data and select the top 20 variables with the highest explained variance, thus identifying the most influential questionnaires since MCA is a specific technique to reduce dimensionality for categorical values. Next, the local outlier factor methodology was applied to remove outliers over the data on the reduced space. Finally, the multidimensional histogram that was flattened and normalized to be used as GPD’s input was created.</p>
      </sec>
      <sec>
        <title>Exploratory Analyses</title>
        <p>The exploratory analyses of the study are presented using the following methods. First, biplots with 2 dimensions are generated after the original data undergo dimensionality reduction either using PCA or MCA. Additionally, the GDP methodology incorporates the MSV plot [<xref ref-type="bibr" rid="ref35">35</xref>], where the 2 or 3 components with the highest variances are projected using multidimensional scaling. In the MSV plot, sources are represented as circles or spheres, and the distance between them indicates the distance between their distributions, based on the Jensen-Shannon distance, with the circle’s radius representing the number of cases.</p>
        <p>To conduct this analysis, we used the Python 3 programming language [<xref ref-type="bibr" rid="ref41">41</xref>] and the NumPy, pandas, scikit-learn, and prince libraries [<xref ref-type="bibr" rid="ref42">42</xref>-<xref ref-type="bibr" rid="ref45">45</xref>]. The experimentation notebooks, including a Python version of the MSV metrics and visualizations, are available on GitHub [<xref ref-type="bibr" rid="ref46">46</xref>].</p>
      </sec>
      <sec>
        <title>Ethical Considerations</title>
        <p>The study was approved by the ethics committee of the Medical University of Vienna (1702/2021), which served as the lead ethics committee for the project. Additionally, each pilot site in the 4 countries secured approval from their respective ethical review boards or institutions before commencing data collection, and Universitat Politècnica de València also obtained approval from an ethics committee, specifically for the management of participants’ personal data. Prior to conducting any data collection, participants were given an information leaflet detailing the study’s purpose and were allowed to ask questions to help them decide on their participation. It was emphasized to all participants that their involvement was entirely voluntary, and they could opt out of answering any questions that made them uncomfortable. Participants were explicitly reassured that declining participation would not negatively impact their access to health and social care services. Informed consent was obtained from all participants through signed forms, which were also verbally confirmed at the beginning of the data collection sessions. All collected data have been securely stored in accordance with data protection regulations. CANCERLESS Interventions Data Management Application platform securely stores data in agreement with the General Data Protection Regulation, following strict guidelines for collecting, processing, storing, and transferring personal data in the European Union and the European Economic Area. Participants did not receive any financial compensation for taking part in the project.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Overview</title>
        <p>Data used in this study comprehend the whole T0 set of responses, whose demographic distribution is presented in <xref ref-type="table" rid="table1">Table 1</xref>.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Demographic distribution among the different pilots.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="160"/>
            <col width="110"/>
            <col width="130"/>
            <col width="110"/>
            <col width="110"/>
            <col width="130"/>
            <col width="100"/>
            <col width="150"/>
            <thead>
              <tr valign="top">
                <td>Pilot</td>
                <td>Values, n (%)</td>
                <td>Age (years), mean (SD)</td>
                <td>Male, n (%)</td>
                <td>Female, n (%)</td>
                <td>Nonbinary, n (%)</td>
                <td>Other, n (%)</td>
                <td>Do not want to disclose sex, n (%)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Austria</td>
                <td>142 (21.8)</td>
                <td>45.28 (12.83)</td>
                <td>60 (42.3)</td>
                <td>82 (57.7)</td>
                <td>0 (0)</td>
                <td>0 (0)</td>
                <td>0 (0)</td>
              </tr>
              <tr valign="top">
                <td>Greece</td>
                <td>158 (24.2)</td>
                <td>51.57 (13.53)</td>
                <td>121 (76.6)</td>
                <td>34 (21.5)</td>
                <td>0 (0)</td>
                <td>2 (1.3)</td>
                <td>1 (0.6)</td>
              </tr>
              <tr valign="top">
                <td>Spain</td>
                <td>198 (30.3)</td>
                <td>48.94 (14.82)</td>
                <td>110 (55.6)</td>
                <td>87 (43.9)</td>
                <td>0 (0)</td>
                <td>0 (0)</td>
                <td>0 (0)</td>
              </tr>
              <tr valign="top">
                <td>United Kingdom</td>
                <td>155 (23.8)</td>
                <td>42.91 (12.04)</td>
                <td>127 (81.9)</td>
                <td>27 (17.4)</td>
                <td>1 (0.6)</td>
                <td>0 (0)</td>
                <td>0 (0)</td>
              </tr>
              <tr valign="top">
                <td>Total</td>
                <td>652 (100)</td>
                <td>47.87 (13.06)</td>
                <td>418 (64.1)</td>
                <td>230 (35.3)</td>
                <td>1 (0.2)</td>
                <td>2 (0.3)</td>
                <td>1 (0.2)</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Questionnaire Data Analysis</title>
        <p>The left side of <xref rid="figure2" ref-type="fig">Figure 2</xref> shows the scatter plot of the 2 first PCA components of the complete dataset for the entire questionnaire. The UK pilot shows a larger variance in comparison to the others. In addition, substantial differences in position and sparsity can be appreciated between the different pilot sites. The PCA loadings in the figure show the most critical variables that have influenced the PCA, which are divided into sections. The HCEQ, which is the one with the greatest dispersion, is also the most influential, as it is the questionnaire with the highest contribution to the PCA with questions Q89, Q90, Q92, Q94, Q96, Q97, Q98, Q99, Q100, Q103, Q104, Q105, Q106, Q107, and Q10, followed by the interpersonal communication questionnaire with Q134 and Q136, afterward use of health care services with Q168, quality of life with Q88, and psychological distress with Q73. Table S1 in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref> provides detailed information regarding the questions corresponding to the selected numbering.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Scatter plot of data along the 2 principal components elicited from the principal component analysis and the multiple correspondence analysis, respectively. Each point is colorized depending on its pilot precedence. Most contributed questions for the principal component analysis calculation have been shown with arrows, depending on the questionnaire they belong to. Tables S1 and S2 in Multimedia Appendix 2 present a detailed table of both, indicating the specific questions and their associated questionnaires. For the global analysis, the principal component analysis indicates a central point where most of the samples are concentrated, with the UK pilot showing the greatest dispersion relative to the others. There is a substantial difference between the UK and Spanish pilot samples. In contrast, Austria and Greece pilots show a wider distribution of their samples. In the completeness case, the figure clearly shows 2 different parts, being the pilots from the United Kingdom, Greece, and Austria quite similar compared to Spain, where it presents an entirely different type of missing from the other pilots, being interpersonal communication and use of health care services sections the most relevant in the calculation of the multiple correspondence analysis. Q: question.</p>
          </caption>
          <graphic xlink:href="medinform_v13i1e73596_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>The left side of <xref rid="figure3" ref-type="fig">Figure 3</xref> shows the resultant DQ metrics, which generally present a wide dispersion between pilots for the overall questionnaire and most of the questionnaires. Noteworthy, the health data questionnaire shows metrics less than 0.5 observed, in contrast to those in the other questionnaires with values exceeding 0.8, indicating a clear difference for each pilot. For health care services, interpersonal communication, and health care empowerment, the GPD value exceeds 0.9, highlighting the divergence shown in <xref rid="figure2" ref-type="fig">Figure 2</xref>. However, several imputations have been performed for the case of Spain in the interpersonal communication and use of health care services sections.</p>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Results from the GDP and SPO multicentric analysis were applied to both the complete dataset (left side) and the completeness (right side) from the dataset composed of the T0 interviews in Austria, Greece, Spain, and the United Kingdom. The SPO indicates the distance of that pilot from the latent central tendency; the GPD can be understood as the mean of the variability of each pilot; a value close to 0 means less variability. In our case, a value of 0 indicates no missings for these questionnaires. Generally, a large variability is observed, especially in the Spanish pilot. GPD: global probabilistic deviation; SPO: source probabilistic outlyingness.</p>
          </caption>
          <graphic xlink:href="medinform_v13i1e73596_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>The overall analysis of the questionnaire reveals 3 types of variability patterns. First, we found questionnaires with very different distributions between pilots. Still, there are no decisive questions within the questionnaire, as they do not appear on the left side of <xref rid="figure2" ref-type="fig">Figure 2</xref> as the most relevant in the PCA, such as sociodemographic data, health literacy, and risk behaviors and healthy lifestyles. Second, questions related to health data showed fewer differences concerning the pilots compared to the other questionnaires, which had a GPD of 0.452. Finally, questionnaires such as psychological distress, quality of life, HCEQ, interpersonal communication (Person-Centered Coordinated Care Experience Questionnaire), and the items related to the use of health care services, apart from diverging between the different pilots according to the metrics applied, present some questions that are determinant and differentiable by country.</p>
      </sec>
      <sec>
        <title>Missing Patterns Analysis</title>
        <p>From the 652 participants analyzed and the 130 questions collected at T0, a total of 84,760 values were obtained. Of these, 70,384 of 84,760 (83%) values are complete and valid, 6260 of 84,760 (7.4%) values are not applicable missing, and 8116 of 84,760 (9.6%) values are ordinary missing.</p>
        <p>The right side of <xref rid="figure2" ref-type="fig">Figure 2</xref> shows the MCA projection of the missing profiles to 2 dimensions, where a cluster of Austria, Greece, and the United Kingdom can be observed at the top-left side of the plot. Mainly, Spain samples can be observed at the bottom-right of the figure, denoting that Spain is very different from the other sites in terms of the missing pattern. In this instance, the questionnaire with the highest number of questions was the use of health care services, comprising Q155, Q158, Q167, Q161, Q152, Q180, Q176, Q179, and Q178. This was followed by the interpersonal communication questionnaire, which included Q138, Q142, Q140, Q136, and Q134. Next was risk behaviors and healthy lifestyle, encompassing Q45, Q46, Q44, and Q59, and quality of life with Q88. Table S2 in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref> provides detailed information regarding the questions corresponding to the selected numbering.</p>
        <p>The right side of Figure 3 offers both a global and section-by-section view of missing-data behavior after applying the GPD and SPO metrics. Overall variability is high; yet, 3 distinct patterns emerge. First, several sections—health literacy, health data, psychological distress, and health care empowerment—show virtually no disparity across pilots because they contain no missing values, so their GPD and SPO scores sit near 0. Second, marked differences appear in sociodemographic data, risk behaviors, healthy lifestyles, and use of health care services, where some pilots contribute many missings, while others contribute few.  Third, a distinct Spain-specific pattern emerges. Spain is the only pilot exhibiting substantial variability that elevates the mean GPD in sections where the remaining pilots show minimal variability—particularly in quality of life (Spain: 100/1576, 6.3% missing; others combined: 10/3640, 0.3% missing) and in interpersonal communication, where the SPO profile departs markedly from the consistently low missingness observed elsewhere.</p>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Summary of Main Findings</title>
        <p>This study investigated heterogeneity among people experiencing homelessness in 4 European countries and evaluated the quality of data collected in a multicenter cohort. Understanding variability in demographics, health status, and service use is essential for designing interventions tailored to this population’s needs. The analysis showed pronounced between-pilot differences: for most questionnaires, the GPD exceeded 0.7 at both pilot and aggregate levels (Figures S1 and S2 in <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>), indicating substantial heterogeneity. The sole exception was the health questionnaire, whose lower GPD likely reflects that only a single quantitative item remained after discarding multichoice and free-text responses. Missing-data diagnostics revealed further site-specific discrepancies, with the Spanish cohort diverging most markedly, particularly in the use of health services, quality of life, and interpersonal communication (Figures 2 and 3).</p>
        <p>Participants’ responses reveal notable differences in the experiences of people experiencing homelessness across the various countries. While the heterogeneity observed within the homeless population can, in part, be attributed to country-specific factors, such as distinct socioeconomic and health care contexts, variations in responses may also stem from differences in the implementation of interventions and the subjective perceptions of individual participants. These discrepancies are particularly evident in key areas assessed by the PCA, including health-related domains, where divergent patterns emerge based on both contextual and personal factors. In the case of Q136: “Do you have a care plan (or a single plan of care) that takes into account all your health and wellbeing needs?” Spain stands out as the only country, where more individuals have health plans than those without. Additionally, Austria is unique in having no instances of “I don’t know” responses to this question. For Q134: “Do you have a single professional (or several professionals) who takes responsibility for coordinating your care across the services that you use?” Spain and the United Kingdom are distinguished by having more positive responses than negative ones. Notably, the United Kingdom records the highest number of participants uncertain about their answers. Furthermore, Spain shows a substantially higher number of blank responses for both Q136 and Q134. Meanwhile, concerning 3 questions belonging to the HCEQ subquestionnaire: Q104: “During the last 6 months, how important is it that you obtained all the information you wanted?” Q106: “During the last 6 months, how important is it that you and your loved ones decide the need for the health care and services?” and Q108: “During the last 6 months, how important is it that you and your loved ones decide the amount of health care and services?” In general terms, both in the United Kingdom and Austria, the response rate is higher than in Spain and Greece. Meanwhile, the United Kingdom and Austria maintain the same number of answers for these questions, with the UK participants being the most important for all 3 questions and the Austrian participants the second most important. We see how, in the case of Greek cities and Spain, the difference lies in the type of question; in the case of Q106, the Greek cities considered it very unimportant, while the participants in the Spanish pilot considered it the most important of the 3. However, the opposite effect was observed in the case of Q104 and Q108. Finally, for Q88: “We would like to know how good or bad your health is today. 100 means the best health you can imagine. 0 means the worst health you can imagine.” being the perceived health status is a major patient-reported experience measure of the study.</p>
      </sec>
      <sec>
        <title>Significance</title>
        <p>This study, as far as the authors know, is the first study confirming the heterogeneity within the group of people experiencing homelessness in a European multicenter study, as most of the previous studies have been primarily focused on the US-American context [<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref47">47</xref>]. The study’s results enable quantifying this heterogeneity between the different pilots that conform to the database through various factors that should be considered in a posteriori analysis. First, despite heterogeneity, the only set of items that can be assumed to be the most appropriate if a global analysis is desired is the health data questions since they do not present any missings, as are the ones with the least variability between pilots. Second, in the case of interpersonal communication and use of health care services, the global result could not be correctly determined since most of the data were imputed in the case of Spain, which does not make the analysis at a global level appropriate. Finally, the analyses at the section level should be done separately for each pilot, with the HCEQ being the most relevant since it presents greater variability between pilots and does not contain missing values. Therefore, the analysis of the pilots must be carried out independently, and the conclusions of one pilot cannot be extrapolated to the others, given the great divergence found between them. The disparities in the global dataset are more pronounced for Spain. In contrast to the other pilots, the methodology shows that ordinary missing values constitute the majority, especially within the interpersonal communication and health care utilization questionnaires.</p>
        <p>In this context, it is important to recognize that eliciting such variation, whether through the proposed methodology or other approaches, is not necessarily a DQ issue. Rather, it is an expected step for adapting the interventions to the specific socioeconomic and health care contexts. However, the nature and source of this variation should be carefully considered, as concerns may arise if the variation is driven by systematic measurement error or bias, which could influence the validity of the findings and the effectiveness of the interventions. This proposed methodology can help to find such variation prior to any analysis and therefore approach it, considering the characteristics of the dataset under study.</p>
      </sec>
      <sec>
        <title>Strengths and Limitations</title>
        <p>Including this methodology to analyze the data enables us to demonstrate 3 objectives that help ensure DQ for improved analysis. First, our approach allows us to evaluate the variability existing in the data, especially the differences between the data from different sources from a more visual perspective and with a single iteration, considering all types of variables for the analysis, without going into detail in classical tests that are more sensitive to the analysis. The technique used for DQ of the responses in the different pilots and to evaluate their quality in terms of missing information makes use of the comparative datasets, transforming them into probability distributions that allow using comparative metrics of similarity and, therefore, the level of nonoverlapping between them. Thus, it is necessary to know the boundaries regarding the exploitation capacity of the dataset for prospective uses, especially with the scarcity of homelessness quantitative information. Second, this hierarchical approach allows for monitoring the pilots’ progress and comparing them as a whole and by different sections. As data become available, we can promptly detect and correct deviations from the established methodology or protocol. This approach also enables the systematic identification of patterns and causes of missing data, supports the implementation of targeted corrective measures, and—by embedding these methods in a control framework—drives continuous improvement in information quality. Third, further analyses of DQ with new data or batches can be applied thanks to the replicability of the methodology, given that the source code has been made public.</p>
        <p>The analysis of the overall results is affected by the large number of missing values in the Spain dataset. Since there are many questions with missing data, an imputation had to be performed, which negatively influenced the results. In addition, the number of samples is not very high for our applied method, which may also impact the results. This is because the methodology used is sensitive and requires a large amount of data to generalize results more accurately. Missing values were imputed with reference to the pooled empirical distribution of all pilot sites. While this cross-site approach may introduce some location-specific bias, it enhances methodological robustness by preserving the overall variance structure; this was exemplified in the Spanish cohort, where the 2-part analysis coupled with the imputation procedure successfully pinpointed the sources of variability.</p>
      </sec>
      <sec>
        <title>Future Perspectives</title>
        <p>For all of those reasons, the results of this study will facilitate prospective dataset DQ labeling for prospective publication in related health data access bodies in the framework of the European Union’s European Health Data Space (EHDS) initiative [<xref ref-type="bibr" rid="ref48">48</xref>] in compliance with Article 78 on DQ that will allow secondary use of health data for research, innovation, and policymaking under conditions of security and privacy by ensuring a certain level of DQ that will enable users to know in advance the characteristics of the CANCERLESS dataset thanks to the applied methodology.</p>
        <p>Following current best-practice guidance on dataset curation, other DQ dimensions not covered in this study—such as temporal coherence, consistency, or correctness—will be assessed as part of the mid-scale pilot of the EHDS project QUANTUM (“Quality, Utility and Maturity Measured”). QUANTUM will pilot an European Union–wide framework for rating both the intrinsic quality of health datasets and the maturity of their curation processes; CANCERLESS database will conform to one of these analyses, supporting our analysis and getting externally validated, a multidimensional appraisal that complements this analysis.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>The analysis of this multicenter sample of people experiencing homelessness from 4 different European countries revealed substantial heterogeneity between sites of special importance for health care empowerment, quality of life, and interpersonal communication values, which showed the most differences between pilots. Particularly, differences in missingness patterns in data were larger than the ones found on the raw data, especially for the Spain pilot, highlighting that the interpersonal communication, health care empowerment, and use of health services data present a high number of nulls and should not be used for analysis. Further qualitative techniques are needed to understand the cause of this deviation from the other pilots. This methodology should be applied to multicentric data to monitor a pilot as the data become available and, therefore, amend possible protocol deviations. In summary, as quantitative data about homelessness are scarce, using a DQ-validated dataset in the context of the EHDS is crucial to ensure the reliable use of data to facilitate research on vulnerable populations such as people experiencing homelessness.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>T0 questionnaire.</p>
        <media xlink:href="medinform_v13i1e73596_app1.docx" xlink:title="DOCX File , 171 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>Most principal component analysis and multiple correspondence analysis relevant questions.</p>
        <media xlink:href="medinform_v13i1e73596_app2.docx" xlink:title="DOCX File , 115 KB"/>
      </supplementary-material>
      <supplementary-material id="app3">
        <label>Multimedia Appendix 3</label>
        <p>Multiple correspondence analysis metrics for CANCERLESS dataset.</p>
        <media xlink:href="medinform_v13i1e73596_app3.docx" xlink:title="DOCX File , 247 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">DQ</term>
          <def>
            <p>data quality</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">EHDS</term>
          <def>
            <p>European Health Data Space</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">GPD</term>
          <def>
            <p>global probabilistic deviation</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">HCEQ</term>
          <def>
            <p>Health Care Empowerment Questionnaire</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">MCA</term>
          <def>
            <p>multiple correspondence analysis</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">MSV</term>
          <def>
            <p>multisource variability</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">PCA</term>
          <def>
            <p>principal component analysis</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">SPO</term>
          <def>
            <p>source probabilistic outlyingness</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>The CANCERLESS project has been funded by the European Commission’s Programme Horizon 2020 (grant agreement 965351). This publication reflects the author’s views. The European Commission is not responsible for any use that may be made of the information it contains. The study is partly funded through the QUANTUM project HORIZON-HLTH-2023-TOOL-05-09—Developing a Data Quality and Utility Label for the European Health Data Space (grant agreement 101137057).</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fragner</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Belogianni</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Grabovac</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Cancer care in people experiencing homelessness: identifying key issues, challenges, and facilitators</article-title>
          <source>Br J Gen Pract</source>
          <year>2024</year>
          <volume>74</volume>
          <issue>745</issue>
          <fpage>342</fpage>
          <lpage>343</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bjgp.org/lookup/pmidlookup?view=long&amp;pmid=39054087"/>
          </comment>
          <pub-id pub-id-type="doi">10.3399/bjgp24X738801</pub-id>
          <pub-id pub-id-type="medline">39054087</pub-id>
          <pub-id pub-id-type="pii">74/745/342</pub-id>
          <pub-id pub-id-type="pmcid">PMC11299681</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Somerville</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Understanding homelessness</article-title>
          <source>Hous Theory Soc</source>
          <year>2013</year>
          <volume>30</volume>
          <issue>4</issue>
          <fpage>384</fpage>
          <lpage>415</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1080/14036096.2012.756096"/>
          </comment>
          <pub-id pub-id-type="doi">10.1080/14036096.2012.756096</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Toro</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Toward an international understanding of homelessness</article-title>
          <source>J Soc Issues</source>
          <year>2007</year>
          <volume>63</volume>
          <issue>3</issue>
          <fpage>461</fpage>
          <lpage>481</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1111/j.1540-4560.2007.00519.x"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/j.1540-4560.2007.00519.x</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nilsson</surname>
              <given-names>SF</given-names>
            </name>
            <name name-style="western">
              <surname>Nordentoft</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hjorthøj</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Individual-level predictors for becoming homeless and exiting homelessness: a systematic review and meta-analysis</article-title>
          <source>J Urban Health</source>
          <year>2019</year>
          <volume>96</volume>
          <issue>5</issue>
          <fpage>741</fpage>
          <lpage>750</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/31388823"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s11524-019-00377-x</pub-id>
          <pub-id pub-id-type="medline">31388823</pub-id>
          <pub-id pub-id-type="pii">10.1007/s11524-019-00377-x</pub-id>
          <pub-id pub-id-type="pmcid">PMC6814700</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Warburton</surname>
              <given-names>WA</given-names>
            </name>
            <name name-style="western">
              <surname>Papic</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Whittaker</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Heterogeneity among homeless Australian women and their reasons for homelessness entry</article-title>
          <source>Int J Environ Res Public Health</source>
          <year>2022</year>
          <volume>19</volume>
          <issue>15</issue>
          <fpage>8909</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=ijerph19158909"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/ijerph19158909</pub-id>
          <pub-id pub-id-type="medline">35897280</pub-id>
          <pub-id pub-id-type="pii">ijerph19158909</pub-id>
          <pub-id pub-id-type="pmcid">PMC9331468</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Alexiev</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Eighth overview of housing exclusion in Europe</article-title>
          <source>Florent Houdmon (City of Marseille, France)</source>
          <year>2023</year>
          <access-date>2025-10-08</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.feantsa.org/public/user/Resources/reports/2023/OVERVIEW/Rapport_EN.pdf">https://www.feantsa.org/public/user/Resources/reports/2023/OVERVIEW/Rapport_EN.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Funk</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Greene</surname>
              <given-names>RN</given-names>
            </name>
            <name name-style="western">
              <surname>Dill</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Valvassori</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>The impact of homelessness on mortality of individuals living in the United States: a systematic review of the literature</article-title>
          <source>J Health Care Poor Underserved</source>
          <year>2022</year>
          <volume>33</volume>
          <issue>1</issue>
          <fpage>457</fpage>
          <lpage>477</lpage>
          <pub-id pub-id-type="doi">10.1353/hpu.2022.0035</pub-id>
          <pub-id pub-id-type="medline">35153234</pub-id>
          <pub-id pub-id-type="pii">S1548686922100355</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Perera</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Chow</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ho</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Nguyen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Davachi</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Cardiovascular disease risk among the poor and homeless—what we know so far</article-title>
          <source>Curr Cardiol Rev</source>
          <year>2009</year>
          <volume>5</volume>
          <issue>1</issue>
          <fpage>69</fpage>
          <lpage>77</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/20066152"/>
          </comment>
          <pub-id pub-id-type="doi">10.2174/157340309787048086</pub-id>
          <pub-id pub-id-type="medline">20066152</pub-id>
          <pub-id pub-id-type="pmcid">PMC2803292</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Carmichael</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Schiffler</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Moudatsou</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Tabaki</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Doñate-Martínez</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Alhambra-Borrás</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Kouvari</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Karnaki</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Gil-Salmeron</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Grabovac</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Barriers and facilitators to health care access for people experiencing homelessness in four European countries: an exploratory qualitative study</article-title>
          <source>Int J Equity Health</source>
          <year>2023</year>
          <volume>22</volume>
          <issue>1</issue>
          <fpage>206</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://equityhealthj.biomedcentral.com/articles/10.1186/s12939-023-02011-4"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12939-023-02011-4</pub-id>
          <pub-id pub-id-type="medline">37803317</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12939-023-02011-4</pub-id>
          <pub-id pub-id-type="pmcid">PMC10559410</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jeleff</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Haider</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Schiffler</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Gil-Salmerón</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Barreto Schuch</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Grabovac</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Cancer risk factors and access to cancer prevention services for people experiencing homelessness</article-title>
          <source>Lancet Public Health</source>
          <year>2024</year>
          <volume>9</volume>
          <issue>2</issue>
          <fpage>e128</fpage>
          <lpage>e146</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2468-2667(23)00298-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/S2468-2667(23)00298-0</pub-id>
          <pub-id pub-id-type="medline">38307679</pub-id>
          <pub-id pub-id-type="pii">S2468-2667(23)00298-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Aldridge</surname>
              <given-names>RW</given-names>
            </name>
            <name name-style="western">
              <surname>Menezes</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Lewer</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Cornes</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Evans</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Blackburn</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Byng</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Clark</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Denaxas</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Fuller</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hewett</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Kilmister</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Luchenski</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Manthorpe</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>McKee</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Neale</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Story</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Tinelli</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Whiteford</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Wurie</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Hayward</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Causes of death among homeless people: a population-based cross-sectional study of linked hospitalisation and mortality data in England</article-title>
          <source>Wellcome Open Res</source>
          <year>2019</year>
          <volume>4</volume>
          <fpage>49</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/30984881"/>
          </comment>
          <pub-id pub-id-type="doi">10.12688/wellcomeopenres.15151.1</pub-id>
          <pub-id pub-id-type="medline">30984881</pub-id>
          <pub-id pub-id-type="pmcid">PMC6449792</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lawrie</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Charow</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Giuliani</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Papadakos</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Homelessness, cancer and health literacy: a scoping review</article-title>
          <source>J Health Care Poor Underserved</source>
          <year>2020</year>
          <volume>31</volume>
          <issue>1</issue>
          <fpage>81</fpage>
          <lpage>104</lpage>
          <pub-id pub-id-type="doi">10.1353/hpu.2020.0010</pub-id>
          <pub-id pub-id-type="medline">32037319</pub-id>
          <pub-id pub-id-type="pii">S154868692010010X</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schiffler</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Carmichael</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Doñate-Martínez</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Alhambra-Borrás</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Varadé</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Barrio Cortes</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kouvari</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Karnaki</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Moudatsou</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Tabaki</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Gil-Salmeron</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Grabovac</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Access to cancer preventive care and program considerations for people experiencing homelessness across four European countries: an exploratory qualitative study</article-title>
          <source>EClinicalMedicine</source>
          <year>2023</year>
          <volume>62</volume>
          <fpage>102095</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2589-5370(23)00272-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.eclinm.2023.102095</pub-id>
          <pub-id pub-id-type="medline">37533422</pub-id>
          <pub-id pub-id-type="pii">S2589-5370(23)00272-9</pub-id>
          <pub-id pub-id-type="pmcid">PMC10393536</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Carmichael</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Aldasoro</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Gil Salmerón</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Alhambra-Borrás</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Doñate-Martínez</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Seiler-Ramadas</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Grabovac</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Exploring the application of the navigation model with people experiencing homelessness: a scoping review</article-title>
          <source>J Soc Distress Homeless</source>
          <year>2022</year>
          <volume>32</volume>
          <issue>2</issue>
          <fpage>352</fpage>
          <lpage>366</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1080/10530789.2021.2021363"/>
          </comment>
          <pub-id pub-id-type="doi">10.1080/10530789.2021.2021363</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Baggett</surname>
              <given-names>TP</given-names>
            </name>
            <name name-style="western">
              <surname>Barbosa Teixeira</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Rodriguez</surname>
              <given-names>EC</given-names>
            </name>
            <name name-style="western">
              <surname>Anandakugan</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Sporn</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Percac-Lima</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>ER</given-names>
            </name>
            <name name-style="western">
              <surname>Rigotti</surname>
              <given-names>NA</given-names>
            </name>
          </person-group>
          <article-title>Patient navigation to promote lung cancer screening in a community health center for people experiencing homelessness: protocol for a pragmatic randomized controlled trial</article-title>
          <source>Contemp Clin Trials</source>
          <year>2022</year>
          <volume>113</volume>
          <fpage>106666</fpage>
          <pub-id pub-id-type="doi">10.1016/j.cct.2021.106666</pub-id>
          <pub-id pub-id-type="medline">34971796</pub-id>
          <pub-id pub-id-type="pii">S1551-7144(21)00402-X</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Robinson</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Trevors Babici</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Tedesco</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Spaner</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Morey</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Dosani</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Assessing the impact of a health navigator on improving access to care and addressing the social needs of palliative care patients experiencing homelessness: a service evaluation</article-title>
          <source>Palliat Med</source>
          <year>2023</year>
          <volume>37</volume>
          <issue>4</issue>
          <fpage>646</fpage>
          <lpage>651</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://journals.sagepub.com/doi/10.1177/02692163221146812?url_ver=Z39.88-2003&amp;rfr_id=ori:rid:crossref.org&amp;rfr_dat=cr_pub  0pubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/02692163221146812</pub-id>
          <pub-id pub-id-type="medline">36576315</pub-id>
          <pub-id pub-id-type="pmcid">PMC10074742</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kline</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Rocque</surname>
              <given-names>GB</given-names>
            </name>
            <name name-style="western">
              <surname>Rohan</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Blackley</surname>
              <given-names>KA</given-names>
            </name>
            <name name-style="western">
              <surname>Cantril</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Pratt-Chapman</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Burris</surname>
              <given-names>HA</given-names>
            </name>
            <name name-style="western">
              <surname>Shulman</surname>
              <given-names>LN</given-names>
            </name>
          </person-group>
          <article-title>Patient navigation in cancer: the business case to support clinical needs</article-title>
          <source>J Oncol Pract</source>
          <year>2019</year>
          <volume>15</volume>
          <issue>11</issue>
          <fpage>585</fpage>
          <lpage>590</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/31509483"/>
          </comment>
          <pub-id pub-id-type="doi">10.1200/JOP.19.00230</pub-id>
          <pub-id pub-id-type="medline">31509483</pub-id>
          <pub-id pub-id-type="pmcid">PMC8790714</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="web">
          <article-title>WHO guidelines on hand hygiene in health care</article-title>
          <source>World Health Organization</source>
          <year>2010</year>
          <access-date>2025-10-08</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.who.int/publications/i/item/9789241597906">https://www.who.int/publications/i/item/9789241597906</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Te Boveldt</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Vernooij-Dassen</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Leppink</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Samwel</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Vissers</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Engels</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Patient empowerment in cancer pain management: an integrative literature review</article-title>
          <source>Psychooncology</source>
          <year>2014</year>
          <volume>23</volume>
          <issue>11</issue>
          <fpage>1203</fpage>
          <lpage>1211</lpage>
          <pub-id pub-id-type="doi">10.1002/pon.3573</pub-id>
          <pub-id pub-id-type="medline">24816749</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gianfrancesco</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Tamang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Yazdany</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Schmajuk</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Potential biases in machine learning algorithms using electronic health record data</article-title>
          <source>JAMA Intern Med</source>
          <year>2018</year>
          <volume>178</volume>
          <issue>11</issue>
          <fpage>1544</fpage>
          <lpage>1547</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/30128552"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jamainternmed.2018.3763</pub-id>
          <pub-id pub-id-type="medline">30128552</pub-id>
          <pub-id pub-id-type="pii">2697394</pub-id>
          <pub-id pub-id-type="pmcid">PMC6347576</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sáez</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Robles</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>García-Gómez</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>Comparative study of probability distribution distances to define a metric for the stability of multi-source biomedical research data</article-title>
          <year>2013</year>
          <conf-name>35th Annual International Conference of the IEEE Engineering in Medicine and Biology Society (EMBC)</conf-name>
          <conf-date>July 3-7, 2013</conf-date>
          <conf-loc>Osaka, Japan</conf-loc>
          <fpage>3226</fpage>
          <lpage>3229</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1109/EMBC.2013.6610228"/>
          </comment>
          <pub-id pub-id-type="doi">10.1109/embc.2013.6610228</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Peressini</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Pathways into homelessness: testing the heterogeneity hypothesis</article-title>
          <source>Finding Home Policy Options for Addressing Homelessness in Canada</source>
          <year>2009</year>
          <publisher-loc>Toronto, Ontario</publisher-loc>
          <publisher-name>University of Toronto</publisher-name>
          <fpage>1</fpage>
          <lpage>17</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rosenheck</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Bassuk</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Salomon</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Special populations of homeless Americans</article-title>
          <source>Practical Lessons from the 1998 National Symposium on Homeless Research</source>
          <year>1999</year>
          <publisher-loc>Washington, DC</publisher-loc>
          <publisher-name>US Department of Health and Human Services</publisher-name>
          <fpage>1</fpage>
          <lpage>27</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rajkomar</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Dean</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kohane</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Machine learning in medicine</article-title>
          <source>N Engl J Med</source>
          <year>2019</year>
          <volume>380</volume>
          <issue>14</issue>
          <fpage>1347</fpage>
          <lpage>1358</lpage>
          <pub-id pub-id-type="doi">10.1056/NEJMra1814259</pub-id>
          <pub-id pub-id-type="medline">30943338</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kelly</surname>
              <given-names>CJ</given-names>
            </name>
            <name name-style="western">
              <surname>Karthikesalingam</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Suleyman</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Corrado</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>King</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Key challenges for delivering clinical impact with artificial intelligence</article-title>
          <source>BMC Med</source>
          <year>2019</year>
          <volume>17</volume>
          <issue>1</issue>
          <fpage>195</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedicine.biomedcentral.com/articles/10.1186/s12916-019-1426-2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12916-019-1426-2</pub-id>
          <pub-id pub-id-type="medline">31665002</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12916-019-1426-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC6821018</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sáez</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Romero</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Conejero</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>García-Gómez</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>Potential limitations in COVID-19 machine learning due to data source variability: a case study in the nCov2019 dataset</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2021</year>
          <volume>28</volume>
          <issue>2</issue>
          <fpage>360</fpage>
          <lpage>364</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://riunet.upv.es/handle/10251/189724"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocaa258</pub-id>
          <pub-id pub-id-type="medline">33027509</pub-id>
          <pub-id pub-id-type="pii">5919075</pub-id>
          <pub-id pub-id-type="pmcid">PMC7797735</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Souza</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Johnata</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Ismael</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>João</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Mariana</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Andreia</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>João</surname>
              <given-names>SC</given-names>
            </name>
          </person-group>
          <article-title>Measuring  variability in acute myocardial infarction coding using a statistical process control and probabilistic temporal data quality control approaches</article-title>
          <year>2021</year>
          <conf-name>Trends and Applications in Information Systems and Technologies (WorldCIST 2021)</conf-name>
          <conf-date>April 30, 2021</conf-date>
          <conf-loc>Azores, Portugal</conf-loc>
          <fpage>193</fpage>
          <lpage>202</lpage>
          <pub-id pub-id-type="doi">10.1007/978-3-030-72651-5_19</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sáez</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Martínez-Miranda</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Robles</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>García-Gómez</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>Organizing data quality assessment of shifting biomedical data</article-title>
          <source>Stud Health Technol Inform</source>
          <year>2012</year>
          <month>8</month>
          <volume>180</volume>
          <fpage>721</fpage>
          <lpage>725</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.researchgate.net/publication/230637487_Organizing_data_quality_assessment_of_shifting_biomedical_data"/>
          </comment>
          <pub-id pub-id-type="doi">10.3233/978-1-61499-101-4-721</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Edgar</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>The ETHOS definition and classification of homelessness and housing exclusion</article-title>
          <source>Eur J Homelessness</source>
          <year>2012</year>
          <volume>6</volume>
          <issue>2</issue>
          <fpage>219</fpage>
          <lpage>225</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.feantsaresearch.org/download/ejh6_2_resp_ethosdef14957038748931638958.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <collab>EuroQol Group</collab>
          </person-group>
          <article-title>EuroQol—a new facility for the measurement of health-related quality of life</article-title>
          <source>Health Policy</source>
          <year>1990</year>
          <volume>16</volume>
          <issue>3</issue>
          <fpage>199</fpage>
          <lpage>208</lpage>
          <pub-id pub-id-type="doi">10.1016/0168-8510(90)90421-9</pub-id>
          <pub-id pub-id-type="medline">10109801</pub-id>
          <pub-id pub-id-type="pii">0168-8510(90)90421-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gagnon</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hibert</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Dubé</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Dubois</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Development and validation of an instrument measuring individual empowerment in relation to personal health care: the Health Care Empowerment Questionnaire (HCEQ)</article-title>
          <source>Am J Health Promot</source>
          <year>2006</year>
          <volume>20</volume>
          <issue>6</issue>
          <fpage>429</fpage>
          <lpage>435</lpage>
          <pub-id pub-id-type="doi">10.4278/0890-1171-20.6.429</pub-id>
          <pub-id pub-id-type="medline">16871823</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Derogatis</surname>
              <given-names>LR</given-names>
            </name>
          </person-group>
          <source>Brief Symptom Inventory 18</source>
          <year>2001</year>
          <publisher-loc>Baltimore, MD</publisher-loc>
          <publisher-name>Johns Hopkins University</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lloyd</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Fosh</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Whalley</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Byng</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Close</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Validation of the person-centred coordinated care experience questionnaire (P3CEQ)</article-title>
          <source>Int J Qual Health Care</source>
          <year>2019</year>
          <volume>31</volume>
          <issue>7</issue>
          <fpage>506</fpage>
          <lpage>512</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/30508089"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/intqhc/mzy212</pub-id>
          <pub-id pub-id-type="medline">30508089</pub-id>
          <pub-id pub-id-type="pii">5225143</pub-id>
          <pub-id pub-id-type="pmcid">PMC6839368</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sáez</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Robles</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>García-Gómez</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>Stability metrics for multi-source biomedical data based on simplicial projections from probability distribution distances</article-title>
          <source>Stat Methods Med Res</source>
          <year>2017</year>
          <volume>26</volume>
          <issue>1</issue>
          <fpage>312</fpage>
          <lpage>336</lpage>
          <pub-id pub-id-type="doi">10.1177/0962280214545122</pub-id>
          <pub-id pub-id-type="medline">25091808</pub-id>
          <pub-id pub-id-type="pii">0962280214545122</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sáez</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zurriaga</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Pérez-Panadés</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Melchor</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Robles</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>García-Gómez</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>Applying probabilistic temporal and multisite data quality control methods to a public health mortality registry in Spain: a systematic approach to quality control of repositories</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2016</year>
          <volume>23</volume>
          <issue>6</issue>
          <fpage>1085</fpage>
          <lpage>1095</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://riunet.upv.es/handle/10251/80897"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocw010</pub-id>
          <pub-id pub-id-type="medline">27107447</pub-id>
          <pub-id pub-id-type="pii">ocw010</pub-id>
          <pub-id pub-id-type="pmcid">PMC11741068</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Van Buuren</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Groothuis-Oudshoorn</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>mice: multivariate imputation by chained equations in R</article-title>
          <source>J Stat Softw</source>
          <year>2011</year>
          <volume>45</volume>
          <fpage>1</fpage>
          <lpage>67</lpage>
          <pub-id pub-id-type="doi">10.32614/cran.package.mice</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ferri</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Romero-Garcia</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Badenes</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Lora-Pablos</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Morales</surname>
              <given-names>TG</given-names>
            </name>
            <name name-style="western">
              <surname>Gómez de la Cámara</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>García-Gómez</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Sáez</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Extremely missing numerical data in electronic health records for machine learning can be managed through simple imputation methods considering informative missingness: a comparative of solutions in a COVID-19 mortality case study</article-title>
          <source>Comput Methods Programs Biomed</source>
          <year>2023</year>
          <volume>242</volume>
          <fpage>107803</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0169-2607(23)00469-8"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.cmpb.2023.107803</pub-id>
          <pub-id pub-id-type="medline">37703700</pub-id>
          <pub-id pub-id-type="pii">S0169-2607(23)00469-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Abdi</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>LJ</given-names>
            </name>
          </person-group>
          <article-title>Principal component analysis</article-title>
          <source>WIREs Comput Stat</source>
          <year>2010</year>
          <volume>2</volume>
          <issue>4</issue>
          <fpage>433</fpage>
          <lpage>459</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1002/wics.101"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/wics.101</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Breunig</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Kriegel</surname>
              <given-names>HP</given-names>
            </name>
            <name name-style="western">
              <surname>Ng</surname>
              <given-names>RT</given-names>
            </name>
            <name name-style="western">
              <surname>Sander</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>LOF: identifying density-based local outliers</article-title>
          <year>2000</year>
          <conf-name>SIGMOD/PODS00: ACM International Conference on Management of Data and Symposium on Principles of Database Systems</conf-name>
          <conf-date>May 15-18, 2000</conf-date>
          <conf-loc>Dallas, TX, United States</conf-loc>
          <fpage>93</fpage>
          <lpage>104</lpage>
          <pub-id pub-id-type="doi">10.1145/342009.335388</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Greenacre</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Blasius</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <source>Multiple Correspondence Analysis and Related Methods. 1st Edition</source>
          <year>2006</year>
          <publisher-loc>Boca Raton, FL</publisher-loc>
          <publisher-name>Chapman and Hall/CRC</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Van Rossum</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Drake</surname>
              <given-names>FL</given-names>
            </name>
          </person-group>
          <article-title>Python reference manual</article-title>
          <source>Centrum voor Wiskunde en Informatica</source>
          <year>1995</year>
          <access-date>2025-10-08</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ir.cwi.nl/pub/5008">https://ir.cwi.nl/pub/5008</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Harris</surname>
              <given-names>CR</given-names>
            </name>
            <name name-style="western">
              <surname>Millman</surname>
              <given-names>KJ</given-names>
            </name>
            <name name-style="western">
              <surname>van der Walt</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Gommers</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Virtanen</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Cournapeau</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Wieser</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Taylor</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Berg</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>NJ</given-names>
            </name>
            <name name-style="western">
              <surname>Kern</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Picus</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hoyer</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>van Kerkwijk</surname>
              <given-names>MH</given-names>
            </name>
            <name name-style="western">
              <surname>Brett</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Haldane</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Del Río</surname>
              <given-names>JF</given-names>
            </name>
            <name name-style="western">
              <surname>Wiebe</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Peterson</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Gérard-Marchant</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Sheppard</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Reddy</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Weckesser</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Abbasi</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Gohlke</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Oliphant</surname>
              <given-names>TE</given-names>
            </name>
          </person-group>
          <article-title>Array programming with NumPy</article-title>
          <source>Nature</source>
          <year>2020</year>
          <volume>585</volume>
          <issue>7825</issue>
          <fpage>357</fpage>
          <lpage>362</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32939066"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41586-020-2649-2</pub-id>
          <pub-id pub-id-type="medline">32939066</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41586-020-2649-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC7759461</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>McKinney</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Data structures for statistical computing in Python</article-title>
          <year>2010</year>
          <conf-name>Proceedings of the 9th Python in Science Conference (Vol 445)</conf-name>
          <conf-date>June 28-July 3, 2010</conf-date>
          <conf-loc>Austin, TX, United States</conf-loc>
          <fpage>51</fpage>
          <lpage>56</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://proceedings.scipy.org/articles/Majora-92bf1922-00a"/>
          </comment>
          <pub-id pub-id-type="doi">10.25080/majora-92bf1922-00a</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pedregosa, E</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Varoquaux</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Gramfort</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Michel</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Thirion</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Grisel</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Blondel</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Prettenhofer</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Weiss</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Duchesnay</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Scikit-learn: machine learning in Python</article-title>
          <source>J Mach Learn Res</source>
          <year>2011</year>
          <volume>12</volume>
          <fpage>2825</fpage>
          <lpage>2830</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://jmlr.org/papers/volume12/pedregosa11a/pedregosa11a.pdf"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fninf.2014.00014</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Halford</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>prince</article-title>
          <source>GitHub</source>
          <year>2025</year>
          <access-date>2025-10-08</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/MaxHalford/prince">https://github.com/MaxHalford/prince</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Blasco</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Blanes</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>bdslab-upv/dq_cancerless_analysis</article-title>
          <source>GitHub</source>
          <access-date>2025-10-08</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/bdslab-upv/dq_cancerless_analysis">https://github.com/bdslab-upv/dq_cancerless_analysis</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Toro</surname>
              <given-names>PA</given-names>
            </name>
            <name name-style="western">
              <surname>Dworsky</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Fowler</surname>
              <given-names>PJ</given-names>
            </name>
          </person-group>
          <article-title>Homeless youth in the United States: recent research findings and intervention approaches</article-title>
          <year>2007</year>
          <conf-name>National Symposium on Homelessness Research (Vol 6)</conf-name>
          <conf-date>March 1-2, 2007</conf-date>
          <conf-loc>Washington DC</conf-loc>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.researchgate.net/publication/237287723_6-_Homeless_Youth_in_the_United_States_Recent_Research_Findings_and_Intervention_Approaches"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="web">
          <article-title>European Health Data Space Regulation</article-title>
          <source>European Commission</source>
          <year>2024</year>
          <access-date>2024-10-07</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://health.ec.europa.eu/ehealth-digital-health-and-care/european-health-data-space_en">https://health.ec.europa.eu/ehealth-digital-health-and-care/european-health-data-space_en</ext-link>
          </comment>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
