<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id>
      <journal-title>JMIR Medical Informatics</journal-title>
      <issn pub-type="epub">2291-9694</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v9i8e27842</article-id>
      <article-id pub-id-type="pmid">34346902</article-id>
      <article-id pub-id-type="doi">10.2196/27842</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Quality of Hospital Electronic Health Record (EHR) Data Based on the International Consortium for Health Outcomes Measurement (ICHOM) in Heart Failure: Pilot Data Quality Assessment Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Lovis</surname>
            <given-names>Christian</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Myreteg</surname>
            <given-names>Gunilla</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Beerten</surname>
            <given-names>Simon</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author">
          <name name-style="western">
            <surname>Aerts</surname>
            <given-names>Hannelore</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-8806-7482</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Kalra</surname>
            <given-names>Dipak</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-2998-9882</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Sáez</surname>
            <given-names>Carlos</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2678-8249</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Ramírez-Anguita</surname>
            <given-names>Juan Manuel</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-8509-0927</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Mayer</surname>
            <given-names>Miguel-Angel</given-names>
          </name>
          <degrees>MD, PhD, MPH</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <address>
            <institution>Research Programme on Biomedical Informatics</institution>
            <institution>Hospital del Mar Medical Research Institute and Universitat Pompeu Fabra</institution>
            <addr-line>C/ Dr Aiguader 88</addr-line>
            <addr-line>Barcelona, 08003</addr-line>
            <country>Spain</country>
            <phone>34 933 160 539</phone>
            <email>miguelangel.mayer@upf.edu</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0362-6298</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Garcia-Gomez</surname>
            <given-names>Juan M</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-3851-1557</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Durà-Hernández</surname>
            <given-names>Marta</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-8269-9753</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author">
          <name name-style="western">
            <surname>Thienpont</surname>
            <given-names>Geert</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-4257-1624</ext-link>
        </contrib>
        <contrib id="contrib9" contrib-type="author">
          <name name-style="western">
            <surname>Coorevits</surname>
            <given-names>Pascal</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6515-7514</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Medical Informatics and Statistics Unit, Department of Public Health and Primary Care</institution>
        <institution>Faculty of Medicine and Health Sciences</institution>
        <institution>Ghent University</institution>
        <addr-line>Ghent</addr-line>
        <country>Belgium</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>The European Institute for Innovation through Health Data (i~HD)</institution>
        <addr-line>Ghent</addr-line>
        <country>Belgium</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Biomedical Data Science Lab</institution>
        <institution>Instituto Universitario de Tecnologías de la Información y Comunicaciones</institution>
        <institution>Universitat Politècnica de València</institution>
        <addr-line>Valencia</addr-line>
        <country>Spain</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Research Programme on Biomedical Informatics</institution>
        <institution>Hospital del Mar Medical Research Institute and Universitat Pompeu Fabra</institution>
        <addr-line>Barcelona</addr-line>
        <country>Spain</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>Research in Advanced Medical Informatics and Telematics (RAMIT)</institution>
        <addr-line>Ghent</addr-line>
        <country>Belgium</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Miguel-Angel Mayer <email>miguelangel.mayer@upf.edu</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>8</month>
        <year>2021</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>4</day>
        <month>8</month>
        <year>2021</year>
      </pub-date>
      <volume>9</volume>
      <issue>8</issue>
      <elocation-id>e27842</elocation-id>
      <history>
        <date date-type="received">
          <day>9</day>
          <month>2</month>
          <year>2021</year>
        </date>
        <date date-type="rev-request">
          <day>21</day>
          <month>3</month>
          <year>2021</year>
        </date>
        <date date-type="rev-recd">
          <day>30</day>
          <month>5</month>
          <year>2021</year>
        </date>
        <date date-type="accepted">
          <day>5</day>
          <month>6</month>
          <year>2021</year>
        </date>
      </history>
      <copyright-statement>©Hannelore Aerts, Dipak Kalra, Carlos Sáez, Juan Manuel Ramírez-Anguita, Miguel-Angel Mayer, Juan M Garcia-Gomez, Marta Durà-Hernández, Geert Thienpont, Pascal Coorevits. Originally published in JMIR Medical Informatics (https://medinform.jmir.org), 04.08.2021.</copyright-statement>
      <copyright-year>2021</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on https://medinform.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://medinform.jmir.org/2021/8/e27842" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>There is increasing recognition that health care providers need to focus attention on, and be judged against, the impact they have on the health outcomes experienced by patients. The measurement of health outcomes as a routine part of clinical documentation is probably the only scalable way of collecting outcomes evidence, since secondary data collection is expensive and error-prone. However, there is uncertainty about whether routinely collected clinical data within electronic health record (EHR) systems include the data most relevant to measuring and comparing outcomes and whether those items are collected to a good enough data quality to be relied upon for outcomes assessment, since several studies have pointed out significant issues regarding EHR data availability and quality.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>In this paper, we first describe a practical approach to data quality assessment of health outcomes, based on a literature review of existing frameworks for quality assessment of health data and multistakeholder consultation. Adopting this approach, we performed a pilot study on a subset of 21 International Consortium for Health Outcomes Measurement (ICHOM) outcomes data items from patients with congestive heart failure.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>All available registries compatible with the diagnosis of heart failure within an EHR data repository of a general hospital (142,345 visits and 12,503 patients) were extracted and mapped to the ICHOM format. We focused our pilot assessment on 5 commonly used data quality dimensions: completeness, correctness, consistency, uniqueness, and temporal stability.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>We found high scores (&#62;95%) for the consistency, completeness, and uniqueness dimensions. Temporal stability analyses showed some changes over time in the reported use of medication to treat heart failure, as well as in the recording of past medical conditions. Finally, the investigation of data correctness suggested several issues concerning the characterization of missing data values. Many of these issues appear to be introduced while mapping the IMASIS-2 relational database contents to the ICHOM format, as the latter requires a level of detail that is not explicitly available in the coded data of an EHR.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Overall, results of this pilot study revealed good data quality for the subset of heart failure outcomes collected at the Hospital del Mar. Nevertheless, some important data errors were identified that were caused by fundamentally different data collection practices in routine clinical care versus research, for which the ICHOM standard set was originally developed. To truly examine to what extent hospitals today are able to routinely collect the evidence of their success in achieving good health outcomes, future research would benefit from performing more extensive data quality assessments, including all data items from the ICHOM standard set and across multiple hospitals.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>data quality</kwd>
        <kwd>electronic health records</kwd>
        <kwd>heart failure</kwd>
        <kwd>value-based health insurance</kwd>
        <kwd>patient outcome assessment</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Increasing quantities of health data are being collected across care organizations, creating a powerful opportunity to learn from these data how to improve patient care and accelerate research. The earliest call to action and formalized approach for using health data to assess quality of care was probably the Donabedian model of quality [<xref ref-type="bibr" rid="ref1">1</xref>]. Donabedian categorized the assessment of health care quality under structure (how services are organized and resourced), process (how care is delivered and what care activities are undertaken), and outcome (what health impact it has). Over the decades, it has proved much easier to develop and implement audits of structure or process, but formalized assessments of outcome appear to be more challenging because it is harder to define what we mean by outcomes and how best to measure them [<xref ref-type="bibr" rid="ref2">2</xref>]. A formalized approach to measuring health outcomes was proposed by Porter and Teisberg [<xref ref-type="bibr" rid="ref3">3</xref>], within their model of the assessment of “value” in a seminal publication in 2006. Within this value equation, outcomes were defined as “the outcomes that matter to patients and the costs to achieve those outcomes” [<xref ref-type="bibr" rid="ref3">3</xref>]. This “Value-Based Health Care” model has grown into a portfolio of health outcomes standards for measuring value, developed and promoted by the International Consortium for Health Outcomes Measurement (ICHOM). These health outcomes standards, formalized as indicators to be collected, quantified, and compared between health care providers, have stimulated a global interest in benchmarking and comparing health outcomes [<xref ref-type="bibr" rid="ref4">4</xref>].</p>
      <p>All these models hinge upon the essential ability to measure health, health care, and its outcomes. Health data are therefore a vital ingredient. To enable accurate measurement, data have to be captured and represented to a high quality. Unreliable data, such as incomplete, incorrect, or missing data entries, will inevitably lead to biased analyses, resulting in misdirected efforts to improve quality or false research interpretations.</p>
      <p>Yet, several studies have pointed out significant issues regarding availability and quality of electronic health record (EHR) data [<xref ref-type="bibr" rid="ref5">5</xref>-<xref ref-type="bibr" rid="ref10">10</xref>]. For example, the “Electronic Health Records for Clinical Research” project, funded by the Innovative Medicines Initiative, clearly demonstrated that many variables, among which even fundamental ones such as patient weight, are frequently not present within EHR systems [<xref ref-type="bibr" rid="ref8">8</xref>]. Incorrect or absent recording of patient weights, though, can lead to medication dosage errors. Hirata and colleagues [<xref ref-type="bibr" rid="ref11">11</xref>] examined the frequency and consequences of weight errors that occurred across 79,000 emergency department encounters of children under the age of 5 years. They revealed that, although weight errors were relatively rare (0.63%), a large proportion of weight errors led to subsequent medication-dosing errors (34%). An earlier study by Selbst and colleagues [<xref ref-type="bibr" rid="ref12">12</xref>] also investigated the consequences of medication errors in a pediatric emergency department. They found that almost half of patients required additional monitoring (30%), examination (6%), or treatment (12%) after medication errors resulting from weight errors. To obtain reliable outcome measures from routinely collected EHR data, Sáez et al [<xref ref-type="bibr" rid="ref10">10</xref>] developed a national, standardized, data quality–assessed, integrated data repository on maternal-child care. During this process, they found that variability in data quality across hospital sites could lead to imprecise comparison of measurements. 
Moreover, data quality indices, the efficiency of research processes, and the reliability of subsequent results have been found to improve if patient records are assessed for data quality [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref14">14</xref>]. Hence, quality assessment of source health data is crucial to identify and mitigate data quality problems for proper data use and reuse.</p>
      <p>In this paper, we first describe our practical approach to quality assessment of health outcomes data. Adopting this methodology, we performed a pilot study on a subset of ICHOM outcomes data collected during routine clinical care of patients with congestive heart failure (CHF) in a general hospital, given the high prevalence and margin for outcomes improvement in heart failure [<xref ref-type="bibr" rid="ref15">15</xref>]. Assessing data quality of outcomes data obtained during routine clinical care is of great interest since ICHOM indicators are currently collected through dedicated data collection into specialist outcome measurement systems, which results in useful data but is not a scalable process. The complexity of the analysis and in selecting the diagnosis for more than one condition, as well as the comorbidities associated with each disease, the different treatments received in each case, and all the variables used in the analysis, make it very difficult to conduct a system-wide quality assessment including several diseases and to interpret the results of a multiple disease analysis.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Data Quality Assessment</title>
        <p>Research into data quality has gained attention since the seminal work by Wang and Strong [<xref ref-type="bibr" rid="ref16">16</xref>], who proposed a comprehensive “fit-for-use” data quality assessment framework using data quality dimensions. Since then, several studies have aimed to define data quality dimensions and methodologies to describe and measure the complex multidimensional aspects of data quality [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref17">17</xref>-<xref ref-type="bibr" rid="ref20">20</xref>]. Across studies, little agreement exists about the exact definition and meaning of data quality dimensions. Despite differences in terminology, though, many of the proposed dimensions and solutions aim to address conceptually similar data quality features [<xref ref-type="bibr" rid="ref14">14</xref>]. </p>
        <p>Following a review of existing literature, the data quality task force of the European Institute for Innovation through Health Data (i~HD) [<xref ref-type="bibr" rid="ref21">21</xref>] identified 9 frameworks for quality assessment of health data [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref22">22</xref>-<xref ref-type="bibr" rid="ref27">27</xref>]. From these frameworks, 9 data quality dimensions were selected during a series of workshops with clinical care, clinical research, and information and communication technology leads from 70 European hospitals: completeness, consistency, correctness, uniqueness, stability, timeliness, trustworthiness, contextualization, and representativeness. The selected data quality dimensions were deemed most important to assess the quality of health data if these data are to be useful for patient care, organizational learning (quality improvement, such as the assessment of health outcomes), and research (big data research and case finding for clinical trial recruitment). <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> provides an overview of the selected data quality dimensions, together with their original terminology; the completeness, consistency, correctness, uniqueness, and stability dimensions were the most commonly used in the data quality literature, and for this reason, we selected them for the quality assessment in this study [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref20">20</xref>]. The remaining dimensions were not assessed; for instance, trustworthiness and timeliness are based on some types of metadata that are not usually available or accessible in EHRs. Although the first 3 dimensions (completeness, consistency, and correctness) can sometimes overlap in their definitions or be contained within each other, we prefer to treat them as orthogonal. 
For instance, a patient observation is incomplete if it is not registered, inconsistent if it does not comply with formatting requirements, or incorrect if it is unlikely to be true for a specific patient. For example, multiple normal kidney blood test results for a patient on dialysis would be consistent, though incorrect. Uniqueness, in turn, assesses whether duplications are present among patient records, for example as a result of an incomplete merging of patient records between hospital departments.</p>
        <p>Further, stability relates to the probabilistic concordance of data among different data sources such as hospitals, physicians, or devices or over time [<xref ref-type="bibr" rid="ref28">28</xref>]. For example, variability among centers has been found in liver offer acceptance rates for pediatric patients and cannot be explained by donor and recipient factors [<xref ref-type="bibr" rid="ref29">29</xref>]. In some cases, standardization of procedures and analyses can reduce levels of variability. However, sometimes differences among centers persist even when using standard procedures, for instance, between diffusion tensor magnetic resonance imaging findings obtained at different acquisition centers using a standard protocol [<xref ref-type="bibr" rid="ref30">30</xref>]. Likewise, when data are collected over time, temporal changes can occur due to several reasons, including changes in clinical practice or coding scheme used in the EHR [<xref ref-type="bibr" rid="ref31">31</xref>].</p>
        <p>Next, timeliness describes how promptly information is processed or how current recorded information is, for instance, to evaluate whether a current medication list within an EHR system is up to date or if there is a delay in updating this from a pharmacy subsystem. Trustworthiness relates to the availability of registry governance metadata and the data owner’s reputation. For example, it must be possible for someone accessing a health data item or clinical document to confidently know when and where it was captured, by whom, and if it has been modified since the original entry. Further, contextualization relates to whether the data are annotated with their acquisition context, which can be crucial for correct interpretation of the results, for instance, whether blood glucose laboratory results were obtained while the patient was fasting. Finally, representativeness captures whether a dataset is representative of the population from which it is supposed to be drawn, in order to allow valid inference.</p>
      </sec>
      <sec>
        <title>Pilot Assessment</title>
        <sec>
          <title>Dataset</title>
          <p>For this pilot assessment, we used data from the Parc Salut Mar Barcelona, a complete health care services organization with its information system database (IMASIS) as EHR. IMASIS includes and shares clinical information from 2 general hospitals, 1 mental health care center, 1 social health care center, and 5 emergency rooms in the Barcelona city area (Spain). IMASIS contains clinical information from approximately 1.5 million patients who have used the services of this health care system since 1989, across different settings such as admissions, outpatient consultations, emergency room visits, and major ambulatory surgery appointments. IMASIS-2 is the anonymized relational database of IMASIS that was created during the European Medical Information Framework (EMIF) project [<xref ref-type="bibr" rid="ref32">32</xref>] and is the data source used for research purposes. It contains structured data related to diagnosis, procedures, drug administration, and laboratory tests and clinical annotations in a free-text format. Since natural language processing falls beyond the scope of this project, we only used structured data. The study protocol was approved by the Ethics Committee of Parc Salut Mar (num. 2016/6935/I), under the research activities related to ischemic heart disease carried out during the EMIF project funded by the Innovative Medicines Initiative.</p>
          <p>As a case study, data from patients diagnosed with CHF were used. Heart failure is a chronic condition, severely impacting people’s quality of life. With a prevalence of over 23 million worldwide, it poses a significant public health problem [<xref ref-type="bibr" rid="ref33">33</xref>]. Collecting meaningful data on the health status of heart failure patients is therefore an important step to ensure better quality care and as a result, better quality of life for these patients.</p>
          <p>All patients (n=502,620) who attended the hospital at least once between January 1, 2006 and November 7, 2017 and who had at least one diagnosis entry of CHF were extracted from the IMASIS-2 database. Specifically, the selection of patients was based on the following diagnosis codes of the International Classification of Diseases ninth edition (ICD-9): 428, 428.0, 428.1, 428.2, 428.20, 428.21, 428.22, 428.23, 428.3, 428.30, 428.31, 428.32, 428.33, 428.4, 428.40, 428.41, 428.42, 428.43, 428.9. In total, the dataset included 142,345 patient visit records describing the medical history of 12,503 different patients who had one or more of these diagnoses. <xref rid="figure1" ref-type="fig">Figure 1</xref> provides a flow diagram of the different steps that were performed to obtain our study dataset. The main steps followed in the study were (1) a data anonymization process, (2) selection of the ICD-9 codes to select patients with CHF, (3) mapping data and variables included in the study to the ICHOM standard format, and (4) quality dimensions analysis.</p>
          <fig id="figure1" position="float">
            <label>Figure 1</label>
            <caption>
              <p>Overview of the procedure to identify the patients to generate the study dataset.</p>
            </caption>
            <graphic xlink:href="medinform_v9i8e27842_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
          <p>The ICHOM heart failure outcomes standard set [<xref ref-type="bibr" rid="ref13">13</xref>] was chosen as the most appropriate source of outcome indicators to target. Of the total of 72 ICHOM data items, a subset of 21 variables was selected as being most likely to be routinely collected within the hospital for patients with CHF and to be indicative of the overall quality of data collected for this type of patient. In addition, these variables allowed us to have complete information for the main characteristics of patients including age and sex as well as relevant comorbidities, such as hypertension or diabetes mellitus, and some of the most frequent treatments received for CHF, such as beta blockers, diuretics, and digoxin. The 21 variables were organized in 6 areas: identifiers, demographic factors, baseline health status, treatment variables, burden of care, and mortality. In addition, a visit identifier was included to distinguish different patient visit records. An overview of all variables included in the pilot assessment can be found in <xref ref-type="table" rid="table1">Table 1</xref>. In addition, <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref> shows the ICD-9 codes used to identify baseline health status variables, and <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref> shows the Anatomical Therapeutic Chemical classification system codes of the World Health Organization [<xref ref-type="bibr" rid="ref34">34</xref>] to retrieve patients’ medication usage. </p>
          <table-wrap position="float" id="table1">
            <label>Table 1</label>
            <caption>
              <p>Overview of International Consortium for Health Outcomes Measurement (ICHOM) variables used in the pilot assessment.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="30"/>
              <col width="250"/>
              <col width="0"/>
              <col width="420"/>
              <col width="0"/>
              <col width="300"/>
              <thead>
                <tr valign="top">
                  <td colspan="3">Item</td>
                  <td colspan="2">Definition</td>
                  <td>Response options</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td colspan="3">
                    <bold>Identifiers</bold>
                  </td>
                  <td colspan="2">
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Patient ID</td>
                  <td colspan="2">Patient’s medical record number</td>
                  <td colspan="2">According to institution</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Visit ID</td>
                  <td colspan="2">Unique visit record identifier</td>
                  <td colspan="2">Not included in the ICHOM standard set</td>
                </tr>
                <tr valign="top">
                  <td colspan="3">
                    <bold>Demographic factors</bold>
                  </td>
                  <td colspan="2">
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Age</td>
                  <td colspan="2">Date of birth</td>
                  <td colspan="2">DD/MM/YYYY</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Sex</td>
                  <td colspan="2">Sex at birth</td>
                  <td colspan="2">1=Male, 2=Female</td>
                </tr>
                <tr valign="top">
                  <td colspan="3">
                    <bold>Baseline health status</bold>
                  </td>
                  <td colspan="2">
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Atrial fibrillation</td>
                  <td colspan="2">Ever diagnosed with atrial fibrillation</td>
                  <td colspan="2">0=No, 1=Yes, 999=Unknown</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Prior myocardial infarction</td>
                  <td colspan="2">Ever diagnosed with myocardial infarction</td>
                  <td colspan="2">0=No, 1=Yes, 999=Unknown</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Hypertension</td>
                  <td colspan="2">History of hypertension</td>
                  <td colspan="2">0=No, 1=Yes, 999=Unknown</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Diabetes mellitus</td>
                  <td colspan="2">Ever diagnosed with diabetes mellitus</td>
                  <td colspan="2">0=No, 1=Yes, 999=Unknown</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Echocardiogram performed</td>
                  <td colspan="2">Echocardiogram performed to assess ejection fraction</td>
                  <td colspan="2">0=No, 1=Yes, 999=Unknown</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Height</td>
                  <td colspan="2">Height (cm)</td>
                  <td colspan="2">Numeric value of height in the metric system</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Weight</td>
                  <td colspan="2">Weight (kg)</td>
                  <td colspan="2">Numeric value of weight in the metric system</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Alcohol use</td>
                  <td colspan="2">Consumption of &#62;1 alcoholic drink a day</td>
                  <td colspan="2">0=No, 1=Yes, 999=Unknown</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Smoking status</td>
                  <td colspan="2">Current smoking status</td>
                  <td colspan="2">0=No, 1=Yes, 999=Unknown</td>
                </tr>
                <tr valign="top">
                  <td colspan="3">
                    <bold>Treatment variables</bold>
                  </td>
                  <td colspan="2">
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Beta blocker</td>
                  <td colspan="2">Beta blockers currently prescribed for heart failure</td>
                  <td colspan="2">0=No, 1=Yes, 999=Unknown</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Calcium channel blocker</td>
                  <td colspan="2">Calcium channel blockers currently prescribed for heart failure</td>
                  <td colspan="2">0=No, 1=Yes, 999=Unknown</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Digoxin</td>
                  <td colspan="2">Digoxin currently prescribed for heart failure</td>
                  <td colspan="2">0=No, 1=Yes, 999=Unknown</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Diuretics</td>
                  <td colspan="2">Diuretics currently prescribed for heart failure</td>
                  <td colspan="2">0=No, 1=Yes, 999=Unknown</td>
                </tr>
                <tr valign="top">
                  <td colspan="3">
                    <bold>Burden of care</bold>
                  </td>
                  <td colspan="2">
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Date of arrival</td>
                  <td colspan="2">Date of admittance</td>
                  <td colspan="2">DD/MM/YYYY</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Date of discharge</td>
                  <td colspan="2">Date of discharge</td>
                  <td colspan="2">DD/MM/YYYY</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Hospital admissions</td>
                  <td colspan="2">Number of hospitalizations in last 12 months due to heart failure</td>
                  <td colspan="2">Numerical value or 999=Unknown</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Hospital appointments</td>
                  <td colspan="2">Number of hospital appointments in last 12 months due to heart failure</td>
                  <td colspan="2">Numerical value or 999=Unknown</td>
                </tr>
                <tr valign="top">
                  <td colspan="3">
                    <bold>Mortality</bold>
                  </td>
                  <td colspan="2">
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Date of death</td>
                  <td colspan="2">Date patient was declared dead</td>
                  <td colspan="2">DD/MM/YYYY or 999=Unknown</td>
                </tr>
              </tbody>
            </table>
          </table-wrap>
          <p>Anonymized data on patients, visits, diagnosis, procedures, drug administration events, laboratory tests and patient measures were collected from the relational database IMASIS-2 where all these fact tables are connected to the patient table via the patient identifier. In addition, visit, diagnosis, and procedures are connected to each other via the visit identifiers, whereas drugs, laboratory, and patient measures are connected to all domains via date matching. Specific queries requesting data from each of these tables yielded the “Temporary datasets” that were subjected to several transformation steps and to a successive left outer join merging process in which patient and visit identifiers were set as the initial left dataset. As a result, data were organized in a “visit-centered” fashion (every row contains all data related to a visit), thus providing the final dataset according to the ICHOM format.</p>
        </sec>
        <sec>
          <title>Data Quality Dimensions</title>
          <p>To evaluate the quality of heart failure patient data collected during routine clinical care, a subset of 5 data quality dimensions was selected: completeness, correctness, consistency, uniqueness, and stability. These dimensions are most commonly used in the data quality literature and were deemed most interesting to assess given the nature of the data.</p>
          <p>First, for <italic>uniqueness</italic>, we measured the frequency with which partially duplicated patient records occur. Second, for <italic>consistency</italic>, we assessed data compliance with their expected data type (percentage of fields of a different type than defined), value range (percentage of fields out of the expected range), and basic multivariate rules (percentage of data not fulfilling rules; for example, patient’s arrival date should be before or equal to their date of discharge) [<xref ref-type="bibr" rid="ref10">10</xref>]. Next, for <italic>completeness,</italic> we measured the proportion of complete fields per variable. Further, for <italic>stability</italic>, we qualitatively evaluated the temporal stability of recorded past medical conditions and usage of different types of medications. To this end, we computed, per month, how many patient visit records mentioned a history of a particular medical condition or usage of a specific medication out of the total number of patient visit records that month. We then visualized trends for each of these data items by plotting the respective relative frequencies over time. Finally, we inferred data correctness from the data, either by combining information across variables or by investigating data from the same patient over time. Specifically, plausibility of height and weight was examined by computing patients’ BMIs. Further, we investigated the temporal order of past medical conditions, assuming that once a hospital visit record indicates that a patient has a history of atrial fibrillation, hypertension, diabetes, or myocardial infarction, the history of this diagnosis or event should be mentioned in all subsequent visit records. Based on this assumption, for assessment purposes, some deviations from this temporal order (ie, “history” followed by “no history”) point to data errors in the extracted dataset.</p>
        </sec>
        <sec>
          <title>Tools</title>
          <p>We conducted the data quality assessment using R, version 3.6.1 [<xref ref-type="bibr" rid="ref35">35</xref>]. For the temporal stability analyses, we used the EHRtemporalVariability R package [<xref ref-type="bibr" rid="ref36">36</xref>].</p>
        </sec>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Uniqueness</title>
        <p>Of a total of 142,345 patient visit records, 1.2% had identical visit identifiers even though values for one or more data items had different inputs (Uniqueness result 1=98.8%). In turn, 2.8% of all patient visit records had at least another record with a different visit identifier registered the same day and identical clinical data (Uniqueness result 2=97.2%). In IMASIS-2, visits and clinical data are connected via date matching. Therefore, for 1 patient attending 2 visits in the same day, both visits are connected to the same data. This amounts to an average score of 98% for uniqueness.</p>
      </sec>
      <sec>
        <title>Consistency</title>
        <p>Consistency by type and by multivariate rules both yielded a score of 100%; all values were in the right format, and no errors in relationships between dates were found. As a third consistency check, we examined whether numerical and date values fell within prespecified ranges and whether categorical variables had values that complied with predefined response options. An average score of 91.21% was obtained for consistency by range, resulting from errors in 3 variables. In particular, 85% of values for height and weight were “0.” Since weight and height values of zero do not have a physical meaning, we hypothesized that these data points were missing data values. Indeed, zero entries are not even permitted in the structured data fields of height and weight. Rather, these zero values were introduced during data extraction from the IMASIS-2 database to indicate missingness, since only numeric values are accepted for height and weight according to the ICHOM Heart Failure data dictionary (summarized in <xref ref-type="table" rid="table1">Table 1</xref>). In addition, a small number of out-of-range data points were identified for height (n=54) and weight (n=20). Further, 16 visit records had arrival dates before January 1, 2006. Across the 3 domains of consistency, this yields an average score of 97.07%.</p>
      </sec>
      <sec>
        <title>Completeness</title>
        <p>Assessing completeness of the dataset by column revealed that all included variables were completely documented, except for date of death, which was only recorded in 37.14% of all patient visits. This incompleteness is valid, though, since date of death is only provided when the patient died during the visit. Excluding this valid incompleteness result, an average score of 100% was obtained for completeness.</p>
      </sec>
      <sec>
        <title>Stability</title>
        <p>Two categories of data items were assessed for temporal variability: medication usage and past medical conditions. As illustrated in <xref rid="figure2" ref-type="fig">Figure 2</xref>, the results showed a gradual increase over time in the recorded usage of different types of medication to treat heart failure, especially of beta blockers and diuretics. Further, we found an abrupt change in the documentation pattern of past medical conditions in 2011, with drastically reduced frequencies of reported past medical conditions (<xref rid="figure3" ref-type="fig">Figure 3</xref>). Of note, only a small number of patient visit records (&#60;10) was available for each month in the first half of 2016, explaining the absent or divergent results.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Percentage of patients with a record of specific drug usage per month, relative to the total number of patient admissions within that month, plotted over time.</p>
          </caption>
          <graphic xlink:href="medinform_v9i8e27842_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Percentage of patients with a record of a specific past medical condition per month, relative to the total number of patient admissions within that month, plotted over time. MI=myocardial infarction.</p>
          </caption>
          <graphic xlink:href="medinform_v9i8e27842_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Correctness</title>
        <p>After performing basic descriptive analyses, results of which are summarized in <xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>, 2 sets of variables were subjected to closer inspection. First, correctness of height and weight values was evaluated based on their bivariate distribution, as shown in <xref rid="figure4" ref-type="fig">Figure 4</xref>. All data points that fall below the main diagonal, implying that the patient’s weight (in kg) is larger than his or her height (in cm), are very unlikely to be true. A subset of these data errors, highlighted by the red circle, were hypothesized to result from value inversion between height and weight recordings. To formally assess implausible height and weight values, we computed the patients’ BMIs. Results showed that 16 patients had a suspiciously low BMI (&#60;10 kg/m<sup>2</sup>), and 180 patients had an implausibly high BMI (&#62;70 kg/m<sup>2</sup>). Hence, a total of 196 probable errors were identified, corresponding to 0.13% of all patient visit records.</p>
        <p>Further, we investigated the temporal order of past medical conditions. Results showed a substantial number of deviations. Specifically, 6.33% of all patient visit records mentioned that the patient did not have a history of atrial fibrillation, while earlier records indicated the patient had previously been diagnosed with atrial fibrillation. Similarly, for history of hypertension, diabetes mellitus, and myocardial infarction, error rates of 12.11%, 6.12%, and 12.11%, respectively, were obtained. These deviations in temporal order were introduced while mapping the IMASIS-2 relational database contents to the ICHOM format, as the latter requires a level of detail that is not explicitly available in the coded data of an EHR. In particular, diagnoses or events already recorded in a previous visit and not mentioned in a subsequent visit are not consistently recorded in EHR systems during routine clinical care, in contrast to data collected for research purposes. It is therefore practically impossible to distinguish true negatives from missing data when extracting data from the EHR. As a result, a substantial proportion of patient history data items that were negative in the dataset actually represent missing data values. Taken together, this amounts to a total score of 93.84% for correctness.</p>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>Bivariate distribution of height and weight values, with the red circle highlighting the data points where height and weight values were hypothesized to have been inverted.</p>
          </caption>
          <graphic xlink:href="medinform_v9i8e27842_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Data Quality Assessment Results and Suggestions for Improvement</title>
        <p>Overall, this pilot assessment revealed high scores on each of the dimensions used to investigate the quality of heart failure patients’ data. Nevertheless, several data quality issues were identified, based on which we propose a set of improvement strategies.</p>
        <p>Regarding consistency, results of our data quality assessment showed that a substantial number of negative values in the dataset — indicating the absence of a particular data item — actually represented missing data. Consequently, some variable distributions seem to be biased. For example, according to the data, only a minority of patients currently smoked or had a past medical condition such as hypertension (see <xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>), which is rather implausible for a population of patients with heart failure. This is an intrinsic issue associated with structured data sources in the framework of EHR databases. That is, when a code is not found in the EHR, it is practically impossible to distinguish whether the code is negative (ie, examination has confirmed the absence of a particular condition) or missing (ie, no examination has taken place, or examination confirmed the presence of a particular condition but is not recorded in a structured format) for a given patient. We are aware that good clinical practice does not mandate the measurement of every data item at each patient visit (eg, disease history), since these items usually are present as additional information in a typical EHR environment. Nevertheless, this differs fundamentally from data collection practices in the context of research activities such as outcomes assessment, for which the ICHOM standard set was originally developed. When performing analytical and research activities, it would therefore be very useful to introduce mechanisms or tools that allow differentiation of data missingness from true negatives and to determine the duration of each condition and disease, regardless of whether they are mentioned in each visit.</p>
        <p>Further, the uniqueness analyses revealed some partially duplicated patient visit records. First, duplications in visit identifiers were found, while clinical data showed different inputs. Data management staff at the Hospital del Mar clarified that this happened whenever different height and weight measurements were registered during a single visit. If a slight difference between values is observed, partial row duplicates are generated when merging data in the final dataset. Second, duplicated rows with different visit identifiers have arisen because of the data organization in IMASIS-2, where some clinical data are connected to visit IDs via date matching. As a result, all clinical data collected during different patient visits on the same day are connected to different visit IDs depending on the department or hospital service where these patients visit even on the same day. To reduce future data quality issues of this kind, we suggest a data reorganization including a 2-level visit structure. First, a more general level would describe a period in which one or different visits occur and is connected to clinical data obtained within this period. Second, a more specific level would then describe every distinct visit together with a corresponding diagnosis and procedure information obtained during the particular visit. This 2-level visit organization would contribute to the elimination of partial replicates, thus positively impacting the uniqueness aspect of data quality. This strategy has been previously adopted by the Observational Medical Outcomes Partnership (OMOP) Common Data Model (CDM) standard [<xref ref-type="bibr" rid="ref37">37</xref>] with the aim of easing mappings from ambiguous visit-connected schemas.</p>
        <p>When analyzing and interpreting completeness, it is essential to take into account the type of information that is registered based on the characteristics of the database. In this case, the database is a hospital-based EHR in which information and variables related to death, such as date of death, are only registered when death occurs during admission. Linking different registries and databases, such as primary care, hospital, and mortality registries, is therefore essential to improve the completeness of this type of information.</p>
        <p>Temporal stability analyses revealed an abrupt change in the documentation pattern of past medical conditions in 2011, with drastically reduced frequencies of reported past medical conditions. For instance, the introduction of a new automated coding system in the emergency department EHR system accompanied an increase in the number of registries and codifications in this department and therefore in the system. Although we assume this evolution in the recording of past medical conditions had a positive impact on direct patient care, decision support and alert algorithms can be impacted by changes in diagnostic coding practice and should therefore be considered. In addition, these changes will affect the reuse of data for research and quality monitoring such as outcomes tracking. In this sense, quality assessment is an essential tool to detect the effects of changes in EHR systems introduced over time, which would contribute to a better understanding of the updates in the content and structure of these types of databases. Finally, regarding the potential impact of changes or upgrades in EHR systems and diagnostic coding practices (eg, due to common changes in the way diseases are coded or the necessity to include new diseases), we recommend preparing carefully for this type of situation.</p>
        <p>In relation to correctness, many data items are often recorded in free text rather than structured data fields, making it difficult to extract this information for research and analysis purposes. We therefore advise to maximally include data items in form format or specific fields or sections in the EHR. In addition, when using form formats, we recommend the use of alarms for avoiding missing values as well as for inputting out-of-range data. Alternatively, natural language processing techniques applied to free-text clinical annotation fields can be used to enrich structured sources.</p>
      </sec>
      <sec>
        <title>Lessons Learned</title>
        <p>The process of assessing the quality of outcomes data obtained during routine clinical care is of great value and allows us the opportunity to learn several relevant aspects in the management and evaluation of clinical information in EHR environments. The most relevant lessons learned were (1) the evaluation requires having considerable knowledge of the EHR (data available, how the data were collected, or who collected them) to fully understand its structure and different staff needs; (2) it is critical that the metrics are feasible, valid, and meaningful for a specific EHR system and its quality evaluation and should be understood and used accordingly; and (3) once the quality of the data is assessed, it is important to monitor it regularly, and the value of an external data quality assessment by an independent organization should be considered. In addition, high-quality data enhance the validity and reliability of study findings, which is essential when considering the use of EHR systems for purposes other than health care, such as research. Finally, it is interesting to consider that EHR models would need to be expanded and redesigned in content and structure, and a data quality assessment can assist in doing these tasks.</p>
      </sec>
      <sec>
        <title>Limitations and Future Directions</title>
        <p>In interpreting the results of this study, some important limitations should be taken into consideration. First, although the selection of a subset of ICHOM outcome variables for the data quality assessment was made in agreement among all the members of the study assessment based on the most likely routinely collected data within their EHR for patients with CHF, it is possible that the use of more variables or other variables could affect the results of the quality assessment. For this reason, whether the data quality results from this pilot assessment are generalizable to the complete ICHOM standard set has yet to be investigated. Similarly, we selected 5 of 9 available data quality dimensions, as these were thought to be most relevant given the nature of the data. It is possible that the use of all 9 dimensions would show a more complete analysis of this type of data and therefore would offer additional recommendations for improvement. Further, data quality assessment was performed on a data extract from the IMASIS-2 dataset after mapping the data items to the ICHOM outcomes format, which might have introduced additional errors. We therefore recommend future studies to examine the data quality of the EHR variables directly, in the hospital’s own response format, or to perform an additional data quality assessment of the mapping procedure.</p>
        <p>In sum, future research would benefit from performing more thorough data quality assessments, across multiple hospitals, to truly examine to what extent hospitals today are able to routinely collect the evidence of their success in achieving good health outcomes. The European Federation of Pharmaceutical Industries and Associations (EFPIA) is currently leading such a project together with i~HD. In particular, the goal of this project is to assess the availability and quality of routinely collected patient data to underpin a future scale-up of value-based care models in which ICHOM outcomes indicators serve as the measures of value delivered by health care provider organizations. For this project, data from patients with heart failure are also being examined, now using the complete set of ICHOM outcomes indicators and performing assessments across 10 European hospitals. The promotion of data quality is essential to advance learning health systems, patient empowerment, and clinical research, and the results of this larger project will provide interesting insights on the generalizability of this pilot project’s findings.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Mapping of data quality dimensions.</p>
        <media xlink:href="medinform_v9i8e27842_app1.docx" xlink:title="DOCX File , 27 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>ICD-9 classification codes used for the evaluation of baseline health status variables.</p>
        <media xlink:href="medinform_v9i8e27842_app2.docx" xlink:title="DOCX File , 13 KB"/>
      </supplementary-material>
      <supplementary-material id="app3">
        <label>Multimedia Appendix 3</label>
        <p>Anatomical Therapeutic Chemical classification system (ATC/DDD) codes of the World Health Organization used to retrieve patients’ medication usage.</p>
        <media xlink:href="medinform_v9i8e27842_app3.docx" xlink:title="DOCX File , 13 KB"/>
      </supplementary-material>
      <supplementary-material id="app4">
        <label>Multimedia Appendix 4</label>
        <p>Results of descriptive analyses.</p>
        <media xlink:href="medinform_v9i8e27842_app4.docx" xlink:title="DOCX File , 14 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AI</term>
          <def>
            <p>artificial intelligence</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">CDM</term>
          <def>
            <p>Common Data Model</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">CHF</term>
          <def>
            <p>congestive heart failure</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">EFPIA</term>
          <def>
            <p>European Federation of Pharmaceutical Industries and Associations</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">EHR</term>
          <def>
            <p>electronic health record</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">EMIF</term>
          <def>
            <p>European Medical Information Framework</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">ICD-9</term>
          <def>
            <p>International Classification of Diseases, Ninth Revision</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">ICHOM</term>
          <def>
            <p>International Consortium for Health Outcomes Measurement</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">i~HD</term>
          <def>
            <p>European Institute for Innovation through Health Data</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">OMOP</term>
          <def>
            <p>Observational Medical Outcomes Partnership</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>MAM and JMRA had support from the Innovative Medicines Initiative Joint Undertaking under EMIF grant agreement no. 115372, resources of which are composed of financial contribution from the European Union’s Seventh Framework Programme (FP7/2007-2013) and EFPIA companies. The funders were not involved in the study design; in the collection, analysis, and interpretation of data; in the writing of the report; or in the decision to submit the article for publication.</p>
    </ack>
    <fn-group>
      <fn fn-type="con">
        <p>MAM and JMRA selected the variables to be included in the analysis and provided the data for analysis. HA performed data quality analyses, interpreted the results, and wrote the manuscript. CS and MDH performed data quality analyses. Baseline data quality assessment scripts in R were provided by CS, MDH, and JMGG. All authors interpreted the results of the data quality analyses, contributed to the writing of the manuscript, performed critical revisions of the manuscript, and approved the final version for publication.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Donabedian</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Evaluating the Quality of Medical Care</article-title>
          <source>The Milbank Memorial Fund Quarterly</source>
          <year>1966</year>
          <month>07</month>
          <volume>44</volume>
          <issue>3</issue>
          <fpage>166</fpage>
          <pub-id pub-id-type="doi">10.2307/3348969</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>O'Connor</surname>
              <given-names>DP</given-names>
            </name>
            <name name-style="western">
              <surname>Brinker</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Challenges in outcome measurement: clinical research perspective</article-title>
          <source>Clin Orthop Relat Res</source>
          <year>2013</year>
          <month>11</month>
          <volume>471</volume>
          <issue>11</issue>
          <fpage>3496</fpage>
          <lpage>503</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/23884806"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s11999-013-3194-1</pub-id>
          <pub-id pub-id-type="medline">23884806</pub-id>
          <pub-id pub-id-type="pmcid">PMC3792254</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Porter</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Teisberg</surname>
              <given-names>EO</given-names>
            </name>
          </person-group>
          <source>Redefining Health Care: Creating Value-Based Competition on Results</source>
          <year>2006</year>
          <publisher-loc>Cambridge, MA</publisher-loc>
          <publisher-name>Harvard Business Review Press</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kelley</surname>
              <given-names>TA</given-names>
            </name>
          </person-group>
          <article-title>International Consortium for Health Outcomes Measurement (ICHOM)</article-title>
          <source>Trials</source>
          <year>2015</year>
          <month>11</month>
          <day>24</day>
          <volume>16</volume>
          <issue>S3</issue>
          <fpage>1</fpage>
          <pub-id pub-id-type="doi">10.1186/1745-6215-16-s3-o4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Botsis</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Hartvigsen</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Secondary Use of EHR: Data Quality Issues and Informatics Opportunities</article-title>
          <source>Summit Transl Bioinform</source>
          <year>2010</year>
          <month>03</month>
          <day>01</day>
          <volume>2010</volume>
          <fpage>1</fpage>
          <lpage>5</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/21347133"/>
          </comment>
          <pub-id pub-id-type="medline">21347133</pub-id>
          <pub-id pub-id-type="pmcid">PMC3041534</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chan</surname>
              <given-names>KS</given-names>
            </name>
            <name name-style="western">
              <surname>Fowles</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Weiner</surname>
              <given-names>JP</given-names>
            </name>
          </person-group>
          <article-title>Review: electronic health records and the reliability and validity of quality measures: a review of the literature</article-title>
          <source>Med Care Res Rev</source>
          <year>2010</year>
          <month>10</month>
          <day>11</day>
          <volume>67</volume>
          <issue>5</issue>
          <fpage>503</fpage>
          <lpage>27</lpage>
          <pub-id pub-id-type="doi">10.1177/1077558709359007</pub-id>
          <pub-id pub-id-type="medline">20150441</pub-id>
          <pub-id pub-id-type="pii">1077558709359007</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Daniel</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Serre</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Orlova</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Bréant</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Paris</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Griffon</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Initializing a hospital-wide data quality program. The AP-HP experience</article-title>
          <source>Comput Methods Programs Biomed</source>
          <year>2019</year>
          <month>11</month>
          <volume>181</volume>
          <fpage>104804</fpage>
          <pub-id pub-id-type="doi">10.1016/j.cmpb.2018.10.016</pub-id>
          <pub-id pub-id-type="medline">30497872</pub-id>
          <pub-id pub-id-type="pii">S0169-2607(18)30624-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Doods</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Botteri</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Dugas</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Fritz</surname>
              <given-names>F</given-names>
            </name>
            <collab>EHR4CR WP7</collab>
          </person-group>
          <article-title>A European inventory of common electronic health record data elements for clinical trial feasibility</article-title>
          <source>Trials</source>
          <year>2014</year>
          <month>01</month>
          <day>10</day>
          <volume>15</volume>
          <fpage>18</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://trialsjournal.biomedcentral.com/articles/10.1186/1745-6215-15-18"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1745-6215-15-18</pub-id>
          <pub-id pub-id-type="medline">24410735</pub-id>
          <pub-id pub-id-type="pii">1745-6215-15-18</pub-id>
          <pub-id pub-id-type="pmcid">PMC3895709</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Weir</surname>
              <given-names>CR</given-names>
            </name>
            <name name-style="western">
              <surname>Hurdle</surname>
              <given-names>JF</given-names>
            </name>
            <name name-style="western">
              <surname>Felgar</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Hoffman</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Roth</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Nebeker</surname>
              <given-names>JR</given-names>
            </name>
          </person-group>
          <article-title>Direct text entry in electronic progress notes. An evaluation of input errors</article-title>
          <source>Methods Inf Med</source>
          <year>2003</year>
          <volume>42</volume>
          <issue>1</issue>
          <fpage>61</fpage>
          <lpage>7</lpage>
          <pub-id pub-id-type="medline">12695797</pub-id>
          <pub-id pub-id-type="pii">03010061</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sáez</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Moner</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>García-De-León-Chocano</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Muñoz-Soler</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>García-De-León-González</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Maldonado</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Boscá</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Tortajada</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Robles</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>García-Gómez</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Alcaraz</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Serrano</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Bernal</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Rodríguez</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bustos</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Esparza</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>A Standardized and Data Quality Assessed Maternal-Child Care Integrated Data Repository for Research and Monitoring of Best Practices: A Pilot Project in Spain</article-title>
          <source>Stud Health Technol Inform</source>
          <year>2017</year>
          <volume>235</volume>
          <fpage>539</fpage>
          <lpage>543</lpage>
          <pub-id pub-id-type="medline">28423851</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hirata</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kang</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ramirez</surname>
              <given-names>GV</given-names>
            </name>
            <name name-style="western">
              <surname>Kimata</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Yamamoto</surname>
              <given-names>LG</given-names>
            </name>
          </person-group>
          <article-title>Pediatric Weight Errors and Resultant Medication Dosing Errors in the Emergency Department</article-title>
          <source>Pediatr Emerg Care</source>
          <year>2019</year>
          <month>09</month>
          <volume>35</volume>
          <issue>9</issue>
          <fpage>637</fpage>
          <lpage>642</lpage>
          <pub-id pub-id-type="doi">10.1097/PEC.0000000000001277</pub-id>
          <pub-id pub-id-type="medline">28976456</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Selbst</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Fein</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Osterhoudt</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Ho</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Medication errors in a pediatric emergency department</article-title>
          <source>Pediatr Emerg Care</source>
          <year>1999</year>
          <month>02</month>
          <volume>15</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>4</lpage>
          <pub-id pub-id-type="doi">10.1097/00006565-199902000-00001</pub-id>
          <pub-id pub-id-type="medline">10069301</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Burns</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Arora</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Okunade</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Beltrame</surname>
              <given-names>JF</given-names>
            </name>
            <name name-style="western">
              <surname>Bernardez-Pereira</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Crespo-Leiro</surname>
              <given-names>MG</given-names>
            </name>
            <name name-style="western">
              <surname>Filippatos</surname>
              <given-names>GS</given-names>
            </name>
            <name name-style="western">
              <surname>Hardman</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hoes</surname>
              <given-names>AW</given-names>
            </name>
            <name name-style="western">
              <surname>Hutchison</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Jessup</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kinsella</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Knapton</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lam</surname>
              <given-names>CS</given-names>
            </name>
            <name name-style="western">
              <surname>Masoudi</surname>
              <given-names>FA</given-names>
            </name>
            <name name-style="western">
              <surname>McIntyre</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Mindham</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Morgan</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Otterspoor</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Parker</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Persson</surname>
              <given-names>HE</given-names>
            </name>
            <name name-style="western">
              <surname>Pinnock</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Reid</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Riley</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Stevenson</surname>
              <given-names>LW</given-names>
            </name>
            <name name-style="western">
              <surname>McDonagh</surname>
              <given-names>TA</given-names>
            </name>
          </person-group>
          <article-title>International Consortium for Health Outcomes Measurement (ICHOM): Standardized Patient-Centered Outcomes Measurement Set for Heart Failure Patients</article-title>
          <source>JACC Heart Fail</source>
          <year>2020</year>
          <month>03</month>
          <volume>8</volume>
          <issue>3</issue>
          <fpage>212</fpage>
          <lpage>222</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2213-1779(19)30797-8"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jchf.2019.09.007</pub-id>
          <pub-id pub-id-type="medline">31838032</pub-id>
          <pub-id pub-id-type="pii">S2213-1779(19)30797-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC7052736</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Weiskopf</surname>
              <given-names>NG</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Methods and dimensions of electronic health record data quality assessment: enabling reuse for clinical research</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2013</year>
          <month>01</month>
          <day>01</day>
          <volume>20</volume>
          <issue>1</issue>
          <fpage>144</fpage>
          <lpage>51</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/22733976"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/amiajnl-2011-000681</pub-id>
          <pub-id pub-id-type="medline">22733976</pub-id>
          <pub-id pub-id-type="pii">amiajnl-2011-000681</pub-id>
          <pub-id pub-id-type="pmcid">PMC3555312</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Savarese</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Lund</surname>
              <given-names>LH</given-names>
            </name>
          </person-group>
          <article-title>Global Public Health Burden of Heart Failure</article-title>
          <source>Card Fail Rev</source>
          <year>2017</year>
          <month>04</month>
          <volume>3</volume>
          <issue>1</issue>
          <fpage>7</fpage>
          <lpage>11</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/28785469"/>
          </comment>
          <pub-id pub-id-type="doi">10.15420/cfr.2016:25:2</pub-id>
          <pub-id pub-id-type="medline">28785469</pub-id>
          <pub-id pub-id-type="pmcid">PMC5494150</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>RY</given-names>
            </name>
            <name name-style="western">
              <surname>Strong</surname>
              <given-names>DM</given-names>
            </name>
          </person-group>
          <article-title>Beyond Accuracy: What Data Quality Means to Data Consumers</article-title>
          <source>Journal of Management Information Systems</source>
          <year>1996</year>
          <volume>12</volume>
          <issue>4</issue>
          <fpage>5</fpage>
          <lpage>33</lpage>
          <pub-id pub-id-type="doi">10.1080/07421222.1996.11518099</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Batini</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Cappiello</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Francalanci</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Maurino</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Methodologies for data quality assessment and improvement</article-title>
          <source>ACM Comput Surv</source>
          <year>2009</year>
          <month>07</month>
          <volume>41</volume>
          <issue>3</issue>
          <fpage>1</fpage>
          <lpage>52</lpage>
          <pub-id pub-id-type="doi">10.1145/1541880.1541883</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>SG</given-names>
            </name>
            <name name-style="western">
              <surname>Speedie</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Simon</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Kumar</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Westra</surname>
              <given-names>BL</given-names>
            </name>
          </person-group>
          <article-title>A Data Quality Ontology for the Secondary Use of EHR Data</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2015</year>
          <volume>2015</volume>
          <fpage>1937</fpage>
          <lpage>46</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/26958293"/>
          </comment>
          <pub-id pub-id-type="medline">26958293</pub-id>
          <pub-id pub-id-type="pmcid">PMC4765682</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kahn</surname>
              <given-names>MG</given-names>
            </name>
            <name name-style="western">
              <surname>Raebel</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Glanz</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Riedlinger</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Steiner</surname>
              <given-names>JF</given-names>
            </name>
          </person-group>
          <article-title>A pragmatic framework for single-site and multisite data quality assessment in electronic health record-based clinical research</article-title>
          <source>Med Care</source>
          <year>2012</year>
          <month>07</month>
          <volume>50 Suppl</volume>
          <fpage>S21</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/22692254"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/MLR.0b013e318257dd67</pub-id>
          <pub-id pub-id-type="medline">22692254</pub-id>
          <pub-id pub-id-type="pii">00005650-201207001-00008</pub-id>
          <pub-id pub-id-type="pmcid">PMC3833692</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liaw</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Rahimi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ray</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Taggart</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dennis</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>de Lusignan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Jalaludin</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Yeo</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Talaei-Khoei</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Towards an ontology for data quality in integrated chronic disease management: a realist review of the literature</article-title>
          <source>Int J Med Inform</source>
          <year>2013</year>
          <month>01</month>
          <volume>82</volume>
          <issue>1</issue>
          <fpage>10</fpage>
          <lpage>24</lpage>
          <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2012.10.001</pub-id>
          <pub-id pub-id-type="medline">23122633</pub-id>
          <pub-id pub-id-type="pii">S1386-5056(12)00193-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kalra</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Stroetmann</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Sundgren</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Dupont</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Schlünder</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Thienpont</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Coorevits</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>De Moor</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>The European Institute for Innovation through Health Data</article-title>
          <source>Learn Health Syst</source>
          <year>2017</year>
          <month>01</month>
          <day>25</day>
          <volume>1</volume>
          <issue>1</issue>
          <fpage>e10008</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1002/lrh2.10008"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/lrh2.10008</pub-id>
          <pub-id pub-id-type="medline">31245550</pub-id>
          <pub-id pub-id-type="pii">LRH210008</pub-id>
          <pub-id pub-id-type="pmcid">PMC6516723</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zozus</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hammond</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Green</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Kahn</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Richesson</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Rusincovitch</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Simon</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Smerek</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <source>Assessing Data Quality for Healthcare Systems Data Used in Clinical Research (Version 1.0)</source>
          <year>2014</year>
          <access-date>2021-07-10</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dcricollab.dcri.duke.edu/sites/NIHKR/KR/Assessing-data-quality_V1%200.pdf">https://dcricollab.dcri.duke.edu/sites/NIHKR/KR/Assessing-data-quality_V1%200.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Davoudi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Dooling</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Glondys</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Kadlec</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Overgaard</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ruben</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Wendicke</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Data Quality Management Model (2015 Update) - Retired</article-title>
          <source>The American Health Information Management Association</source>
          <year>2015</year>
          <access-date>2021-07-10</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://library.ahima.org/PB/DataQualityModel#.XW6r-pNKjab">http://library.ahima.org/PB/DataQualityModel#.XW6r-pNKjab</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sáez</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Martínez-Miranda</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Robles</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>García-Gómez</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>Organizing data quality assessment of shifting biomedical data</article-title>
          <source>Stud Health Technol Inform</source>
          <year>2012</year>
          <volume>180</volume>
          <fpage>721</fpage>
          <lpage>725</lpage>
          <pub-id pub-id-type="medline">22874286</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kahn</surname>
              <given-names>MG</given-names>
            </name>
            <name name-style="western">
              <surname>Callahan</surname>
              <given-names>TJ</given-names>
            </name>
            <name name-style="western">
              <surname>Barnard</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bauck</surname>
              <given-names>AE</given-names>
            </name>
            <name name-style="western">
              <surname>Brown</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Davidson</surname>
              <given-names>BN</given-names>
            </name>
            <name name-style="western">
              <surname>Estiri</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Goerg</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Holve</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>SG</given-names>
            </name>
            <name name-style="western">
              <surname>Liaw</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hamilton-Lopez</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Meeker</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Ong</surname>
              <given-names>TC</given-names>
            </name>
            <name name-style="western">
              <surname>Ryan</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Shang</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Weiskopf</surname>
              <given-names>NG</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zozus</surname>
              <given-names>MN</given-names>
            </name>
            <name name-style="western">
              <surname>Schilling</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>A Harmonized Data Quality Assessment Terminology and Framework for the Secondary Use of Electronic Health Record Data</article-title>
          <source>EGEMS (Wash DC)</source>
          <year>2016</year>
          <month>09</month>
          <day>11</day>
          <volume>4</volume>
          <issue>1</issue>
          <fpage>1244</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/27713905"/>
          </comment>
          <pub-id pub-id-type="doi">10.13063/2327-9214.1244</pub-id>
          <pub-id pub-id-type="medline">27713905</pub-id>
          <pub-id pub-id-type="pii">egems1244</pub-id>
          <pub-id pub-id-type="pmcid">PMC5051581</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bray</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Parkin</surname>
              <given-names>DM</given-names>
            </name>
          </person-group>
          <article-title>Evaluation of data quality in the cancer registry: principles and methods. Part I: comparability, validity and timeliness</article-title>
          <source>Eur J Cancer</source>
          <year>2009</year>
          <month>03</month>
          <volume>45</volume>
          <issue>5</issue>
          <fpage>747</fpage>
          <lpage>755</lpage>
          <pub-id pub-id-type="doi">10.1016/j.ejca.2008.11.032</pub-id>
          <pub-id pub-id-type="medline">19117750</pub-id>
          <pub-id pub-id-type="pii">S0959-8049(08)00920-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sariyar</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Borg</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Heidinger</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Pommerening</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>A practical framework for data management processes and their evaluation in population-based medical registries</article-title>
          <source>Inform Health Soc Care</source>
          <year>2013</year>
          <month>03</month>
          <volume>38</volume>
          <issue>2</issue>
          <fpage>104</fpage>
          <lpage>119</lpage>
          <pub-id pub-id-type="doi">10.3109/17538157.2012.735731</pub-id>
          <pub-id pub-id-type="medline">23323639</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sáez</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zurriaga</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Pérez-Panadés</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Melchor</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Robles</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>García-Gómez</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>Applying probabilistic temporal and multisite data quality control methods to a public health mortality registry in Spain: a systematic approach to quality control of repositories</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2016</year>
          <month>11</month>
          <volume>23</volume>
          <issue>6</issue>
          <fpage>1085</fpage>
          <lpage>1095</lpage>
          <pub-id pub-id-type="doi">10.1093/jamia/ocw010</pub-id>
          <pub-id pub-id-type="medline">27107447</pub-id>
          <pub-id pub-id-type="pii">ocw010</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mitchell</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Loomes</surname>
              <given-names>KM</given-names>
            </name>
            <name name-style="western">
              <surname>Squires</surname>
              <given-names>RH</given-names>
            </name>
            <name name-style="western">
              <surname>Goldberg</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Variability in acceptance of organ offers by pediatric transplant centers and its impact on wait-list mortality</article-title>
          <source>Liver Transpl</source>
          <year>2018</year>
          <month>06</month>
          <day>06</day>
          <volume>24</volume>
          <issue>6</issue>
          <fpage>803</fpage>
          <lpage>809</lpage>
          <pub-id pub-id-type="doi">10.1002/lt.25048</pub-id>
          <pub-id pub-id-type="medline">29506323</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pagani</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Hirsch</surname>
              <given-names>JG</given-names>
            </name>
            <name name-style="western">
              <surname>Pouwels</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Horsfield</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Perego</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Gass</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Roosendaal</surname>
              <given-names>SD</given-names>
            </name>
            <name name-style="western">
              <surname>Barkhof</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Agosta</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Rovaris</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Caputo</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Giorgio</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Palace</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Marino</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>De Stefano</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Ropele</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Fazekas</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Filippi</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Intercenter differences in diffusion tensor MRI acquisition</article-title>
          <source>J Magn Reson Imaging</source>
          <year>2010</year>
          <month>06</month>
          <volume>31</volume>
          <issue>6</issue>
          <fpage>1458</fpage>
          <lpage>1468</lpage>
          <pub-id pub-id-type="doi">10.1002/jmri.22186</pub-id>
          <pub-id pub-id-type="medline">20512899</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sáez</surname>
              <given-names>Carlos</given-names>
            </name>
            <name name-style="western">
              <surname>García-Gómez</surname>
              <given-names>Juan M</given-names>
            </name>
          </person-group>
          <article-title>Kinematics of Big Biomedical Data to characterize temporal variability and seasonality of data repositories: Functional Data Analysis of data temporal evolution over non-parametric statistical manifolds</article-title>
          <source>Int J Med Inform</source>
          <year>2018</year>
          <month>11</month>
          <volume>119</volume>
          <fpage>109</fpage>
          <lpage>124</lpage>
          <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2018.09.015</pub-id>
          <pub-id pub-id-type="medline">30342679</pub-id>
          <pub-id pub-id-type="pii">S1386-5056(18)30563-X</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lovestone</surname>
              <given-names>S</given-names>
            </name>
            <collab>EMIF Consortium</collab>
          </person-group>
          <article-title>The European medical information framework: A novel ecosystem for sharing healthcare data across Europe</article-title>
          <source>Learn Health Syst</source>
          <year>2020</year>
          <month>04</month>
          <volume>4</volume>
          <issue>2</issue>
          <fpage>e10214</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1002/lrh2.10214"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/lrh2.10214</pub-id>
          <pub-id pub-id-type="medline">32313838</pub-id>
          <pub-id pub-id-type="pii">LRH210214</pub-id>
          <pub-id pub-id-type="pmcid">PMC7156868</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Roger</surname>
              <given-names>VL</given-names>
            </name>
          </person-group>
          <article-title>Epidemiology of Heart Failure</article-title>
          <source>Circ Res</source>
          <year>2013</year>
          <month>08</month>
          <day>30</day>
          <volume>113</volume>
          <issue>6</issue>
          <fpage>646</fpage>
          <lpage>659</lpage>
          <pub-id pub-id-type="doi">10.1161/circresaha.113.300268</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="web">
          <article-title>Guidelines for ATC classification and DDD assignment, 2011</article-title>
          <source>WHO Collaborating Centre for Drug Statistics Methodology</source>
          <year>2010</year>
          <access-date>2021-07-10</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.whocc.no/filearchive/publications/2011guidelines.pdf">https://www.whocc.no/filearchive/publications/2011guidelines.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="web">
          <article-title>R: A language and environment for statistical computing</article-title>
          <source>R Foundation for Statistical Computing</source>
          <year>2017</year>
          <access-date>2021-07-10</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.r-project.org">https://www.r-project.org</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sáez</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Gutiérrez-Sacristán</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kohane</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>García-Gómez</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Avillach</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>EHRtemporalVariability: delineating temporal data-set shifts in electronic health records</article-title>
          <source>Gigascience</source>
          <year>2020</year>
          <month>08</month>
          <day>01</day>
          <volume>9</volume>
          <issue>8</issue>
          <fpage>1</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://academic.oup.com/gigascience/article-lookup/doi/10.1093/gigascience/giaa079"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/gigascience/giaa079</pub-id>
          <pub-id pub-id-type="medline">32729900</pub-id>
          <pub-id pub-id-type="pii">5878826</pub-id>
          <pub-id pub-id-type="pmcid">PMC7391413</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="web">
          <article-title>The Book of OHDSI</article-title>
          <source>Observational Health Data Sciences and Informatics</source>
          <year>2021</year>
          <month>01</month>
          <day>11</day>
          <access-date>2021-07-10</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://book.ohdsi.org">http://book.ohdsi.org</ext-link>
          </comment>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
