<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id>
      <journal-title>JMIR Medical Informatics</journal-title>
      <issn pub-type="epub">2291-9694</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v11i1e44547</article-id>
      <article-id pub-id-type="pmid">36884279</article-id>
      <article-id pub-id-type="doi">10.2196/44547</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>An Ontology-Based Approach for Consolidating Patient Data Standardized With European Norm/International Organization for Standardization 13606 (EN/ISO 13606) Into Joint Observational Medical Outcomes Partnership (OMOP) Repositories: Description of a Methodology</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Benis</surname>
            <given-names>Arriel</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Sánchez de Madariaga</surname>
            <given-names>Ricardo</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Azevedo Marques</surname>
            <given-names>Paulo</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Frid</surname>
            <given-names>Santiago</given-names>
          </name>
          <degrees>MSc, MD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <address>
            <institution>Clinical Foundations Department</institution>
            <institution>Universitat de Barcelona</institution>
            <addr-line>Casanova 143</addr-line>
            <addr-line>Barcelona, 08036</addr-line>
            <country>Spain</country>
            <phone>34 934035258</phone>
            <email>santifrid@gmail.com</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8400-5770</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Pastor Duran</surname>
            <given-names>Xavier</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8267-7151</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Bracons Cucó</surname>
            <given-names>Guillem</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-1274-7403</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Pedrera-Jiménez</surname>
            <given-names>Miguel</given-names>
          </name>
          <degrees>MSc, PhD</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0187-3826</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Serrano-Balazote</surname>
            <given-names>Pablo</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2958-6319</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Muñoz Carrero</surname>
            <given-names>Adolfo</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff6" ref-type="aff">6</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0141-7751</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Lozano-Rubí</surname>
            <given-names>Raimundo</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-7912-721X</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Medical Informatics Unit</institution>
        <institution>Hospital Clínic de Barcelona</institution>
        <addr-line>Barcelona</addr-line>
        <country>Spain</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Clinical Foundations Department</institution>
        <institution>Universitat de Barcelona</institution>
        <addr-line>Barcelona</addr-line>
        <country>Spain</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Fundació Clínic per a la Recerca Biomédica</institution>
        <addr-line>Barcelona</addr-line>
        <country>Spain</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Data Science Unit</institution>
        <institution>Hospital 12 de Octubre</institution>
        <addr-line>Madrid</addr-line>
        <country>Spain</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>Direction of Planification</institution>
        <institution>Hospital 12 de Octubre</institution>
        <addr-line>Madrid</addr-line>
        <country>Spain</country>
      </aff>
      <aff id="aff6">
        <label>6</label>
        <institution>Unit of Investigation in Telemedicine and Digital Health</institution>
        <institution>Instituto de Salud Carlos III</institution>
        <addr-line>Madrid</addr-line>
        <country>Spain</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Santiago Frid <email>santifrid@gmail.com</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2023</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>8</day>
        <month>3</month>
        <year>2023</year>
      </pub-date>
      <volume>11</volume>
      <elocation-id>e44547</elocation-id>
      <history>
        <date date-type="received">
          <day>23</day>
          <month>11</month>
          <year>2022</year>
        </date>
        <date date-type="rev-request">
          <day>20</day>
          <month>12</month>
          <year>2022</year>
        </date>
        <date date-type="rev-recd">
          <day>28</day>
          <month>12</month>
          <year>2022</year>
        </date>
        <date date-type="accepted">
          <day>5</day>
          <month>1</month>
          <year>2023</year>
        </date>
      </history>
      <copyright-statement>©Santiago Frid, Xavier Pastor Duran, Guillem Bracons Cucó, Miguel Pedrera-Jiménez, Pablo Serrano-Balazote, Adolfo Muñoz Carrero, Raimundo Lozano-Rubí. Originally published in JMIR Medical Informatics (https://medinform.jmir.org), 08.03.2023.</copyright-statement>
      <copyright-year>2023</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on https://medinform.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://medinform.jmir.org/2023/1/e44547" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>To discover new knowledge from data, they must be correct and in a consistent format. OntoCR, a clinical repository developed at Hospital Clínic de Barcelona, uses ontologies to represent clinical knowledge and map locally defined variables to health information standards and common data models.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>The aim of the study is to design and implement a scalable methodology based on the dual-model paradigm and the use of ontologies to consolidate clinical data from different organizations in a standardized repository for research purposes without loss of meaning.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>First, the relevant clinical variables are defined, and the corresponding European Norm/International Organization for Standardization (EN/ISO) 13606 archetypes are created. Data sources are then identified, and an extract, transform, and load process is carried out. Once the final data set is obtained, the data are transformed to create EN/ISO 13606–normalized electronic health record (EHR) extracts. Afterward, ontologies that represent archetyped concepts and map them to EN/ISO 13606 and Observational Medical Outcomes Partnership Common Data Model (OMOP CDM) standards are created and uploaded to OntoCR. Data stored in the extracts are inserted into its corresponding place in the ontology, thus obtaining instantiated patient data in the ontology-based repository. Finally, data can be extracted via SPARQL queries as OMOP CDM–compliant tables.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Using this methodology, EN/ISO 13606–standardized archetypes that allow for the reuse of clinical information were created, and the knowledge representation of our clinical repository by modeling and mapping ontologies was extended. Furthermore, EN/ISO 13606–compliant EHR extracts of patients (6803), episodes (13,938), diagnosis (190,878), administered medication (222,225), cumulative drug dose (222,225), prescribed medication (351,247), movements between units (47,817), clinical observations (6,736,745), laboratory observations (3,392,873), limitation of life-sustaining treatment (1,298), and procedures (19,861) were created. Since the creation of the application that inserts data from extracts into the ontologies is not yet finished, the queries were tested and the methodology was validated by importing data from a random subset of patients into the ontologies using a locally developed Protégé plugin (“OntoLoad”). In total, 10 OMOP CDM–compliant tables (“Condition_occurrence,” 864 records; “Death,” 110; “Device_exposure,” 56; “Drug_exposure,” 5609; “Measurement,” 2091; “Observation,” 195; “Observation_period,” 897; “Person,” 922; “Visit_detail,” 772; and “Visit_occurrence,” 971) were successfully created and populated.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>This study proposes a methodology for standardizing clinical data, thus allowing its reuse without any changes in the meaning of the modeled concepts. Although this paper focuses on health research, our methodology suggests that the data be initially standardized per EN/ISO 13606 to obtain EHR extracts with a high level of granularity that can be used for any purpose. Ontologies constitute a valuable approach for knowledge representation and standardization of health information in a standard-agnostic manner. With the proposed methodology, institutions can go from local raw data to standardized, semantically interoperable EN/ISO 13606 and OMOP repositories.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>health information interoperability</kwd>
        <kwd>health research</kwd>
        <kwd>health information standards</kwd>
        <kwd>dual model</kwd>
        <kwd>secondary use of health data</kwd>
        <kwd>Observational Medical Outcomes Partnership Common Data Model</kwd>
        <kwd>European Norm/International Organization for Standardization 13606</kwd>
        <kwd>health records</kwd>
        <kwd>ontologies</kwd>
        <kwd>clinical data</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>The term primary use of health data encompasses the generation and use of data within the context of individual health care in hospitals and physicians’ offices to serve direct care needs [<xref ref-type="bibr" rid="ref1">1</xref>]. The term secondary use of health data is defined by the American Medical Informatics Association as “non-direct care use of PHI [personal health information] including but not limited to analysis, research, quality/safety measurement, public health, payment, provider certification or accreditation, and marketing and other business including strictly commercial activities” [<xref ref-type="bibr" rid="ref2">2</xref>]. Although they can be further categorized [<xref ref-type="bibr" rid="ref3">3</xref>], one of the main types of secondary uses is research.</p>
      <p>Clinical data sharing for research is highly relevant from a scientific, economic, and ethical perspective [<xref ref-type="bibr" rid="ref4">4</xref>]. The overwhelming increment in the volume of available data is directly related with the emergence of a new paradigm of scientific methodology in which massive amounts of data are processed and analyzed for obtaining knowledge through machine learning and data mining algorithms [<xref ref-type="bibr" rid="ref5">5</xref>].</p>
      <p>Despite the growth of big data technologies and the use of artificial intelligence, in order to discover new knowledge from data, they must be correct and in a consistent format, which requires a great amount of resources for cleaning, binding, and organizing them. The semantics of data is a key component regarding the aforementioned challenges. To use the electronic health record (EHR) data for different projects, it must maintain its semantics and context, independently of any particular use case. This is especially important in research, where EHR reuse processes are often based on black boxes on which the final data customer is unaware of how the data uploaded to their research database were recorded, extracted, and transformed [<xref ref-type="bibr" rid="ref6">6</xref>].</p>
      <p>A common health information standard should be used in both primary and secondary use to share clinical information in a way that it can be unequivocally interpreted, both syntactically and semantically, by 2 or more systems. European Norm/International Organization for Standardization (EN/ISO) 13606 is a health information standard that seeks to define a rigorous and stable architecture for communicating the health records of a single patient, preserving the original clinical meaning. It is based on a dual model that includes a reference model (RM; with the necessary components and their constraints to represent EHR extracts) and an archetype model (AM; for the formalization of clinical-domain concepts according to the RM) [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref8">8</xref>]. Archetypes allow the formal representation of the structure of clinical information and its meaning (through terminology binding) so that it is automatically processable by information systems.</p>
      <p>Furthermore, the EN/ISO 13940 norm [<xref ref-type="bibr" rid="ref9">9</xref>] provides a conceptual framework centered in the clinical process. This norm, based on a clinical perspective, defines the system of concepts that are necessary for achieving continuity in the caregiving process, including both the content and the context of the health activities. This ample norm defines the concepts relative to health care actors, health problems, sanitary activities, health care processes, sanitary planification, time-related concepts, responsibilities, and information management.</p>
      <p>Moreover, the Observational Medical Outcomes Partnership Common Data Model (OMOP CDM) defines a common format (data model), as well as a common representation (terminologies, vocabularies, and coding schemes), to allow systematic analyses of disparate observational databases using a library of standard analytic routines that have been written based on the common format [<xref ref-type="bibr" rid="ref10">10</xref>]. The OMOP CDM is considered by several authors as the most adequate data model for sharing data in EHR-based longitudinal studies [<xref ref-type="bibr" rid="ref11">11</xref>-<xref ref-type="bibr" rid="ref13">13</xref>].</p>
      <p>This paper describes the work carried out between Hospital Clínic de Barcelona (HCB), Hospital 12 de Octubre (H12O), and Instituto de Salud Carlos III (ISCIII), which seeks to consolidate clinical data of hospitalized patients with COVID-19 from different hospitals in joint repositories, structured with EN/ISO 13606 and then normalized according to the OMOP CDM.</p>
      <p>The aim of this study is to design and implement a scalable methodology based on the dual-model paradigm and the use of ontologies to consolidate clinical data from different organizations in a standardized repository for research purposes without loss of meaning. This implies a series of particular objectives such as (1) to define a set of relevant clinical and biochemical variables of patients hospitalized with COVID-19, (2) to model a set of standardized archetypes based on EN/ISO 13606 to communicate such information, (3) to conceptually represent those clinical variables by means of ontologies, (4) to generate EN/ISO 13606–standardized EHR extracts of COVID-19 patients, and (5) to map and transform the source data to create OMOP CDM–compliant tables.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Ethical Considerations</title>
        <p>
              This study was approved by the Hospital Clínic de Barcelona Ethics Committee for Investigation with Drugs (HCB/2018/0573).
          </p>
      </sec>
      <sec>
        <title>Cohort Inclusion Criteria</title>
        <p>We included in this project patients with COVID-19 admitted to the emergency room (ER) or hospitalized between February 17, 2020 (beginning of the first wave in Spain), and February 15, 2022 (end of the sixth wave in Spain).</p>
      </sec>
      <sec>
        <title>Methodology</title>
        <p>The following methodology comprises a series of steps in order to achieve the study’s objectives.</p>
        <sec>
          <title>Step 1: Definition of Clinical Variables, Data Structures, and EN/ISO 13606 Archetypes</title>
          <p>The first step consists in deciding the clinically relevant variables that should be included. Afterward, the data structures must be defined, including the fields, their descriptions, and the standardized terminologies and classifications to be used.</p>
          <p>Since OMOP CDM is intended for secondary use of data (specifically, for biomedical research), its granularity is somewhat reduced when compared to raw data captured in hospitals. For this reason, the Medical Informatics Unit (MIU) at HCB decided to first standardize the data according to EN/ISO 13606, in order to have semantically interoperable EHR extracts with the maximum level of detail.</p>
          <p>Therefore, the MIU at HCB and the Data Science Unit at H12O defined the EN/ISO 13606 archetypes to be used, modeled with the software LinkEHR [<xref ref-type="bibr" rid="ref14">14</xref>] created by VeraTech for Health. The data types used are those established by the standard’s RM.</p>
          <p>This RM has multiple components, including the entry (a result of 1 clinical action, 1 observation, 1 clinical interpretation, or 1 intention) and its elements (the leaf node of the EHR hierarchy, containing a single data value). In our project, the archetypes modeled at the entry level of the RM were the following: diagnosis, episodes, limitation of life-sustaining treatment, administered medication, cumulative drug dose, prescribed medication, movements between units, clinical observations, laboratory observations, patients, health problems, and procedures. These archetypes were registered under a Creative Commons license (ID 2204210968527), so that any user who follows the license terms can share and adapt them [<xref ref-type="bibr" rid="ref15">15</xref>]. <xref rid="figure1" ref-type="fig">Figure 1</xref> shows a mind map of the diagnosis entry archetype as an example.</p>
          <fig id="figure1" position="float">
            <label>Figure 1</label>
            <caption>
              <p>Mind map of the EN/ISO 13606 “diagnosis” archetype in Spanish, modeled with LinkEHR. The “diagnosis” entry has 6 elements: episode_id, diagnosis, diagnosis_datetime, patient_id, diagnosis_id, and source. Each of them has its corresponding data type. EN/ISO: European Norm/International Organization for Standardization.</p>
            </caption>
            <graphic xlink:href="medinform_v11i1e44547_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Step 2: Identification of Data Sources and Extract, Transform, and Load</title>
          <p>Afterward, the corresponding data sources must be identified, in order to carry out the extract, transform, and load (ETL) process. In our case, these sources were (1) structured data from HCB’s health information system (HIS), SAP; (2) unstructured data from HCB’s HIS. A collaborative work with Barcelona Supercomputing Center (BSC) allows for the recognition of clinical entities through natural language processing and its extraction as normalized structured data; (3) outpatient setting structured data from Agència de Qualitat i Avaluació Sanitàries de Catalunya.</p>
          <p>Since the last 2 sources come from separate projects whose description is besides the objective of this paper, we will focus on the first one. Archetypes created in the previous step were used as templates for identifying data in the aforementioned sources. Periodic meetings were held with the Information Technology Department at HCB to identify the location of the data and the transformations needed to obtain the structured data defined in the previous step. Once this was achieved, the tables were loaded into a MySQL database hosted on a dedicated server of the MIU.</p>
        </sec>
        <sec>
          <title>Step 3: Creation of EN/ISO 13606 EHR Extracts From Source Data</title>
          <p>Once the final data set is obtained, data must be transformed to create EHR extracts normalized according to EN/ISO 13606. This transformation includes mapping of local variables to standardized nomenclatures and classifications (Systematized Nomenclature of Medicine—Clinical Terms (SNOMED CT), International Classification of Diseases 10—Clinical Modification (ICD-10-CM), Logical Observation Identifiers Names and Codes (LOINC)), assigning readable descriptions to local codes, and categorizing certain concepts (eg, grouping hospital units according to the level of care).</p>
          <p>This process is performed by mapping archetypes to the implicated information systems, without the need to modify them. This approach allows the automation of data extraction and the reuse of this methodology for other use cases with very little effort, which constitutes one of the great advantages of dual-model strategies.</p>
          <p>In our case, we carried out this process with the help of VeraTech for Health, our technical partners, using LinkEHR, thus creating extracts on our dedicated server and constituting an EN/ISO 13606 standardized clinical repository. <xref rid="figure2" ref-type="fig">Figure 2</xref> shows a test example of an EN/ISO 13606 EHR extract (without real-patient data). In this extract, the ICD-10-CM code H40.9 (unspecified glaucoma) is being communicated, alongside its date and time of record and the ID of the clinical episode it pertains to.</p>
          <fig id="figure2" position="float">
            <label>Figure 2</label>
            <caption>
              <p>Anonymized, normalized EN/ISO 13606 EHR extract of diagnosis in Spanish. EHR: electronic health record; EN/ISO: European Norm/International Organization for Standardization.</p>
            </caption>
            <graphic xlink:href="medinform_v11i1e44547_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Step 4: Creation of Ontologies</title>
          <p>Traditionally, clinical concepts and the relationships between them have been poorly developed in HISs. The MIU at HCB developed OntoCR, an ontology-based clinical repository, conforming to EN/ISO 13606 standard [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref17">17</xref>]. The use of ontologies allows for the definition of a conceptual architecture centered on the representation of the clinical process, while the use of EN/ISO 13606 allows syntactic and semantic interoperability between systems. EN/ISO 13940 was also used to define the generic concepts needed to achieve continuity of care, representing both the content and the context of the health care services.</p>
          <p>One of the main advantages of ontologies is their flexibility to perform changes with minimum use of resources, adapting to an ever-changing environment. Likewise, ontologies allow the addition of conceptual layers, thus mapping locally defined concepts to health information standards, facilitating the communication of information without loss of meaning.</p>
          <p>A relational database (OWL-DB) is used for storing ontologies and instantiated data, designed according to the Web Ontology Language (OWL) specification [<xref ref-type="bibr" rid="ref18">18</xref>]. The ontologies in this project were created using Protégé, a free, open-source ontology editor created by Stanford University that fully supports OWL and Resource Description Framework (RDF) specifications from the World Wide Web Consortium [<xref ref-type="bibr" rid="ref19">19</xref>]. A plug-in developed by our team, the OWL-DB plugin, connects Protégé with the OWL-DB module at the storage level.</p>
          <p>These ontologies were conceptualized in 3 different layers. The first one describes the concepts modeled in the archetypes, with the classes and properties that describe the data structure defined in the first phase. Data types according to the EN/ISO 13606 RM were used.</p>
          <p>In the next layer, we used a locally created ontology that reproduces the EN/ISO 13606 RM and AM. By creating an additional ontology that maps the archetypal concepts to the EN/ISO 13606 model, we structured our data according to the standard. In this layer, each entry-level archetype is represented in a separate ontology.</p>
          <p>As with EN/ISO 13606, we created an ontology that models the OMOP CDM and afterward mapped archetypal concepts to the corresponding meta-class of the standard. So, the third layer consists of ontologies for each archetype that reproduce concepts according to the OMOP CDM structure. <xref rid="figure3" ref-type="fig">Figure 3</xref> shows these 3 ontologies. The left image (ontology of the AM of diagnosis) depicts the class “Diagnosis” with its properties diagnosis, diagnosis_id, episode, diagnosis_datetime, source, and patient_id. In the upper-right image, a new ontology was created where the class “Diagnosis” was modeled as a subclass of “iso13606: Entry,” thus inheriting its properties defined in the RM. Finally, in the lower right image, a third ontology maps the property diagnosis with OMOP CDM’s metaclass “condition_source_value.”</p>
          <fig id="figure3" position="float">
            <label>Figure 3</label>
            <caption>
              <p>Ontologies of the archetype model of diagnosis (left) and its mapping to the EN/ISO 13606 structure (upper right) and the OMOP CDM (lower right) in Spanish, edited with Protégé software. EN/ISO: European Norm/International Organization for Standardization; OMOP CDM: Observational Medical Outcomes Partnership Common Data Model.</p>
            </caption>
            <graphic xlink:href="medinform_v11i1e44547_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
          <p>Afterward, these ontologies must be loaded into a production environment of OntoCR so as to generate the structure that can receive instantiated data of patients and store it.</p>
        </sec>
        <sec>
          <title>Step 5: Integration of EN/ISO 13606 Extracts Into the Ontology-Based Clinical Repository and Extraction of Data as OMOP CDM–Compliant Tables</title>
          <p>Once the ontological structure is ready to receive the data, the EHR extracts must be inserted into the repository, thus incorporating the normalized, instantiated data. We initially explored the possibility of adapting a preexisting application programming interface (API) that was used for the same purpose in a previous project. However, the resources needed for its adaptation were significantly elevated, and its scalability reduced. Therefore, we decided to work on an application that identifies each archetype node within the extract and inserts it into its counterpart in the OWL file. This is facilitated by the representation in the ontologies of each archetype, their nodes, and the data types used (compliant with EN/ISO 13606).</p>
          <p>Finally, data stored in the ontology-based clinical repository needs to be extracted through SPARQL queries, a language used for graph databases. Since archetypal concepts have been previously mapped to the OMOP CDM, by performing these queries, the extraction process is simplified. If there are cases in which data needs to be transformed to fit the CDM, such transformations can be included in the queries or carried out via SQL queries once relational tables are obtained.</p>
          <p>In <xref rid="figure4" ref-type="fig">Figure 4</xref>, a SPARQL query for extracting data for the OMOP CDM PERSON table is shown. Attributes that are not present in the ontological repository must still be included in the SELECT clause so as to create the corresponding table column without any instantiated data. Since EN/ISO 13606 data types were used in the extracts and modeled in the ontologies, they were also represented in the queries (see the lower lines of SPARQL code).</p>
          <fig id="figure4" position="float">
            <label>Figure 4</label>
            <caption>
              <p>SPARQL query for the “Person” table of the OMOP CDM. OMOP CDM: Observational Medical Outcomes Partnership Common Data Model.</p>
            </caption>
            <graphic xlink:href="medinform_v11i1e44547_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
          <p>Data anonymization is performed by the IT department at this level using an institutional software solution. This way, EN/ISO 13606 extracts contain identified data that can be used for primary uses, while OMOP CDM tables are anonymized for secondary uses.</p>
          <p>Once obtained, the anonymized data can be consolidated in a joint OMOP CDM repository with other institutions that use the same standard (in our case, H12O). OMOP CDM has a large number of tables, divided into 6 groups: standardized clinical data, standardized health system data, standardized derived elements, standardized health economics, standardized metadata, and standardized vocabularies. Our OMOP CDM repository contains the following tables, which are part of the standardized clinical data: “Condition_occurrence,” “Death,” “Device_exposure,” “Drug_exposure,” “Measurement,” “Observation,” “Observation_period,” “Person,” “Visit_detail,” and “Visit_occurrence.”</p>
          <p><xref rid="figure5" ref-type="fig">Figure 5</xref> shows an overview of the whole process. The knowledge modeling starts with the creation of EN/ISO 13606 archetypes based on clinical concepts, which are then represented in ontologies that map them to EN/ISO 13606 RM and OMOP CDM. These ontologies are uploaded to OntoCR without instantiated patient data yet.</p>
          <fig id="figure5" position="float">
            <label>Figure 5</label>
            <caption>
              <p>General overview of the process. Red arrows indicate data flow, while blue arrows indicate knowledge-related processes. Numbers indicate the deliverables within each step. EHR: electronic health record; EN/ISO: European Norm/International Organization for Standardization; ETL: extract, transform, and load; H12O: Hospital 12 de Octubre; HCB: Hospital Clínic de Barcelona; OMOP: Observational Medical Outcomes Partnership.</p>
            </caption>
            <graphic xlink:href="medinform_v11i1e44547_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
          <p>The data-related processes begin with the archetype-based extraction of raw data from our local system into a MySQL database and its transformation to create EN/ISO EHR extracts, which are then inserted into OntoCR via an application specifically developed for this project. SPARQL queries are performed against this ontological repository to obtain an OMOP CDM repository that is consolidated with H12O in a joint one.</p>
        </sec>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Methodology</title>
        <p>The main deliverable of this project is the methodology described in the previous section. By following the aforementioned steps, any health care institution can go from local raw data to standardized, semantically interoperable EN/ISO 13606 and OMOP repositories. This methodology also led to the creation of 12 EN/ISO 13606-standardized archetypes that model important clinical variables in the ER and hospitalization settings, allowing the reuse of clinical information by using it in accordance with the Creative Commons terms.</p>
      </sec>
      <sec>
        <title>Ontologies</title>
        <p>Another interesting result of this study is the development of the ontologies that represent OMOP CDM, as well as their mappings to EN/ISO 13606 AM and RM. This process was carried out by members of the MIU at HCB after carefully reading the pertinent documentation of these standards and designing the optimal way of using them to represent clinical concepts.</p>
        <p>Furthermore, representing clinical variables by means of ontologies is another way of reusing clinical information. With the creation of new ontologies for each project at HCB, where we have developed the ontology-based clinical repository OntoCR, we continue to extend our clinical knowledge representation.</p>
      </sec>
      <sec>
        <title>EN/ISO 13606 Extracts</title>
        <p><xref ref-type="table" rid="table1">Table 1</xref> shows the correspondence between EHR archetypes, OMOP CDM tables, number of extracts created throughout the study, and the number of COVID-19 patients they pertain to. We have included the diagnoses recorded in the episodes of the study period as well as the historical ones. Health problem entries are part of the aforementioned project with BSC to extract clinical entities from unstructured texts through natural language processing, so they will not be included in this table.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Correspondence between EHR<sup>a</sup> archetypes, OMOP CDM<sup>b</sup> tables, number of extracts created throughout the study, and the number of patients they pertain to.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="310"/>
            <col width="270"/>
            <col width="240"/>
            <col width="180"/>
            <thead>
              <tr valign="bottom">
                <td>EHR archetype</td>
                <td>OMOP CDM table</td>
                <td>EN/ISO<sup>c</sup> 13606 extracts, n</td>
                <td>Patients, n</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Patient</td>
                <td>“Person”</td>
                <td>6803</td>
                <td>6803</td>
              </tr>
              <tr valign="top">
                <td>Episode</td>
                <td>“Visit_occurence”</td>
                <td>13,938</td>
                <td>6791</td>
              </tr>
              <tr valign="top">
                <td>Diagnosis</td>
                <td>“Condition_occurrence”</td>
                <td>190,878</td>
                <td>6799</td>
              </tr>
              <tr valign="top">
                <td>Cumulative drug dose</td>
                <td>“Drug_exposure”</td>
                <td>262,770</td>
                <td>5630</td>
              </tr>
              <tr valign="top">
                <td>Administered medication</td>
                <td>“Drug_exposure”</td>
                <td>262,770</td>
                <td>5630</td>
              </tr>
              <tr valign="top">
                <td>Prescribed medication</td>
                <td>“Drug_exposure”</td>
                <td>341,986</td>
                <td>5639</td>
              </tr>
              <tr valign="top">
                <td>Movements between units</td>
                <td>“Visit_detail”</td>
                <td>47,817</td>
                <td>6791</td>
              </tr>
              <tr valign="top">
                <td>Clinical observation</td>
                <td>“Measurement”</td>
                <td>6,736,745</td>
                <td>5973</td>
              </tr>
              <tr valign="top">
                <td>Laboratory observation</td>
                <td>“Measurement”</td>
                <td>3,392,873</td>
                <td>6001</td>
              </tr>
              <tr valign="top">
                <td>Limitation of life-sustaining treatment</td>
                <td>“Observation”</td>
                <td>1298</td>
                <td>1142</td>
              </tr>
              <tr valign="top">
                <td>Procedure</td>
                <td>“Procedure_occurrence”</td>
                <td>19,861</td>
                <td>4994</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>EHR: electronic health record.</p>
            </fn>
            <fn id="table1fn2">
              <p><sup>b</sup>OMOP CDM: Observational Medical Outcomes Partnership Common Data Model.</p>
            </fn>
            <fn id="table1fn3">
              <p><sup>c</sup>EN/ISO: European Norm/International Organization for Standardization.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>OMOP CDM–Compliant Clinical Tables</title>
        <p>We still do not have the final number of records in our OMOP tables, since the initial approach of adapting the preexisting API had to be replaced by the creation of the application that inserts data from the extracts into the ontologies. However, an OMOP database for a random small subset of patients was successfully created to test the queries and validate the methodology. This was performed using a locally developed Protégé plugin (“OntoLoad”) that imports a set of data from a relational database into the ontologies [<xref ref-type="bibr" rid="ref17">17</xref>]. <xref ref-type="table" rid="table2">Table 2</xref> describes the OMOP tables that were created.</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>OMOP CDM<sup>a</sup>-compliant clinical tables created for a random small subset of patients.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="380"/>
            <col width="290"/>
            <col width="330"/>
            <thead>
              <tr valign="top">
                <td>OMOP CDM table</td>
                <td>Patients, n</td>
                <td>Records, n</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>“Condition occurrence”</td>
                <td>121</td>
                <td>864</td>
              </tr>
              <tr valign="top">
                <td>“Death”</td>
                <td>110</td>
                <td>110</td>
              </tr>
              <tr valign="top">
                <td>“Device_exposure”</td>
                <td>3</td>
                <td>56</td>
              </tr>
              <tr valign="top">
                <td>“Drug_exposure”</td>
                <td>106</td>
                <td>5609</td>
              </tr>
              <tr valign="top">
                <td>“Measurement”</td>
                <td>3</td>
                <td>2091</td>
              </tr>
              <tr valign="top">
                <td>“Observation”</td>
                <td>3</td>
                <td>195</td>
              </tr>
              <tr valign="top">
                <td>“Observation_period”</td>
                <td>897</td>
                <td>897</td>
              </tr>
              <tr valign="top">
                <td>“Person”</td>
                <td>922</td>
                <td>922</td>
              </tr>
              <tr valign="top">
                <td>“Visit_detail”</td>
                <td>250</td>
                <td>772</td>
              </tr>
              <tr valign="top">
                <td>“Visit_occurrence”</td>
                <td>897</td>
                <td>971</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>OMOP CDM: Observational Medical Outcomes Partnership Common Data Model.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Results</title>
        <p>This study proposes a methodology for standardizing clinical data, thus allowing its reuse without any change in the meaning of the modeled concepts. Although the focus of this paper is health research, our methodology suggests that the data be initially standardized according to EN/ISO 13606 to obtain EHR extracts with a high level of granularity that can be used for any purpose, as previous studies have suggested [<xref ref-type="bibr" rid="ref20">20</xref>]. Afterward, its transformation to OMOP CDM–compliant tables allows its consolidation in joint repositories for research purposes.</p>
        <p>Although EN/ISO 13606 was chosen because of the operational mechanisms it offers for data exchange, due to the flexibility and standard-agnostic nature of our methodology, there is complete independence regarding any specific standard. Thus, by modeling ontologies of other standards and mapping them to local variables, we may, for example, carry out transformations between EN/ISO 13606, OpenEHR [<xref ref-type="bibr" rid="ref21">21</xref>], Fast Healthcare Interoperability Resources (FHIR) [<xref ref-type="bibr" rid="ref22">22</xref>], OMOP CDM, and Informatics for Integrating Biology and the Bedside (i2b2) [<xref ref-type="bibr" rid="ref23">23</xref>] with the minimum use of resources and without the need for changes in the database structure. Health information standards such as EN/ISO 13606 and OpenEHR allow the modeling and formalization of clinical knowledge through their RMs and archetypes [<xref ref-type="bibr" rid="ref24">24</xref>], and ontologies are precisely a tool for carrying out such tasks. This is what makes them ideal in the context of an implementation of a dual-model strategy, allowing the representation of concepts in the health domain, its standardization, and the storage of instantiated patient data.</p>
        <p>Furthermore, ontologies provide several advantages for the conceptualization of entities in a domain. It explicitly represents domain knowledge, allows the application of inference processes, enables the reuse of domain knowledge, allows data aggregation, and detects new associations between concepts [<xref ref-type="bibr" rid="ref17">17</xref>].</p>
        <p>It is clear for us that loading normalized data onto clinical repositories (instead of ad hoc data loading) provides many benefits. It is possible to reuse the same interoperability standards used in health care, adapting them to this new paradigm [<xref ref-type="bibr" rid="ref25">25</xref>]. This approach allows the availability of clinical data for further single- or multicenter research.</p>
        <p>We would like to highlight the vital importance of continuous collaborative research. This study is framed within a continued line of research since 2009 between HCB, ISCIII, and H12O. In this line of collaborative research, a standardized and transparent process has been designed and implemented for obtaining standardized data models for research from EHR raw data. Hence, in the first stage, the basis for a semantically interoperable clinical information management system based on EN/ISO 13606 was defined, proving that clinical information residing in heterogeneous systems could be normalized, combined, and communicated without loss of meaning. In the second stage, a common information model that reflects the clinical process and the relationships between the clinical records components was developed. In the third stage, a normalized information model based on EN/ISO 13606 archetypes was implemented and applied to local information systems for specific clinical use cases. With this model, it is possible to construct and order information recovered from these complex systems for the exchange of integral health and social information of patients and to use it for secondary purposes.</p>
      </sec>
      <sec>
        <title>Comparison With Prior Work</title>
        <p>Many of the requisites of clinical data repositories for primary use are common to those for secondary use, such as normalized clinical information models, controlled terminologies, identification of actors, and contextual information. Developments carried out for primary use repositories are also profitable for secondary uses, and the progresses derived from secondary uses accelerate the advances in shared clinical records. A lot of work has been reported in this field throughout the globe in the last years, which has led to developing policies, repository models and its application in the form of competitive projects [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref27">27</xref>].</p>
        <p>It is very usual for researchers to resort to the generation of their own data for research and its manual introduction into data management systems. It is also quite common for them to use general purpose tools, particularly spreadsheets, as data management systems [<xref ref-type="bibr" rid="ref28">28</xref>], while there is perception of a high need of additional support for the analysis of high volumes of data. This represents a significant problem, since these applications cannot guarantee the consistency of data, and they present difficulties for sharing and consolidating data and a limited capability of data exploitation.</p>
        <p>Different methodologies have been proposed to create OMOP repositories from raw data. Some approaches are based on a simple mapping of local variables to their OMOP CDM counterparts, an alignment of vocabularies using the Athena tool provided by OHDSI and an ETL process through SQL scripts [<xref ref-type="bibr" rid="ref29">29</xref>]. Other authors have proposed transforming source data to RDF, carrying out a semantic mapping (in some cases, using an ontological representation of OMOP CDM), and loading it to a data store [<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref31">31</xref>].</p>
        <p>Likewise, other standard-agnostic approaches have been reported in the literature. The ongoing INFOBANCO project of the Madrid Region [<xref ref-type="bibr" rid="ref32">32</xref>] seeks to create a platform for the management, persistence, exchange, and reuse of health data focused on applying each health information standard for the purpose it was intended to, offering multiple interoperability and exploitation services suited for specific use cases [<xref ref-type="bibr" rid="ref24">24</xref>]. Furthermore, the 3-pillar strategy of the Swiss Personalized Health Network [<xref ref-type="bibr" rid="ref33">33</xref>] pursues a semantically interoperable clinical data landscape based on a multidimensional encoding of concepts, an RDF-based storage and transport of the instances of these concepts and a conversion of RDF to any target data model.</p>
      </sec>
      <sec>
        <title>Strengths and Limitations</title>
        <p>This study has many strengths that are worth mentioning. On the one hand, it describes a real-world collaborative effort between 3 health care institutions in Spain to model, share, and consolidate standardized patient data. Furthermore, the standard-agnostic nature of the proposed methodology leads to a significant scalability, allowing transformation between different health information standards and common data models. The software used in our methodology (LinkEHR, Protégé, and Liferay) either have a free version or are open source, which make them accessible to low-income areas and institutions with limited funding for interoperability projects.</p>
        <p>We must also mention the limitations of this study. First of all, the ontology-based clinical repository used in our institution was developed throughout many years, and it might not be a suitable approach for institutions that seek a rapid implementation of a methodology. This can limit the external validity of the study. Moreover, since the tool to insert data from standardized extracts into the ontologies is not ready yet, we still have not completed the creation of OMOP CDM tables. However, an OMOP CDM database for a small subset of patients was successfully created to test the queries and validate the methodology.</p>
      </sec>
      <sec>
        <title>Next Steps</title>
        <p>The MIU team at HCB is working on creating the ontological representation of different health information standards (FHIR and OpenEHR) and CDMs (i2b2, International Cancer Genome Consortium Accelerating Research in Genomic Oncology (ICGC Argo) [<xref ref-type="bibr" rid="ref34">34</xref>], and Clinical Data Interchange Standards Consortium (CDISC) [<xref ref-type="bibr" rid="ref35">35</xref>]). This will extend the current metamodel and allow us to carry out multistandard transformations, which will also help us compare the performance of such standards for different scenarios.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>Semantic interoperability plays a very important role within HISs, providing meaning and clinical context to the clinical information and allowing for better clinical decision-making and research. This study has demonstrated that ontologies constitute a valuable approach for knowledge representation and standardization of health information in a standard-agnostic manner. With the proposed methodology, institutions can go from local raw data to standardized, semantically interoperable EN/ISO 13606 and OMOP repositories.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group/>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AM</term>
          <def>
            <p>archetype model</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">API</term>
          <def>
            <p>application programming interface</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">BSC</term>
          <def>
            <p>Barcelona Supercomputing Center</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">CDISC</term>
          <def>
            <p>Clinical Data Interchange Standards Consortium</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">EHR</term>
          <def>
            <p>electronic health record</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">EN/ISO 13606</term>
          <def>
            <p>European Norm/International Organization for Standardization</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">ER</term>
          <def>
            <p>emergency room</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">ETL</term>
          <def>
            <p>extract, transform, and load</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">FHIR</term>
          <def>
            <p>Fast Healthcare Interoperability Resources</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">H12O</term>
          <def>
            <p>Hospital 12 de Octubre</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">HCB</term>
          <def>
            <p>Hospital Clínic de Barcelona</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb12">HIS</term>
          <def>
            <p>health information system</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb13">i2b2</term>
          <def>
            <p>Informatics for Integrating Biology and the Bedside</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb14">ICD-10-CM</term>
          <def>
            <p>International Classification of Diseases 10—Clinical Modification</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb15">ICGC Argo</term>
          <def>
            <p>International Cancer Genome Consortium Accelerating Research in Genomic Oncology</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb16">ISCIII</term>
          <def>
            <p>Instituto de Salud Carlos III</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb17">LOINC</term>
          <def>
            <p>Logical Observation Identifiers Names and Codes</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb18">MIU</term>
          <def>
            <p>Medical Informatics Unit</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb19">OMOP CDM</term>
          <def>
            <p>Observational Medical Outcomes Partnership Common Data Model</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb20">OWL</term>
          <def>
            <p>Web Ontology Language</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb21">OWL-DB</term>
          <def>
            <p>Web Ontology Language database</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb22">RDF</term>
          <def>
            <p>Resource Description Framework</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb23">RM</term>
          <def>
            <p>reference model</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb24">SNOMED CT</term>
          <def>
            <p>Systematized Nomenclature of Medicine—Clinical Terms</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This study is also framed within the Spanish Secretary of State for Telecommunications and Digital Infrastructure’s “Plan de Impulso de las Tecnologías del Lenguaje” (Plan TL). We would like to thank the Instituto de Salud Carlos III (ISCIII), VeraTech For Health, and Barcelona Supercomputing Center for their collaboration on this project. This work was supported by the ISCIII and cofunded by the European Union (grant PI18/00890, PI18/00981, and PI18CIII/00019).</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jungkunz</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Köngeter</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mehlis</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Winkler</surname>
              <given-names>EC</given-names>
            </name>
            <name name-style="western">
              <surname>Schickhardt</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Secondary use of clinical data in data-gathering, non-interventional research or learning activities: definition, types, and a framework for risk assessment</article-title>
          <source>J Med Internet Res</source>
          <year>2021</year>
          <volume>23</volume>
          <issue>6</issue>
          <fpage>e26631</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2021/6/e26631/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/26631</pub-id>
          <pub-id pub-id-type="medline">34100760</pub-id>
          <pub-id pub-id-type="pii">v23i6e26631</pub-id>
          <pub-id pub-id-type="pmcid">PMC8241435</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Safran</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Bloomrosen</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hammond</surname>
              <given-names>WE</given-names>
            </name>
            <name name-style="western">
              <surname>Labkoff</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Markel-Fox</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>PC</given-names>
            </name>
            <name name-style="western">
              <surname>Detmer</surname>
              <given-names>DE</given-names>
            </name>
            <collab>Expert Panel</collab>
          </person-group>
          <article-title>Toward a national framework for the secondary use of health data: an American Medical Informatics Association white paper</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2007</year>
          <volume>14</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/17077452"/>
          </comment>
          <pub-id pub-id-type="doi">10.1197/jamia.M2273</pub-id>
          <pub-id pub-id-type="medline">17077452</pub-id>
          <pub-id pub-id-type="pii">M2273</pub-id>
          <pub-id pub-id-type="pmcid">PMC2329823</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Robertson</surname>
              <given-names>ARR</given-names>
            </name>
            <name name-style="western">
              <surname>Nurmatov</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Sood</surname>
              <given-names>HS</given-names>
            </name>
            <name name-style="western">
              <surname>Cresswell</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Sheikh</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>A systematic scoping review of the domains and innovations in secondary uses of digitised health-related data</article-title>
          <source>J Innov Health Inform</source>
          <year>2016</year>
          <volume>23</volume>
          <issue>3</issue>
          <fpage>611</fpage>
          <lpage>619</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://informatics.bmj.com/lookup/pmidlookup?view=long&#38;pmid=28059695"/>
          </comment>
          <pub-id pub-id-type="doi">10.14236/jhi.v23i3.841</pub-id>
          <pub-id pub-id-type="medline">28059695</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ohmann</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Banzi</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Canham</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Battaglia</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Matei</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ariyo</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Becnel</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Bierer</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Bowers</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Clivio</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Dias</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Druml</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Faure</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Fenner</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Galvez</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ghersi</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Gluud</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Groves</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Houston</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Karam</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Kalra</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Knowles</surname>
              <given-names>RL</given-names>
            </name>
            <name name-style="western">
              <surname>Krleža-Jerić</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kubiak</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Kuchinke</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Kush</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Lukkarinen</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Marques</surname>
              <given-names>PS</given-names>
            </name>
            <name name-style="western">
              <surname>Newbigging</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>O'Callaghan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ravaud</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Schlünder</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Shanahan</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Sitter</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Spalding</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Tudur-Smith</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>van Reusel</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>van Veen</surname>
              <given-names>EB</given-names>
            </name>
            <name name-style="western">
              <surname>Visser</surname>
              <given-names>GR</given-names>
            </name>
            <name name-style="western">
              <surname>Wilson</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Demotes-Mainard</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Sharing and reuse of individual participant data from clinical trials: principles and recommendations</article-title>
          <source>BMJ Open</source>
          <year>2017</year>
          <volume>7</volume>
          <issue>12</issue>
          <fpage>e018647</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmjopen.bmj.com/lookup/pmidlookup?view=long&#38;pmid=29247106"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmjopen-2017-018647</pub-id>
          <pub-id pub-id-type="medline">29247106</pub-id>
          <pub-id pub-id-type="pii">bmjopen-2017-018647</pub-id>
          <pub-id pub-id-type="pmcid">PMC5736032</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hey</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Kurbanoğlu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Al</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Erdoğan</surname>
              <given-names>PL</given-names>
            </name>
            <name name-style="western">
              <surname>Tonta</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Uçak</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>The fourth paradigm—data-intensive scientific discovery</article-title>
          <source>E-Science and Information Management. IMCW 2012. Communications in Computer and Information Science, vol 317</source>
          <year>2012</year>
          <publisher-loc>Berlin</publisher-loc>
          <publisher-name>Springer</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pedrera-Jiménez</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>García-Barrio</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Rubio-Mayo</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Tato-Gómez</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Cruz-Bermúdez</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Bernal-Sobrino</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Muñoz-Carrero</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Serrano-Balazote</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>TransformEHRs: a flexible methodology for building transparent ETL processes for EHR reuse</article-title>
          <source>Methods Inf Med</source>
          <year>2022</year>
          <volume>61</volume>
          <issue>S 02</issue>
          <fpage>e89</fpage>
          <lpage>e102</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.thieme-connect.com/DOI/DOI?10.1055/s-0042-1757763"/>
          </comment>
          <pub-id pub-id-type="doi">10.1055/s-0042-1757763</pub-id>
          <pub-id pub-id-type="medline">36220109</pub-id>
          <pub-id pub-id-type="pmcid">PMC9788916</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="web">
          <article-title>Health informatics—electronic health record communication—Part 1: Reference model</article-title>
          <source>ISO</source>
          <access-date>2023-02-08</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.iso.org/standard/67868.html">https://www.iso.org/standard/67868.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="web">
          <article-title>Health informatics—electronic health record communication—Part 2: Archetype interchange specification</article-title>
          <source>ISO</source>
          <access-date>2023-02-08</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.iso.org/standard/62305.html">https://www.iso.org/standard/62305.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="web">
          <article-title>ISO 13940:2015—Health informatics—system of concepts to support continuity of care</article-title>
          <source>ISO</source>
          <access-date>2022-06-04</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.iso.org/standard/58102.html">https://www.iso.org/standard/58102.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <collab>OHDSI</collab>
          </person-group>
          <source>The Book of OHDSI: Observational Health Data Sciences and Informatics</source>
          <year>2019</year>
          <publisher-loc>North Bethesda, MD</publisher-loc>
          <publisher-name>OHDSI</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hripcsak</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Duke</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>NH</given-names>
            </name>
            <name name-style="western">
              <surname>Reich</surname>
              <given-names>CG</given-names>
            </name>
            <name name-style="western">
              <surname>Huser</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Schuemie</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Suchard</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>RW</given-names>
            </name>
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>ICK</given-names>
            </name>
            <name name-style="western">
              <surname>Rijnbeek</surname>
              <given-names>PR</given-names>
            </name>
            <name name-style="western">
              <surname>van der Lei</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Pratt</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Norén</surname>
              <given-names>GN</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>YC</given-names>
            </name>
            <name name-style="western">
              <surname>Stang</surname>
              <given-names>PlE</given-names>
            </name>
            <name name-style="western">
              <surname>Madigan</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Ryan</surname>
              <given-names>PB</given-names>
            </name>
          </person-group>
          <article-title>Observational Health Data Sciences and Informatics (OHDSI): opportunities for observational researchers</article-title>
          <source>Stud Health Technol Inform</source>
          <year>2015</year>
          <volume>216</volume>
          <fpage>574</fpage>
          <lpage>578</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/26262116"/>
          </comment>
          <pub-id pub-id-type="medline">26262116</pub-id>
          <pub-id pub-id-type="pmcid">PMC4815923</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Overhage</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Ryan</surname>
              <given-names>PB</given-names>
            </name>
            <name name-style="western">
              <surname>Reich</surname>
              <given-names>CG</given-names>
            </name>
            <name name-style="western">
              <surname>Hartzema</surname>
              <given-names>AG</given-names>
            </name>
            <name name-style="western">
              <surname>Stang</surname>
              <given-names>PE</given-names>
            </name>
          </person-group>
          <article-title>Validation of a common data model for active safety surveillance research</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2012</year>
          <volume>19</volume>
          <issue>1</issue>
          <fpage>54</fpage>
          <lpage>60</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/22037893"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/amiajnl-2011-000376</pub-id>
          <pub-id pub-id-type="medline">22037893</pub-id>
          <pub-id pub-id-type="pii">amiajnl-2011-000376</pub-id>
          <pub-id pub-id-type="pmcid">PMC3240764</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Garza</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Del Fiol</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Tenenbaum</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Walden</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Zozus</surname>
              <given-names>MN</given-names>
            </name>
          </person-group>
          <article-title>Evaluating common data models for use with a longitudinal community registry</article-title>
          <source>J Biomed Inform</source>
          <year>2016</year>
          <volume>64</volume>
          <fpage>333</fpage>
          <lpage>341</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(16)30153-8"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2016.10.016</pub-id>
          <pub-id pub-id-type="medline">27989817</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(16)30153-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC6810649</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Maldonado</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Moner</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Boscá</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Fernández-Breis</surname>
              <given-names>JT</given-names>
            </name>
            <name name-style="western">
              <surname>Angulo</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Robles</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>LinkEHR-Ed: a multi-reference model archetype editor based on formal semantics</article-title>
          <source>Int J Med Inform</source>
          <year>2009</year>
          <volume>78</volume>
          <issue>8</issue>
          <fpage>559</fpage>
          <lpage>570</lpage>
          <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2009.03.006</pub-id>
          <pub-id pub-id-type="medline">19386540</pub-id>
          <pub-id pub-id-type="pii">S1386-5056(09)00051-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Maggio</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Stranack</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Understanding Creative Commons</article-title>
          <source>Acad Med</source>
          <year>2020</year>
          <volume>95</volume>
          <issue>2</issue>
          <fpage>322</fpage>
          <pub-id pub-id-type="doi">10.1097/ACM.0000000000003031</pub-id>
          <pub-id pub-id-type="medline">31599759</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lozano-Rubí</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Muñoz Carrero</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Serrano Balazote</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Pastor</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>OntoCR: a CEN/ISO-13606 clinical repository based on ontologies</article-title>
          <source>J Biomed Inform</source>
          <year>2016</year>
          <volume>60</volume>
          <fpage>224</fpage>
          <lpage>233</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(16)00029-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2016.02.007</pub-id>
          <pub-id pub-id-type="medline">26911524</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(16)00029-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lozano-Rubí</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <source>A Metamodel for Clinical Data Integration: Basis for a New EHR Model Driven by Ontologies</source>
          <year>2017</year>
          <access-date>2023-02-08</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.tdx.cat/bitstream/handle/10803/399855/rlr1de1.pdf?sequence=1">https://www.tdx.cat/bitstream/handle/10803/399855/rlr1de1.pdf?sequence=1</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="web">
          <article-title>OWL Web Ontology Language Reference</article-title>
          <source>OWL</source>
          <access-date>2022-05-13</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.w3.org/TR/owl-features">http://www.w3.org/TR/owl-features</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Musen</surname>
              <given-names>MA</given-names>
            </name>
            <collab>Protégé Team</collab>
          </person-group>
          <article-title>The Protégé project: a look back and a look forward</article-title>
          <source>AI Matters</source>
          <year>2015</year>
          <volume>1</volume>
          <issue>4</issue>
          <fpage>4</fpage>
          <lpage>12</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/27239556"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/2757001.2757003</pub-id>
          <pub-id pub-id-type="medline">27239556</pub-id>
          <pub-id pub-id-type="pmcid">PMC4883684</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pedrera-Jiménez</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>García-Barrio</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Cruz-Rojo</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Terriza-Torres</surname>
              <given-names>AI</given-names>
            </name>
            <name name-style="western">
              <surname>López-Jiménez</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Calvo-Boyero</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Jiménez-Cerezo</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Blanco-Martínez</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Roig-Domínguez</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Cruz-Bermúdez</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Bernal-Sobrino</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Serrano-Balazote</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Muñoz-Carrero</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Obtaining EHR-derived datasets for COVID-19 research within a short time: a flexible methodology based on detailed clinical models</article-title>
          <source>J Biomed Inform</source>
          <year>2021</year>
          <volume>115</volume>
          <fpage>103697</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(21)00026-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2021.103697</pub-id>
          <pub-id pub-id-type="medline">33548541</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(21)00026-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC7857038</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kalra</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Beale</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Heard</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>The openEHR Foundation</article-title>
          <source>Stud Health Technol Inform</source>
          <year>2005</year>
          <volume>115</volume>
          <fpage>153</fpage>
          <lpage>173</lpage>
          <pub-id pub-id-type="medline">16160223</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ayaz</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Pasha</surname>
              <given-names>MF</given-names>
            </name>
            <name name-style="western">
              <surname>Alzahrani</surname>
              <given-names>MY</given-names>
            </name>
            <name name-style="western">
              <surname>Budiarto</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Stiawan</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>The fast health interoperability resources (FHIR) standard: systematic literature review of implementations, applications, challenges and opportunities</article-title>
          <source>JMIR Med Inform</source>
          <year>2021</year>
          <volume>9</volume>
          <issue>7</issue>
          <fpage>e21929</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2021/7/e21929/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/21929</pub-id>
          <pub-id pub-id-type="medline">34328424</pub-id>
          <pub-id pub-id-type="pii">v9i7e21929</pub-id>
          <pub-id pub-id-type="pmcid">PMC8367140</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Murphy</surname>
              <given-names>SN</given-names>
            </name>
            <name name-style="western">
              <surname>Weber</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Mendis</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gainer</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Chueh</surname>
              <given-names>HC</given-names>
            </name>
            <name name-style="western">
              <surname>Churchill</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kohane</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Serving the enterprise and beyond with informatics for integrating biology and the bedside (i2b2)</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2010</year>
          <volume>17</volume>
          <issue>2</issue>
          <fpage>124</fpage>
          <lpage>130</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/20190053"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/jamia.2009.000893</pub-id>
          <pub-id pub-id-type="medline">20190053</pub-id>
          <pub-id pub-id-type="pii">17/2/124</pub-id>
          <pub-id pub-id-type="pmcid">PMC3000779</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pedrera-Jiménez</surname>
              <given-names>M</given-names>
            </name>
            <collab>Spanish Expert Group on EHR standards</collab>
            <name name-style="western">
              <surname>Kalra</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Beale</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Muñoz-Carrero</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Serrano-Balazote</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Can OpenEHR, ISO 13606 and HL7 FHIR work together? An agnostic perspective for the selection and application of EHR standards from Spain</article-title>
          <source>TechRxiv. Preprint posted online on May 25, 2022</source>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.techrxiv.org/articles/preprint/Can_OpenEHR_ISO_13606_and_HL7_FHIR_work_together_An_agnostic_perspective_for_the_selection_and_application_of_EHR_standards_from_Spain/19746484/1"/>
          </comment>
          <pub-id pub-id-type="doi">10.36227/techrxiv.19746484</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Haarbrandt</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Tute</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Marschollek</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Automated population of an i2b2 clinical data warehouse from an openEHR-based data repository</article-title>
          <source>J Biomed Inform</source>
          <year>2016</year>
          <volume>63</volume>
          <fpage>277</fpage>
          <lpage>294</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(16)30084-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2016.08.007</pub-id>
          <pub-id pub-id-type="medline">27507090</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(16)30084-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pathak</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bailey</surname>
              <given-names>KR</given-names>
            </name>
            <name name-style="western">
              <surname>Beebe</surname>
              <given-names>CE</given-names>
            </name>
            <name name-style="western">
              <surname>Bethard</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Carrell</surname>
              <given-names>DS</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Dligach</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Endle</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Hart</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Haug</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Huff</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Kaggal</surname>
              <given-names>VC</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Marchant</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Masanz</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Oniki</surname>
              <given-names>TA</given-names>
            </name>
            <name name-style="western">
              <surname>Palmer</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Peterson</surname>
              <given-names>KJ</given-names>
            </name>
            <name name-style="western">
              <surname>Rea</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Savova</surname>
              <given-names>GK</given-names>
            </name>
            <name name-style="western">
              <surname>Stancl</surname>
              <given-names>CR</given-names>
            </name>
            <name name-style="western">
              <surname>Sohn</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Solbrig</surname>
              <given-names>HR</given-names>
            </name>
            <name name-style="western">
              <surname>Suesse</surname>
              <given-names>DB</given-names>
            </name>
            <name name-style="western">
              <surname>Tao</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Taylor</surname>
              <given-names>DP</given-names>
            </name>
            <name name-style="western">
              <surname>Westberg</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zhuo</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Chute</surname>
              <given-names>CG</given-names>
            </name>
          </person-group>
          <article-title>Normalization and standardization of electronic health records for high-throughput phenotyping: the SHARPn consortium</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2013</year>
          <volume>20</volume>
          <issue>e2</issue>
          <fpage>e341</fpage>
          <lpage>e348</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/24190931"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/amiajnl-2013-001939</pub-id>
          <pub-id pub-id-type="medline">24190931</pub-id>
          <pub-id pub-id-type="pii">amiajnl-2013-001939</pub-id>
          <pub-id pub-id-type="pmcid">PMC3861933</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cimino</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Ayres</surname>
              <given-names>EJ</given-names>
            </name>
          </person-group>
          <article-title>The clinical research data repository of the US National Institutes of Health</article-title>
          <source>Stud Health Technol Inform</source>
          <year>2010</year>
          <volume>160</volume>
          <issue>Pt 2</issue>
          <fpage>1299</fpage>
          <lpage>1303</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/20841894"/>
          </comment>
          <pub-id pub-id-type="medline">20841894</pub-id>
          <pub-id pub-id-type="pmcid">PMC3408090</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Anderson</surname>
              <given-names>NR</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>ES</given-names>
            </name>
            <name name-style="western">
              <surname>Brockenbrough</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Minie</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Fuller</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Brinkley</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Tarczy-Hornoch</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Issues in biomedical research data management and analysis: needs and barriers</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2007</year>
          <volume>14</volume>
          <issue>4</issue>
          <fpage>478</fpage>
          <lpage>488</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/17460139"/>
          </comment>
          <pub-id pub-id-type="doi">10.1197/jamia.M2114</pub-id>
          <pub-id pub-id-type="medline">17460139</pub-id>
          <pub-id pub-id-type="pii">M2114</pub-id>
          <pub-id pub-id-type="pmcid">PMC2244904</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Paris</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Lamer</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Parrot</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Transformation and evaluation of the MIMIC database in the OMOP common data model: development and usability study</article-title>
          <source>JMIR Med Inform</source>
          <year>2021</year>
          <volume>9</volume>
          <issue>12</issue>
          <fpage>e30970</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2021/12/e30970/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/30970</pub-id>
          <pub-id pub-id-type="medline">34904958</pub-id>
          <pub-id pub-id-type="pii">v9i12e30970</pub-id>
          <pub-id pub-id-type="pmcid">PMC8715361</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pacaci</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gonul</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sinaci</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Yuksel</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Laleci Erturkmen</surname>
              <given-names>GB</given-names>
            </name>
          </person-group>
          <article-title>A semantic transformation methodology for the secondary use of observational healthcare data in postmarketing safety studies</article-title>
          <source>Front Pharmacol</source>
          <year>2018</year>
          <volume>9</volume>
          <fpage>435</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/29760661"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fphar.2018.00435</pub-id>
          <pub-id pub-id-type="medline">29760661</pub-id>
          <pub-id pub-id-type="pmcid">PMC5937227</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Depraetere</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>De Roo</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Mels</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>De Vloed</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Twagirumukiza</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Colaert</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Semantic processing of EHR data for clinical research</article-title>
          <source>J Biomed Inform</source>
          <year>2015</year>
          <volume>58</volume>
          <fpage>247</fpage>
          <lpage>259</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(15)00231-2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2015.10.009</pub-id>
          <pub-id pub-id-type="medline">26515501</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(15)00231-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="web">
          <article-title>infobank</article-title>
          <source>Comunidad de Madrid</source>
          <access-date>2023-02-08</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://cpisanidadcm.org/infobanco/">https://cpisanidadcm.org/infobanco/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gaudet-Blavignac</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Raisaro</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Touré</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Österle</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Crameri</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Lovis</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>A national, semantic-driven, three-pillar strategy to enable health data secondary usage interoperability for research within the Swiss personalized health network: methodological study</article-title>
          <source>JMIR Med Inform</source>
          <year>2021</year>
          <volume>9</volume>
          <issue>6</issue>
          <fpage>e27591</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2021/6/e27591/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/27591</pub-id>
          <pub-id pub-id-type="medline">34185008</pub-id>
          <pub-id pub-id-type="pii">v9i6e27591</pub-id>
          <pub-id pub-id-type="pmcid">PMC8277320</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="web">
          <article-title>Accelerating research in genomic oncology</article-title>
          <source>ICGC ARGO</source>
          <access-date>2023-02-08</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.icgc-argo.org/">https://www.icgc-argo.org/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="web">
          <article-title>Standards</article-title>
          <source>CDISC</source>
          <access-date>2023-02-08</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cdisc.org/standards">https://www.cdisc.org/standards</ext-link>
          </comment>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
