<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id>
      <journal-title>JMIR Medical Informatics</journal-title>
      <issn pub-type="epub">2291-9694</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v11i1e43847</article-id>
      <article-id pub-id-type="pmid">36943344</article-id>
      <article-id pub-id-type="doi">10.2196/43847</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>A Standardized Clinical Data Harmonization Pipeline for Scalable AI Application Deployment (FHIR-DHP): Validation and Usability Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Lovis</surname>
            <given-names>Christian</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Bartschke</surname>
            <given-names>Alexander</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Gupta</surname>
            <given-names>Ketan</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author">
          <name name-style="western">
            <surname>Williams</surname>
            <given-names>Elena</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9396-2078</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Kienast</surname>
            <given-names>Manuel</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-5522-6619</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Medawar</surname>
            <given-names>Evelyn</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>AICURA Medical GmbH</institution>
            <addr-line>Bessemerstr 22</addr-line>
            <addr-line>Berlin, 12103</addr-line>
            <country>Germany</country>
            <phone>49 173 9449677</phone>
            <email>evelyn.medawar@aicura-medical.com</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-5011-8275</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Reinelt</surname>
            <given-names>Janis</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0321-8334</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Merola</surname>
            <given-names>Alberto</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0900-963X</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Klopfenstein</surname>
            <given-names>Sophie Anne Ines</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-8470-2258</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Flint</surname>
            <given-names>Anne Rike</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-1414-5812</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author">
          <name name-style="western">
            <surname>Heeren</surname>
            <given-names>Patrick</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9356-2296</ext-link>
        </contrib>
        <contrib id="contrib9" contrib-type="author">
          <name name-style="western">
            <surname>Poncette</surname>
            <given-names>Akira-Sebastian</given-names>
          </name>
          <degrees>MD, PD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-4627-7016</ext-link>
        </contrib>
        <contrib id="contrib10" contrib-type="author">
          <name name-style="western">
            <surname>Balzer</surname>
            <given-names>Felix</given-names>
          </name>
          <degrees>Prof Dr</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-1575-2056</ext-link>
        </contrib>
        <contrib id="contrib11" contrib-type="author">
          <name name-style="western">
            <surname>Beimes</surname>
            <given-names>Julian</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-8602-2838</ext-link>
        </contrib>
        <contrib id="contrib12" contrib-type="author">
          <name name-style="western">
            <surname>von Bünau</surname>
            <given-names>Paul</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6806-0718</ext-link>
        </contrib>
        <contrib id="contrib13" contrib-type="author">
          <name name-style="western">
            <surname>Chromik</surname>
            <given-names>Jonas</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-5709-4381</ext-link>
        </contrib>
        <contrib id="contrib14" contrib-type="author">
          <name name-style="western">
            <surname>Arnrich</surname>
            <given-names>Bert</given-names>
          </name>
          <degrees>Prof Dr</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8380-7667</ext-link>
        </contrib>
        <contrib id="contrib15" contrib-type="author">
          <name name-style="western">
            <surname>Scherf</surname>
            <given-names>Nico</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-4003-9121</ext-link>
        </contrib>
        <contrib id="contrib16" contrib-type="author">
          <name name-style="western">
            <surname>Niehaus</surname>
            <given-names>Sebastian</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-1291-6836</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>AICURA Medical GmbH</institution>
        <addr-line>Berlin</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Institute of Medical Informatics</institution>
        <institution>Charité – Universitätsmedizin Berlin</institution>
        <addr-line>Berlin</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>idalab GmbH</institution>
        <addr-line>Berlin</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Digital Health – Connected Healthcare, Hasso Plattner Institute</institution>
        <institution>University of Potsdam</institution>
        <addr-line>Potsdam</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>Max Planck Institute for Human Cognitive and Brain Sciences</institution>
        <addr-line>Leipzig</addr-line>
        <country>Germany</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Evelyn Medawar <email>evelyn.medawar@aicura-medical.com</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2023</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>21</day>
        <month>3</month>
        <year>2023</year>
      </pub-date>
      <volume>11</volume>
      <elocation-id>e43847</elocation-id>
      <history>
        <date date-type="received">
          <day>7</day>
          <month>11</month>
          <year>2022</year>
        </date>
        <date date-type="rev-request">
          <day>27</day>
          <month>12</month>
          <year>2022</year>
        </date>
        <date date-type="rev-recd">
          <day>24</day>
          <month>1</month>
          <year>2023</year>
        </date>
        <date date-type="accepted">
          <day>25</day>
          <month>1</month>
          <year>2023</year>
        </date>
      </history>
      <copyright-statement>©Elena Williams, Manuel Kienast, Evelyn Medawar, Janis Reinelt, Alberto Merola, Sophie Anne Ines Klopfenstein, Anne Rike Flint, Patrick Heeren, Akira-Sebastian Poncette, Felix Balzer, Julian Beimes, Paul von Bünau, Jonas Chromik, Bert Arnrich, Nico Scherf, Sebastian Niehaus. Originally published in JMIR Medical Informatics (https://medinform.jmir.org), 21.03.2023.</copyright-statement>
      <copyright-year>2023</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on https://medinform.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://medinform.jmir.org/2023/1/e43847" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Increasing digitalization in the medical domain gives rise to large amounts of health care data, which has the potential to expand clinical knowledge and transform patient care if leveraged through artificial intelligence (AI). Yet, big data and AI oftentimes cannot unlock their full potential at scale, owing to nonstandardized data formats, lack of technical and semantic data interoperability, and limited cooperation between stakeholders in the health care system. Despite the existence of standardized data formats for the medical domain, such as Fast Healthcare Interoperability Resources (FHIR), their prevalence and usability for AI remain limited.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>In this paper, we developed a data harmonization pipeline (DHP) for clinical data sets relying on the common FHIR data standard.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We validated the performance and usability of our FHIR-DHP with data from the Medical Information Mart for Intensive Care IV database.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>We present the FHIR-DHP workflow in respect of the transformation of “raw” hospital records into a harmonized, AI-friendly data representation. The pipeline consists of the following 5 key preprocessing steps: querying of data from hospital database, FHIR mapping, syntactic validation, transfer of harmonized data into the patient-model database, and export of data in an AI-friendly format for further medical applications. A detailed example of FHIR-DHP execution was presented for clinical diagnoses records.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Our approach enables the scalable and needs-driven data modeling of large and heterogenous clinical data sets. The FHIR-DHP is a pivotal step toward increasing cooperation, interoperability, and quality of patient care in the clinical routine and for medical research.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>data interoperability</kwd>
        <kwd>fast healthcare interoperability resources</kwd>
        <kwd>FHIR</kwd>
        <kwd>data standardization pipeline</kwd>
        <kwd>medical information mart for intensive care</kwd>
        <kwd>MIMIC IV</kwd>
        <kwd>artificial intelligence</kwd>
        <kwd>AI application</kwd>
        <kwd>AI</kwd>
        <kwd>deployment</kwd>
        <kwd>data</kwd>
        <kwd>usability</kwd>
        <kwd>care unit</kwd>
        <kwd>diagnosis</kwd>
        <kwd>cooperation</kwd>
        <kwd>patient care</kwd>
        <kwd>care</kwd>
        <kwd>medical research</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>The increasing digitalization of health care creates vast amounts of clinical data that are collected and stored in an Electronic Health Record (EHR). Patient information from all medical domains is captured in diverse sets of data recorded in stand-alone systems. With the prevalent use of EHRs in health care organizations, there is abundant opportunity for the additional application of EHR data in clinical and translational research. For instance, such data can be used to develop artificial intelligence (AI) algorithms, which have the potential to transform patient care and medical research. Resource-intensive and inefficient clinical workflows could be optimized by the analysis of historical data with AI applications [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>]. In particular, the time-consuming and financially costly process of identifying and enrolling the right patients into a clinical trial manually can be reduced significantly by automation [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref4">4</xref>]. However, the exchange of medical data remains limited due to the lack of data interoperability between health care providers, owing to outdated IT infrastructure, inconsistencies in data formats, poor data quality, inadequate data exchange solutions, and data silos [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref6">6</xref>]. To achieve data interoperability, the following steps must be incorporated: (1) integration of isolated data silos, (2) safe exchange of data, and (3) effective use of the available data [<xref ref-type="bibr" rid="ref7">7</xref>]. Each of these operations includes database schema matching [<xref ref-type="bibr" rid="ref8">8</xref>] and schema mapping [<xref ref-type="bibr" rid="ref9">9</xref>], which allow translation of the relationships between the source database and the target data standard.</p>
      <p>Employing a harmonized data format will facilitate the exchange of medical data, enabling wide-ranging data-driven collaborations within the private and public health care sectors. Data interoperability requires EHR data to be structured in a common format and in standardized terminologies. Standardization is often performed by adopting the Health Level 7 Fast Healthcare Interoperability Resources (FHIR) model [<xref ref-type="bibr" rid="ref10">10</xref>], which is supported by numerous health care institutions and vendors of clinical information systems [<xref ref-type="bibr" rid="ref11">11</xref>]. FHIR is an international industry standard that integrates diverse sets of data in well-defined exchangeable segments of information, which are known as FHIR resources. Therefore, FHIR facilitates interoperability between health care organizations and allows third-party developers to provide medical applications that can be easily integrated into the existing systems. FHIR enables the harmonization of data and thus allows standardized data processing as well as the rollout of AI applications across different clinics and hospitals regardless of which information system they use. Consequently, FHIR forms an important component for the scalable development and deployment of AI in clinics and hospitals.</p>
      <p>However, to apply AI, the input data need to be adapted to the AI algorithms. The conventional AI frameworks such as Tensorflow [<xref ref-type="bibr" rid="ref12">12</xref>] and Pytorch [<xref ref-type="bibr" rid="ref13">13</xref>] require data to take a tensor form, which is a vector or matrix of n-dimensions that represents various types of data (eg, tabular, time series, image, and text). Since the FHIR format has a multilayered nested structure, a use case–specific data preprocessing is needed. For instance, depending on the AI application and the chosen data source, a custom data preprocessing pipeline should be designed leading to diminished AI scalability. Prior research addressed this problem in different forms but focused on individual applications, thereby constraining the purpose of FHIR to be applicable regardless of the use case [<xref ref-type="bibr" rid="ref11">11</xref>]. There have been a few attempts to flatten the hierarchical FHIR structure and transform it into NDJSON-based data format [<xref ref-type="bibr" rid="ref14">14</xref>] or tabular format saved in CSV files [<xref ref-type="bibr" rid="ref15">15</xref>]. Such formats are more AI-friendly as they represent the data in a more accessible and standardized form for an application of common AI frameworks. Nonetheless, the NDJSON-based FHIR data transformation approach [<xref ref-type="bibr" rid="ref14">14</xref>] does not provide data selection criteria and filtering capabilities [<xref ref-type="bibr" rid="ref16">16</xref>]. The approach presented in [<xref ref-type="bibr" rid="ref15">15</xref>] requires expert knowledge of FHIRPath query language. Moreover, FHIR-based data preprocessing pipelines have been implemented in different contexts, for instance, as electronic data capture [<xref ref-type="bibr" rid="ref17">17</xref>], as a natural language processing tool [<xref ref-type="bibr" rid="ref12">12</xref>], and as a standardization protocol based on the Resource Description Framework [<xref ref-type="bibr" rid="ref6">6</xref>]. Despite the immense benefit they offer regarding processing EHR data, existing approaches are limited to specific use cases or require considerable data preparation to perform standardization. Furthermore, their final output is not easily accessible by common data preprocessing tools and thus hinders the application of AI.</p>
      <p>In this paper, we address the challenge of data interoperability in the health care sector by proposing an FHIR data harmonization pipeline (DHP) that provides EHR data in an AI-friendly format. The newly developed FHIR-DHP represents a data workflow solution that includes the aforementioned operations, such as data exchange, mapping, and export. Data privacy is a delicate topic in health care and is of great ethical concern [<xref ref-type="bibr" rid="ref18">18</xref>]. Given the degree of automation, FHIR-DHP should allow the preprocessing of unseen data in an isolated hospital environment, which makes harmonization privacy preserving.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Ethical Considerations</title>
        <p>The authors did not seek an ethics review board assessment due to the methodology of the study, which included open datasets and data preprocessing pipelines only.</p>
      </sec>
      <sec>
        <title>FHIR-DHP Architecture Development</title>
        <p>In our work, we propose a generic solution to harmonize hospital EHR data. The FHIR-DHP was designed based on the extract-transform-load framework [<xref ref-type="bibr" rid="ref19">19</xref>], in which the data are pulled out (ie, queried) from diverse sources, processed into the desired format, and loaded into a data warehouse, namely the ”patient-model” database (DB). As the hospital database contains highly sensitive patient data, it is located behind the hospital’s security infrastructure and is completely isolated from outside access. Therefore, an edge-computation solution was designed, bringing the FHIR-DHP into the hospital’s own infrastructure. The edge-computation solution represents a set of frameworks that perform data querying, preprocessing, storage, and export. In this setting, direct access to the sensitive data is not required to run the standardization pipeline. The queries to the data are defined beforehand based on the database documentation.</p>
        <p>To bring the data into a harmonized form, we used an FHIR data model, which is applied by mapping the relationships between the source database and the desired data standard. The FHIR standard is straightforward to implement because it provides a choice of JSON, XML, or resource description format for data representation. The mapping pipeline was developed in the Python programming language to translate queried hospital data into matching FHIR concepts and save the resulting resources in JSON format. The semantics of features from the source database and FHIR concepts are examined using available database and FHIR documentation. The conversion to FHIR was designed to only support a core release 4 standard of the FHIR format to allow generic data preprocessing.</p>
        <p>To prevent errors in the remote data standardization scenario, the syntactic validation of FHIR resources is necessary. For instance, the conversion of data types can sometimes lead to erroneous values, especially with date features. Automatic syntactic validation allows the logging of occurred errors and the improvement of harmonization pipeline when working with unseen data. When syntactic validation is completed, FHIR resources should be transferred to the data warehouse to allow the fast and easy retrieval of standardized data for AI applications.</p>
        <p>In the final stage of data export, we designed the output that provides the benefits of the original FHIR format with a high level of clinical detail that is also easily accessible for computational tools. We wanted to restructure the data representation in a way that supports effortless data selection and filtering capabilities and would not require a knowledge of FHIRPath query language. Consequently, this output format would enable the smooth conversion of data into a “tensor” format required by conventional AI frameworks.</p>
      </sec>
      <sec>
        <title>FHIR-DHP Validation</title>
        <p>To demonstrate and evaluate how the FHIR-DHP works, we used the openly available Medical Information Mart for Intensive Care IV (MIMIC IV) database [<xref ref-type="bibr" rid="ref20">20</xref>]. MIMIC IV includes patient data from the intensive care units at a tertiary academic medical center in Boston, MA, United States. We selected a wide range of tables from MIMIC IV, which cover most of the events occurring during the hospital stay as well as core patient details, information about admissions, and hospital transfers (further referred to as core tables). The event tables include laboratory results, diagnoses, prescriptions, and other details, as shown in <xref ref-type="table" rid="table1">Table 1</xref>. In addition, MIMIC IV includes the so-called reference tables containing matching dictionaries with medical terms that are used in the hospital records.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Selected core and event Medical Information Mart for Intensive Care IV (MIMIC IV) tables as well as the reference dictionary tables that were merged together with core and event tables for Fast Healthcare Interoperability Resources mapping.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="480"/>
            <col width="520"/>
            <thead>
              <tr valign="top">
                <td>Selected core and event MIMIC IV tables</td>
                <td>Selected MIMIC IV reference tables</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Patient</td>
                <td>—<sup>a</sup></td>
              </tr>
              <tr valign="top">
                <td>Admissions</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td>Transfers</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td>Chartevents</td>
                <td>d_items</td>
              </tr>
              <tr valign="top">
                <td>Labevents</td>
                <td>d_labitems</td>
              </tr>
              <tr valign="top">
                <td>Procedureevents</td>
                <td>d_items</td>
              </tr>
              <tr valign="top">
                <td>Prescriptions</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td>Inputevents</td>
                <td>d_items</td>
              </tr>
              <tr valign="top">
                <td>Microbiologyevents</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td>Outputevents</td>
                <td>d_items</td>
              </tr>
              <tr valign="top">
                <td>Procedures_icd</td>
                <td>d_icd_procedures</td>
              </tr>
              <tr valign="top">
                <td>Diagnoses_icd</td>
                <td>d_icd_diagnoses</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>Not available.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>The selected tables were mapped to FHIR standard. Automatic semantic validation is unfeasible, so 2 of the authors manually validated the mapping semantics independently of each other. There are many tools that perform automatic syntactic validation, such as the Python-based package “fhir.resources” used herein [<xref ref-type="bibr" rid="ref21">21</xref>]. To evaluate the exporting of data from the patient-model DB, we retrieved the diagnosis records.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>FHIR-DHP Architecture</title>
        <p>The approach presented here represents a scalable protocol for harmonizing hospital EHR data sets based on 5 stages from data query to data export in a standardized format.</p>
        <sec>
          <title>Querying Data From the Hospital Database</title>
          <p>To connect the FHIR-DHP pipeline to the hospital DB, a communication server is employed. This server runs all necessary queries to retrieve the patient data. The query execution can be run at regular intervals as well as in batches of patients, so as not to overload the data pipeline. Furthermore, the queries prestructure the data according to their semantic relations before proceeding to data mapping.</p>
        </sec>
        <sec>
          <title>Mapping Data to FHIR</title>
          <p>FHIR allows describing data formats and elements that are recorded as “resources” and an application programming interface for exchanging EHRs. To perform the mappings, semantics of features from the source database and FHIR concepts are explored as well as the relationships between the data tables. Consequently, the mappings between the database tables and FHIR resources are defined. Features where a matching FHIR concept is not found are excluded. The resulting FHIR resources are then saved in JSON format.</p>
        </sec>
        <sec>
          <title>Syntactic Validation of FHIR Mappings</title>
          <p>During validation, mapped data are ensured to have the correct data types as well as the syntactic format where the hierarchy is maintained, and entries follow FHIR standard specifications. All mappings are validated first during the development stage to identify structural errors and data type inconsistencies. A validation algorithm is incorporated into the pipeline to confirm the correctness of the transformed data in the remote data standardization scenario.</p>
        </sec>
        <sec>
          <title>Transferring FHIR Resources to Patient-Model DB</title>
          <p>The DB of choice for the patient model is Postgres [<xref ref-type="bibr" rid="ref22">22</xref>], which is an open-source relational DB management system featuring SQL compliance and storage of JSON documents. The database for the FHIR resources is used to harmonize the locally available data only once to allow the further application of various medical AI-based solutions. The data are stored according to FHIR resource type where each resource is saved in a separate JSON structure.</p>
        </sec>
        <sec>
          <title>Exporting Data Into Custom JSON format</title>
          <p>To export the data from the patient-model DB, the selection is performed by outlining the tables and features of interest in a configuration file, which is then used to determine which harmonized data should be queried. FHIRPath queries were written to retrieve all elements from FHIR resources adhering to specific formatting rules in respect of the predefined key-value structure and to place the extracted elements into the custom JSON file. Such transformation flattens the hierarchical structure of FHIR resources and makes the data more accessible for common data preprocessing tools. The final flattened output does not require expert knowledge of FHIRPath query language and supports effortless data selection and filtering. The resulting file also allows the uncomplicated conversion of data into a “tensor” format required by conventional AI frameworks and fast data selection based on the following 4 keys: feature_name, table_name, value, and metadata.</p>
          <p>In <xref rid="figure1" ref-type="fig">Figure 1</xref>, we demonstrate how the FHIR-DHP recodes nested FHIR syntax to more accessible features in an AI-friendly format. Example FHIR concepts from an observation resource are given in <xref rid="figure1" ref-type="fig">Figure 1</xref>a, where the code’s entity “text” defines the record or measurement label. The entity “text” is often duplicated in the item “display.” However, depending on the coding system, this “display” item can change, whereas “text” always stays the same and is therefore used as a feature name. The information from the FHIR resource is grouped into the 4 concept keys of feature name (eg, “Blood pressure”), value (eg, “114”), table name (eg, “observation”), and metadata (<xref rid="figure1" ref-type="fig">Figure 1</xref>b). For a given FHIR resource type, the metadata may include concepts such as dates, references, coding system details, and resource ID, among other things. As an output, feature names together with a corresponding value and available metadata are provided in a custom JSON structure (<xref rid="figure1" ref-type="fig">Figure 1</xref>c). The defined format allows uncomplicated data selection and aggregation based on resource type (eg, “table_name”), feature name, and value. Additional information in a standardized format can be easily accessed from the metadata key and allows further data manipulation.</p>
          <fig id="figure1" position="float">
            <label>Figure 1</label>
            <caption>
              <p>Conceptual overview for an exemplary Fast Healthcare Interoperability Resources (FHIR) structure and hospital record, which are transformed from FHIR standard to an artificial intelligence (AI)–friendly format.</p>
            </caption>
            <graphic xlink:href="medinform_v11i1e43847_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
      </sec>
      <sec>
        <title>FHIR-DHP Validation</title>
        <p>The MIMIC IV data were queried accordingly to the defined FHIR mappings. The core and event MIMIC IV tables were merged with reference tables to contain a complete description of the hospital records. As a result, the data were grouped and restructured into the information blocks required in FHIR standard. Manual independent validation of the mapping semantics resulted in slight discrepancies, which were subsequently resolved to adhere closely to the FHIR standard. The automatic syntactic validation allowed the prompt verification of standardization operations.</p>
        <p><xref ref-type="table" rid="table2">Table 2</xref> shows to which FHIR resources the MIMIC IV tables were mapped. The largest proportion of tables (4 out of 12 tables) were mapped to the <italic>Observation</italic> FHIR resource type, which included lab, microbiology, output, and charted events collected throughout the patient’s stay. The information on admissions and transfers was translated into the <italic>Encounter</italic> FHIR resource (2 out of 12 tables). Procedure events and International Classification of Diseases codes (2 out of 12 tables) were stored in the <italic>Procedure</italic> FHIR resource. Given that the prescriptions table contains medication requests (1 out of 12 tables) and the input events table holds records of medication administration (1 out of 12 tables), these tables were mapped to the corresponding FHIR resource types. Finally, the <italic>Condition</italic> FHIR resource was used to map the table with the patients’ diagnosis details (1 out of 12 tables).</p>
        <p>In <xref ref-type="table" rid="table3">Table 3</xref>, we demonstrate how the mapping of the MIMIC IV “diagnoses_icd” table to <italic>Condition</italic> FHIR resource was conducted. Multiple columns of the “diagnoses_icd” table such as “icd_code”, “icd_version,” and “long_title” were mapped to the FHIR “condition.code” concept, which has a nested structure and provides keys to store the exact International Classification of Diseases code, the version of the coding system, and the code title. The full diagnosis title was mapped both to the “display” and “text” entities.</p>
        <p><xref rid="figure2" ref-type="fig">Figure 2</xref> shows an example of how queried diagnoses records are harmonized to an AI-friendly format. The standardization follows the FHIR-DHP stages described above. At first, the raw data from tables “diagnoses_icd” and “d_icd_diagnoses” are queried (<xref rid="figure2" ref-type="fig">Figure 2</xref>a) and merged accordingly to the defined FHIR mappings. Then, the features are renamed as defined in <xref ref-type="table" rid="table3">Table 3</xref> for the FHIR condition resource, and the required entities such as “resourceType” and “id” are created (<xref rid="figure2" ref-type="fig">Figure 2</xref>b). Finally, the values are placed into a nested FHIR structure (<xref rid="figure2" ref-type="fig">Figure 2</xref>c), and subsequently, the data are transformed into a JSON format (<xref rid="figure2" ref-type="fig">Figure 2</xref>d), which can be automatically validated (<xref rid="figure2" ref-type="fig">Figure 2</xref>e) and saved in the patient-model DB. When the resource is not approved in terms of its syntactic quality (eg, data type, nested structure, or cardinality), an error is raised, which prevents the further saving of this resource in the patient-model DB (<xref rid="figure2" ref-type="fig">Figure 2</xref>e). Otherwise, the resource is transferred into a storage (<xref rid="figure2" ref-type="fig">Figure 2</xref>f), and the requested data are exported in a custom AI-friendly JSON format (<xref rid="figure2" ref-type="fig">Figure 2</xref>g).</p>
        <p>We provide an example of a further 2-step transformation of harmonized diagnosis data to a “tensor” format in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref23">23</xref>].</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Overview of the mappings performed on the selected Medical Information Mart for Intensive Care (MIMIC) database (DB) tables to Fast Healthcare Interoperability Resources (FHIR) types.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="470"/>
            <col width="530"/>
            <thead>
              <tr valign="top">
                <td>MIMIC IV DB</td>
                <td>FHIR resource type</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Patients</td>
                <td>Patient</td>
              </tr>
              <tr valign="top">
                <td>Admissions</td>
                <td>Encounter</td>
              </tr>
              <tr valign="top">
                <td>Transfers</td>
                <td>Encounter</td>
              </tr>
              <tr valign="top">
                <td>Chartevents</td>
                <td>Observation</td>
              </tr>
              <tr valign="top">
                <td>Labevents</td>
                <td>Observation</td>
              </tr>
              <tr valign="top">
                <td>Procedureevents</td>
                <td>Procedure</td>
              </tr>
              <tr valign="top">
                <td>Prescriptions</td>
                <td>MedicationRequest</td>
              </tr>
              <tr valign="top">
                <td>Inputevents</td>
                <td>MedicationAdministration</td>
              </tr>
              <tr valign="top">
                <td>Microbiologyevents</td>
                <td>Observation</td>
              </tr>
              <tr valign="top">
                <td>Outputevents</td>
                <td>Observation</td>
              </tr>
              <tr valign="top">
                <td>Procedure_icd</td>
                <td>Procedure</td>
              </tr>
              <tr valign="top">
                <td>Diagnoses_icd</td>
                <td>Condition</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Mapping of “diagnoses_icd” table to Condition Fast Healthcare Interoperability Resources (FHIR) resource.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="570"/>
            <col width="430"/>
            <thead>
              <tr valign="top">
                <td>MIMIC<sup>a</sup> format</td>
                <td>FHIR resource format</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>mimic.diagnoses_icd.subject_id</td>
                <td>fhir.condition.subject</td>
              </tr>
              <tr valign="top">
                <td>mimic.diagnoses_icd.hadm_id</td>
                <td>fhir.condition.encounter</td>
              </tr>
              <tr valign="top">
                <td>mimic.diagnoses_icd.icd_code</td>
                <td>fhir.condition.code_code</td>
              </tr>
              <tr valign="top">
                <td>mimic.diagnoses_icd.icd_version</td>
                <td>fhir.condition.code_version</td>
              </tr>
              <tr valign="top">
                <td>mimic.diagnoses_icd.long_title</td>
                <td>fhir.condition.code_display</td>
              </tr>
              <tr valign="top">
                <td>mimic.diagnoses_icd.long_title</td>
                <td>fhir.condition.code_text</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>MIMIC: Medical Information Mart for Intensive Care.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Flowchart showing an example diagnosis data being processed through the 5 stages in Fast Healthcare Interoperability Resources (FHIR) data harmonization pipeline (DHP). The first stage (a) includes querying of the diagnoses records, at the second stage (b-c) the data are mapped to FHIR standard, and the third stage carries out the syntactic resource validation. (f) If the FHIR resource is successfully validated, it is being transferred into the patient-model database (DB), and then (g) exported in a custom artificial intelligence (AI)–friendly JSON format.</p>
          </caption>
          <graphic xlink:href="medinform_v11i1e43847_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>The Harmonization of EHR data is a crucial step toward increasing cooperation, interoperability, and quality of patient care in the clinical routine and medical research. To drive the harmonization of medical data forward, we developed the FHIR-DHP and evaluated it on key MIMIC IV tables. A detailed example of data standardization was presented for clinical diagnosis records from the MIMIC IV database. The FHIR-DHP allows the querying of health data in an isolated environment by employing an edge-computation solution and a communication server, which retrieve patient data and prestructure it for further mapping to the FHIR standard. A validation step ensures syntactic compliance and initiates the transfer of formatted data to the patient-model DB. The data export provides FHIR resources in a custom JSON file format.</p>
        <p>Owing to the FHIR format’s multilayered nested structure, its accessibility for AI algorithms is low as it requires transformation into a format compatible with common data preprocessing tools. Thus far, a number of studies have attempted to solve this problem. However, the final output of these studies has not supported data selection criteria and filtering capabilities [<xref ref-type="bibr" rid="ref14">14</xref>] and requires expert knowledge of FHIRPath query language [<xref ref-type="bibr" rid="ref15">15</xref>]. In this study, we introduce a custom JSON format that represents a higher level of abstraction to support easier data selection based on the following 4 keys: feature_name, table_name, value, and metadata. Moreover, the newly developed JSON structure fits the expected data format of common data preprocessing frameworks, which are designed to work efficiently with tabular data. As a result, the output presented facilitates the generic and fast deployment of AI and patient cohort identification algorithms.</p>
        <p>In comparison to [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref24">24</xref>], the details of FHIR-DHP execution inside the hospital environment in respect of protecting data privacy are discussed. This step, though crucial, is often omitted and left out of the published standardization protocols. The edge-computation solution sets up the FHIR-DHP in a privacy-preserving way where the preprocessing of the patient-related data is performed inside the hospital and is completely isolated from outside access. The so-called federated learning (FL) framework [<xref ref-type="bibr" rid="ref25">25</xref>] can be integrated into the FHIR-DHP workflow to run algorithms locally, using data from the on-premises database in the respective hospitals and to merge model parameters centrally in the cloud without any patient data leaving the hospital. The FL framework requires data to be in a consistent format across various hospital systems. The developed pipeline achieves such a format and enables the scaling of AI applications.</p>
        <p>Thus far, there are only 2 studies attempting to perform the mapping of an MIMIC IV database [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref27">27</xref>]. In [<xref ref-type="bibr" rid="ref26">26</xref>], the mapping was performed on fewer tables than our approach (8 versus 12 tables). The FHIR mappings from [<xref ref-type="bibr" rid="ref27">27</xref>] have been recently released and were not yet widely validated. Similar to the approach taken in [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref26">26</xref>], FHIR-DHP includes the verification of the performed FHIR mapping, which is essential to ensure the validity of data transformation and to adhere to FHIR version updates. Moreover, in comparison to [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref26">26</xref>], FHIR-DHP represents a generic approach to standardize EHR data and can be applied to various hospital database systems.</p>
        <p>With the introduction of the FHIR-DHP into the hospital environment, a number of patient-stay parameters can be potentially optimized using AI-based algorithms. For example, the length of stay as well as mortality could be reduced [<xref ref-type="bibr" rid="ref28">28</xref>], and patients suitable for trial treatment could be automatically and efficiently identified [<xref ref-type="bibr" rid="ref29">29</xref>]. In consequence, the financial impact on medical providers in respect of personnel time and resources would decrease considerably. The FHIR-DHP aims to bring health care closer to digital transformation and thus toward “Healthcare 4.0” [<xref ref-type="bibr" rid="ref30">30</xref>] by making EHR data usable “from bedside-to-bench.” By inverting the idea of translational research, in contrast to “from bench-to-bedside,” accessing the full potential of medical big data with AI will further inform and advance basic research.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>There are several limitations that we would like to emphasize. FHIR-DHP only works with a core standard of the FHIR format. Those core FHIR resource types have a bounded set of concepts that present a constraint to mapping accuracy. Although the standard resources can be expanded using a profiling technique or FHIR extensions, the use of those would make the FHIR-DHP less generic. Hence, we implemented the mapping using only the standard FHIR resources and omitted some of the MIMIC IV data features that did not have a matching concept in FHIR. Additionally, the FHIR mapping step is subject to the extent of the detail of the database documentation used to infer the semantic and syntactic properties of the data. A solution for an automatic concept recognition can potentially solve this problem. The existing approach in [<xref ref-type="bibr" rid="ref6">6</xref>] is limited to a small number of FHIR resources and requires an extensive data preparation. Further experiments in this direction could alleviate the concept-matching problem and the requirement for a detailed database description. Moreover, the validation and robustness of FHIR-DHP needs to be tested on other EHR data sets to evaluate its generic setup. In addition, to validate the FHIR-DHP compatibility with machine learning pipelines, further experiments are needed.</p>
      </sec>
      <sec>
        <title>Future Prospects</title>
        <p>The proposed FHIR-DHP pipeline highlights the therein featured essential data standardization stages and holds the potential to becoming an interoperable harmonization system with an AI-friendly data format. FHIR-DHP enables interoperability and cooperation between clinical institutions and a rapid patient cohort identification for clinical trials; it also unlocks the potential of big medical data.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>We provide a comprehensive approach to transforming unstandardized EHR data into a harmonized multilayered nested FHIR format and then to a more readable and more efficient AI-friendly JSON structure. We developed a 5-stage data harmonization pipeline, which includes validation checks. The AI-friendly format of hospital data allows the generic and fast integration of both AI and patient cohort identification algorithms. Harmonized and standardized health care data are of great value to advancing efficiency in big data processing, cooperation, and multicenter data exchange in the clinical sector, boosting medical research, patient care, and clinical trial cohort identification. The next steps would include validating our approach in a hospital environment and applying a privacy-preserving FL framework to make use of advanced AI deployment.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Transformation of data saved in custom JSON to tensor format.</p>
        <media xlink:href="medinform_v11i1e43847_app1.docx" xlink:title="DOCX File , 998 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AI</term>
          <def>
            <p>artificial intelligence</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">DB</term>
          <def>
            <p>database</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">DHP</term>
          <def>
            <p>data harmonization pipeline</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">EHR</term>
          <def>
            <p>Electronic Health Record</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">FHIR</term>
          <def>
            <p>Fast Healthcare Interoperability Resources</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">FL</term>
          <def>
            <p>federated learning</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">MIMIC</term>
          <def>
            <p>Medical Information Mart for Intensive Care</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This work was partially funded by the German Federal Ministry of Education and Research under Grant 16SV8559.</p>
    </ack>
    <notes>
      <sec>
        <title>Availability of Data and Materials</title>
        <p>The MIMIC IV database used in this study is openly available to credentialed users who sign the “Data Use Agreement” at PhysioNet website [<xref ref-type="bibr" rid="ref20">20</xref>]. The code is not publicly available due to privacy, but a demo is available from the corresponding author on request.</p>
      </sec>
    </notes>
    <fn-group>
      <fn fn-type="con">
        <p>EW, SN, MK, JR, and AM were responsible for the study conception; EW and MK took part in data analysis; EW, SN, and EM created the figures; EW, MK, AM, and SN were responsible for methods. EW, EM, JR, and SAIK wrote the draft; BA, JB, PVB, JC, ARF, ASP, and NS reviewed and revised the work.</p>
      </fn>
      <fn fn-type="conflict">
        <p>FB reports grants from the German Federal Ministry of Education and Research, German Federal Ministry of Health, Berlin Institute of Health, personal fees from Elsevier Publishing, grants from Hans Böckler Foundation, other from Robert Koch Institute, grants from Einstein Foundation, grants from Berlin University Alliance, personal fees from Medtronic and personal fees from GE Healthcare.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Au-Yeung</surname>
              <given-names>WM</given-names>
            </name>
            <name name-style="western">
              <surname>Sahani</surname>
              <given-names>AK</given-names>
            </name>
            <name name-style="western">
              <surname>Isselbacher</surname>
              <given-names>EM</given-names>
            </name>
            <name name-style="western">
              <surname>Armoundas</surname>
              <given-names>AA</given-names>
            </name>
          </person-group>
          <article-title>Reduction of false alarms in the intensive care unit using an optimized machine learning based approach</article-title>
          <source>NPJ Digit Med</source>
          <year>2019</year>
          <volume>2</volume>
          <fpage>86</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41746-019-0160-7"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41746-019-0160-7</pub-id>
          <pub-id pub-id-type="medline">31508497</pub-id>
          <pub-id pub-id-type="pii">160</pub-id>
          <pub-id pub-id-type="pmcid">PMC6728371</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Desautels</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Calvert</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hoffman</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Jay</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kerem</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Shieh</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Shimabukuro</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Chettipally</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Feldman</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Barton</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wales</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Das</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Prediction of Sepsis in the Intensive Care Unit With Minimal Electronic Health Record Data: A Machine Learning Approach</article-title>
          <source>JMIR Med Inform</source>
          <year>2016</year>
          <month>09</month>
          <day>30</day>
          <volume>4</volume>
          <issue>3</issue>
          <fpage>e28</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2016/3/e28/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/medinform.5909</pub-id>
          <pub-id pub-id-type="medline">27694098</pub-id>
          <pub-id pub-id-type="pii">v4i3e28</pub-id>
          <pub-id pub-id-type="pmcid">PMC5065680</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Maier</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Kapsner</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Mate</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Prokosch</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Kraus</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Patient Cohort Identification on Time Series Data Using the OMOP Common Data Model</article-title>
          <source>Appl Clin Inform</source>
          <year>2021</year>
          <month>01</month>
          <day>27</day>
          <volume>12</volume>
          <issue>1</issue>
          <fpage>57</fpage>
          <lpage>64</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.thieme-connect.com/DOI/DOI?10.1055/s-0040-1721481"/>
          </comment>
          <pub-id pub-id-type="doi">10.1055/s-0040-1721481</pub-id>
          <pub-id pub-id-type="medline">33506478</pub-id>
          <pub-id pub-id-type="pmcid">PMC7840432</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ni</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wright</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Perentesis</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lingren</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Deleger</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Kaiser</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kohane</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Solti</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Increasing the efficiency of trial-patient matching: automated clinical trial eligibility pre-screening for pediatric oncology patients</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2015</year>
          <month>04</month>
          <day>14</day>
          <volume>15</volume>
          <issue>1</issue>
          <fpage>28</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/s12911-015-0149-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12911-015-0149-3</pub-id>
          <pub-id pub-id-type="medline">25881112</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12911-015-0149-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC4407835</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>de Mello</surname>
              <given-names>BH</given-names>
            </name>
            <name name-style="western">
              <surname>Rigo</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>da Costa</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>da Rosa Righi</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Donida</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Bez</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Schunke</surname>
              <given-names>LC</given-names>
            </name>
          </person-group>
          <article-title>Semantic interoperability in health records standards: a systematic literature review</article-title>
          <source>Health Technol (Berl)</source>
          <year>2022</year>
          <volume>12</volume>
          <issue>2</issue>
          <fpage>255</fpage>
          <lpage>272</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35103230"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s12553-022-00639-w</pub-id>
          <pub-id pub-id-type="medline">35103230</pub-id>
          <pub-id pub-id-type="pii">639</pub-id>
          <pub-id pub-id-type="pmcid">PMC8791650</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kiourtis</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mavrogiorgou</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Menychtas</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Maglogiannis</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Kyriazis</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Structurally Mapping Healthcare Data to HL7 FHIR through Ontology Alignment</article-title>
          <source>J Med Syst</source>
          <year>2019</year>
          <month>02</month>
          <day>05</day>
          <volume>43</volume>
          <issue>3</issue>
          <fpage>62</fpage>
          <pub-id pub-id-type="doi">10.1007/s10916-019-1183-y</pub-id>
          <pub-id pub-id-type="medline">30721349</pub-id>
          <pub-id pub-id-type="pii">10.1007/s10916-019-1183-y</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pagano</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Candela</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Castelli</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Data Interoperability</article-title>
          <source>Data Sci. J</source>
          <year>2013</year>
          <volume>12</volume>
          <fpage>GRDI19</fpage>
          <lpage>GRDI25</lpage>
          <pub-id pub-id-type="doi">10.2481/dsj.GRDI-004</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rahm</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Bernstein</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>A Survey of Approaches to Automatic Schema Matching</article-title>
          <source>VLDB J</source>
          <year>2001</year>
          <volume>10</volume>
          <fpage>334</fpage>
          <lpage>350</lpage>
          <pub-id pub-id-type="doi">10.1007/s007780100057</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kolaitischema</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>data</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>metadata</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Schema mappings, data exchange, and metadata management</article-title>
          <year>2005</year>
          <conf-name>Proceedings of the ACM SIGACT-SIGMOD-SIGART Symposium on Principles of Database Systems</conf-name>
          <conf-date>June 13-15, 2005</conf-date>
          <conf-loc>Baltimore, USA</conf-loc>
          <fpage>61</fpage>
          <lpage>76</lpage>
          <pub-id pub-id-type="doi">10.1145/1065167.1065176</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="web">
          <article-title>Welcome to FHIR</article-title>
          <source>HL7.org</source>
          <access-date>2023-02-15</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.hl7.org/fhir/">https://www.hl7.org/fhir/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vorisek</surname>
              <given-names>CN</given-names>
            </name>
            <name name-style="western">
              <surname>Lehne</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Klopfenstein</surname>
              <given-names>SAI</given-names>
            </name>
            <name name-style="western">
              <surname>Mayer</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Bartschke</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Haese</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Thun</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Fast Healthcare Interoperability Resources (FHIR) for Interoperability in Health Research: Systematic Review</article-title>
          <source>JMIR Med Inform</source>
          <year>2022</year>
          <month>07</month>
          <day>19</day>
          <volume>10</volume>
          <issue>7</issue>
          <fpage>e35724</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2022/7/e35724/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/35724</pub-id>
          <pub-id pub-id-type="medline">35852842</pub-id>
          <pub-id pub-id-type="pii">v10i7e35724</pub-id>
          <pub-id pub-id-type="pmcid">PMC9346559</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Martín</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ashish</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Paul</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Eugene</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Zhifeng</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Craig</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Greg</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Davis</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Dean</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Devin</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ghemawat</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Goodfellow</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Harp</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Irving</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Isard</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Jia</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Jozefowicz</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Kaiser</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Kudlur</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Levenberg</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Mane</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Monga</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Moore</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Murray</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Olah</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Schuster</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Shlens</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Steiner</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Sutskever</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Talwar</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Tucker</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Vanhoucke</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Vasudevan</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Viegas</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Vinyals</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Warden</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Wattenberg</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Wicke</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>TensorFlow: Large-Scale Machine Learning on Heterogeneous Systems</article-title>
          <source>arXiv</source>
          <year>2016</year>
          <fpage>1</fpage>
          <lpage>19</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Paszke</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gross</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Massa</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Lerer</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bradbury</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chanan</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Killeen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Gimelshein</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Antiga</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Desmaison</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Köpf</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>DeVito</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Raison</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Chilamkurthy</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Steiner</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Fang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Bai</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chintala</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>PyTorch: An Imperative Style, High-Performance Deep Learning Library</article-title>
          <source>NeurIPS Proceedings</source>
          <access-date>2023-02-15</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://proceedings.neurips.cc/paper/2019/file/bdbca288fee7f92f2bfa9f7012727740-Paper.pdf">https://proceedings.neurips.cc/paper/2019/file/bdbca288fee7f92f2bfa​9f7012727740-Paper.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Sahu</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Ignatov</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Gottlieb</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Mandl</surname>
              <given-names>KD</given-names>
            </name>
          </person-group>
          <article-title>High Performance Computing on Flat FHIR Files Created with the New SMART/HL7 Bulk Data Access Standard</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2019</year>
          <volume>2019</volume>
          <fpage>592</fpage>
          <lpage>596</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32308853"/>
          </comment>
          <pub-id pub-id-type="medline">32308853</pub-id>
          <pub-id pub-id-type="pmcid">PMC7153160</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Oehm</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Storck</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Fechner</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Brix</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Yildirim</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Dugas</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>FhirExtinguisher: A FHIR Resource Flattening Tool Using FHIRPath</article-title>
          <source>Stud Health Technol Inform</source>
          <year>2021</year>
          <month>05</month>
          <day>27</day>
          <volume>281</volume>
          <fpage>1112</fpage>
          <lpage>1113</lpage>
          <pub-id pub-id-type="doi">10.3233/SHTI210369</pub-id>
          <pub-id pub-id-type="medline">34042862</pub-id>
          <pub-id pub-id-type="pii">SHTI210369</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Suominen</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Gedeon</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Adapting State-of-the-Art Deep Language Models to Clinical Information Extraction Systems: Potentials, Challenges, and Solutions</article-title>
          <source>JMIR Med Inform</source>
          <year>2019</year>
          <month>04</month>
          <day>25</day>
          <volume>7</volume>
          <issue>2</issue>
          <fpage>e11499</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2019/2/e11499/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/11499</pub-id>
          <pub-id pub-id-type="medline">31021325</pub-id>
          <pub-id pub-id-type="pii">v7i2e11499</pub-id>
          <pub-id pub-id-type="pmcid">PMC6658232</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zong</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Wen</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Stone</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Sharma</surname>
              <given-names>DK</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Shi</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Developing an FHIR-Based Computational Pipeline for Automatic Population of Case Report Forms for Colorectal Cancer Clinical Trials Using Electronic Health Records</article-title>
          <source>JCO Clinical Cancer Informatics</source>
          <year>2020</year>
          <month>11</month>
          <issue>4</issue>
          <fpage>201</fpage>
          <lpage>209</lpage>
          <pub-id pub-id-type="doi">10.1200/cci.19.00116</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mittelstadt</surname>
              <given-names>BD</given-names>
            </name>
            <name name-style="western">
              <surname>Floridi</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>The Ethics of Big Data: Current and Foreseeable Issues in Biomedical Contexts</article-title>
          <source>Sci Eng Ethics</source>
          <year>2016</year>
          <month>04</month>
          <volume>22</volume>
          <issue>2</issue>
          <fpage>303</fpage>
          <lpage>41</lpage>
          <pub-id pub-id-type="doi">10.1007/s11948-015-9652-2</pub-id>
          <pub-id pub-id-type="medline">26002496</pub-id>
          <pub-id pub-id-type="pii">10.1007/s11948-015-9652-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Denney</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Long</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Armistead</surname>
              <given-names>MG</given-names>
            </name>
            <name name-style="western">
              <surname>Anderson</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Conway</surname>
              <given-names>BN</given-names>
            </name>
          </person-group>
          <article-title>Validating the extract, transform, load process used to populate a large clinical research database</article-title>
          <source>Int J Med Inform</source>
          <year>2016</year>
          <month>10</month>
          <volume>94</volume>
          <fpage>271</fpage>
          <lpage>4</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/27506144"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2016.07.009</pub-id>
          <pub-id pub-id-type="medline">27506144</pub-id>
          <pub-id pub-id-type="pii">S1386-5056(16)30170-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC5556907</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bulgarelli</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Pollard</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Horng</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Celi</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Mark</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>MIMIC-IV</article-title>
          <source>PhysioNet</source>
          <year>2021</year>
          <volume>101</volume>
          <issue>23</issue>
          <fpage>e215</fpage>
          <lpage>e220</lpage>
          <pub-id pub-id-type="doi">10.13026/s6n6-xd98</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Islam</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>FHIR® Resources</article-title>
          <source>GitHub</source>
          <access-date>2023-02-15</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/nazrulworld/fhir.resources">https://github.com/nazrulworld/fhir.resources</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="web">
          <article-title>PostgreSQL: The World's Most Advanced Open Source Relational Database</article-title>
          <source>PostgreSQL Global Development Group</source>
          <access-date>2023-02-15</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.postgresql.org">https://www.postgresql.org</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>McKinney</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Data Structures for Statistical Computing in Python</article-title>
          <source>SciPy.org</source>
          <year>2010</year>
          <access-date>2023-02-14</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://conference.scipy.org/proceedings/scipy2010/pdfs/mckinney.pdf">https://conference.scipy.org/proceedings/scipy2010/pdfs/mckinney.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hong</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Wen</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Sohn</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Developing a scalable FHIR-based clinical data normalization pipeline for standardizing and integrating unstructured and structured electronic health record data</article-title>
          <source>JAMIA Open</source>
          <year>2019</year>
          <month>12</month>
          <volume>2</volume>
          <issue>4</issue>
          <fpage>570</fpage>
          <lpage>579</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32025655"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamiaopen/ooz056</pub-id>
          <pub-id pub-id-type="medline">32025655</pub-id>
          <pub-id pub-id-type="pii">ooz056</pub-id>
          <pub-id pub-id-type="pmcid">PMC6993992</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Konečný</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>McMahan</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Ramage</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Richtárik</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Federated Optimization: Distributed Machine Learning for On-Device Intelligence</article-title>
          <source>arXiv</source>
          <year>2016</year>
          <month>10</month>
          <day>8</day>
          <fpage>1</fpage>
          <lpage>38</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://arxiv.org/abs/1610.02527"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ulrich</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Behrend</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Wiedekopf</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Drenkhahn</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Kock-Schoppenhauer</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ingenerf</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Hands on the Medical Informatics Initiative Core Data Set - Lessons Learned from Converting the MIMIC-IV</article-title>
          <source>Stud Health Technol Inform</source>
          <year>2021</year>
          <month>09</month>
          <day>21</day>
          <volume>283</volume>
          <fpage>119</fpage>
          <lpage>126</lpage>
          <pub-id pub-id-type="doi">10.3233/SHTI210549</pub-id>
          <pub-id pub-id-type="medline">34545827</pub-id>
          <pub-id pub-id-type="pii">SHTI210549</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bennett</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Wiedekopf</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ulrich</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>MIMIC-IV Clinical Database Demo on FHIR (version 2)</article-title>
          <source>PhysioNet</source>
          <year>2022</year>
          <fpage>e-215</fpage>
          <lpage>e-220</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shimabukuro</surname>
              <given-names>DW</given-names>
            </name>
            <name name-style="western">
              <surname>Barton</surname>
              <given-names>CW</given-names>
            </name>
            <name name-style="western">
              <surname>Feldman</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Mataraso</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Das</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Effect of a machine learning-based severe sepsis prediction algorithm on patient survival and hospital length of stay: a randomised clinical trial</article-title>
          <source>BMJ Open Respir Res</source>
          <year>2017</year>
          <volume>4</volume>
          <issue>1</issue>
          <fpage>e000234</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmjopenrespres.bmj.com/lookup/pmidlookup?view=long&#38;pmid=29435343"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmjresp-2017-000234</pub-id>
          <pub-id pub-id-type="medline">29435343</pub-id>
          <pub-id pub-id-type="pii">bmjresp-2017-000234</pub-id>
          <pub-id pub-id-type="pmcid">PMC5687546</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sarmiento</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Dernoncourt</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Improving Patient Cohort Identification Using Natural Language Processing</article-title>
          <source>Data MITC</source>
          <year>2016</year>
          <fpage>405</fpage>
          <pub-id pub-id-type="doi">10.1007/978-3-319-43742-2_28</pub-id>
          <pub-id pub-id-type="medline">31314253</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Carayon</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Health Care 4.0: A Vision for Smart and Connected Health Care</article-title>
          <source>IISE Trans Healthc Syst Eng</source>
          <year>2021</year>
          <month>02</month>
          <day>15</day>
          <volume>11</volume>
          <issue>3</issue>
          <fpage>171</fpage>
          <lpage>180</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34497970"/>
          </comment>
          <pub-id pub-id-type="doi">10.1080/24725579.2021.1884627</pub-id>
          <pub-id pub-id-type="medline">34497970</pub-id>
          <pub-id pub-id-type="pmcid">PMC8423174</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
