<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id><journal-id journal-id-type="publisher-id">medinform</journal-id><journal-id journal-id-type="index">7</journal-id><journal-title>JMIR Medical Informatics</journal-title><abbrev-journal-title>JMIR Med Inform</abbrev-journal-title><issn pub-type="epub">2291-9694</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v12i1e49542</article-id><article-id pub-id-type="doi">10.2196/49542</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Transforming Primary Care Data Into the Observational Medical Outcomes Partnership Common Data Model: Development and Usability Study</article-title></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Fruchart</surname><given-names>Mathilde</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Quindroit</surname><given-names>Paul</given-names></name><degrees>PhD, RN</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Jacquemont</surname><given-names>Chlo&#x00E9;</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Beuscart</surname><given-names>Jean-Baptiste</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Calafiore</surname><given-names>Matthieu</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Lamer</surname><given-names>Antoine</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff3">3</xref></contrib></contrib-group><aff id="aff1"><institution>Univ Lille, CHU Lille, ULR 2694 - METRICS: &#x00C9;valuation des Technologies de sant&#x00E9; et des, Pratiques m&#x00E9;dicales</institution>, <addr-line>2 Place de Verdun</addr-line><addr-line>Lille</addr-line>, <country>France</country></aff><aff id="aff2"><institution>D&#x00E9;partement de M&#x00E9;decine G&#x00E9;n&#x00E9;rale, University of Lille</institution>, <addr-line>Lille</addr-line>, <country>France</country></aff><aff id="aff3"><institution>F2RSM Psy - F&#x00E9;d&#x00E9;ration r&#x00E9;gionale de recherche en psychiatrie et sant&#x00E9; mentale Hauts-de-France</institution>, <addr-line>Saint-Andr&#x00E9;-Lez-Lille</addr-line>, <country>France</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Lovis</surname><given-names>Christian</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Sylvestre</surname><given-names>Emmanuelle</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Ahmadi</surname><given-names>Najia</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Mathilde Fruchart, MSc, Univ Lille, CHU Lille, ULR 2694 - METRICS: &#x00C9;valuation des Technologies de sant&#x00E9; et des, Pratiques m&#x00E9;dicales, 2 Place de Verdun, Lille, F-59000, France; <email>mathilde.fruchart@univ-lille.fr</email></corresp></author-notes><pub-date pub-type="collection"><year>2024</year></pub-date><pub-date pub-type="epub"><day>13</day><month>8</month><year>2024</year></pub-date><volume>12</volume><elocation-id>e49542</elocation-id><history><date date-type="received"><day>01</day><month>06</month><year>2023</year></date><date date-type="rev-recd"><day>11</day><month>04</month><year>2024</year></date><date date-type="accepted"><day>11</day><month>04</month><year>2024</year></date></history><copyright-statement>&#x00A9; Mathilde Fruchart, Paul Quindroit, Chlo&#x00E9; Jacquemont, Jean-Baptiste Beuscart, Matthieu Calafiore, Antoine Lamer. Originally published in JMIR Medical Informatics (<ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org">https://medinform.jmir.org</ext-link>), 13.8.2024. </copyright-statement><copyright-year>2024</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org/">https://medinform.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://medinform.jmir.org/2024/1/e49542"/><abstract><sec><title>Background</title><p>Patient-monitoring software generates a large amount of data that can be reused for clinical audits and scientific research. The Observational Health Data Sciences and Informatics (OHDSI) consortium developed the Observational Medical Outcomes Partnership (OMOP) Common Data Model (CDM) to standardize electronic health record data and promote large-scale observational and longitudinal research.</p></sec><sec><title>Objective</title><p>This study aimed to transform primary care data into the OMOP CDM format.</p></sec><sec sec-type="methods"><title>Methods</title><p>We extracted primary care data from electronic health records at a multidisciplinary health center in Wattrelos, France. We performed structural mapping between the design of our local primary care database and the OMOP CDM tables and fields. Local French vocabularies concepts were mapped to OHDSI standard vocabularies. To validate the implementation of primary care data into the OMOP CDM format, we applied a set of queries. A practical application was achieved through the development of a dashboard.</p></sec><sec sec-type="results"><title>Results</title><p>Data from 18,395 patients were implemented into the OMOP CDM, corresponding to 592,226 consultations over a period of 20 years. A total of 18 OMOP CDM tables were implemented. A total of 17 local vocabularies were identified as being related to primary care and corresponded to patient characteristics (sex, location, year of birth, and race), units of measurement, biometric measures, laboratory test results, medical histories, and drug prescriptions. During semantic mapping, 10,221 primary care concepts were mapped to standard OHDSI concepts. Five queries were used to validate the OMOP CDM by comparing the results obtained after the completion of the transformations with the results obtained in the source software. Lastly, a prototype dashboard was developed to visualize the activity of the health center, the laboratory test results, and the drug prescription data.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>Primary care data from a French health care facility have been implemented into the OMOP CDM format. Data concerning demographics, units, measurements, and primary care consultation steps were already available in OHDSI vocabularies. Laboratory test results and drug prescription data were mapped to available vocabularies and structured in the final model. A dashboard application provided health care professionals with feedback on their practice.</p></sec></abstract><kwd-group><kwd>data reuse</kwd><kwd>Observational Medical Outcomes Partnership</kwd><kwd>common data model</kwd><kwd>data warehouse</kwd><kwd>reproducible research</kwd><kwd>primary care</kwd><kwd>dashboard</kwd><kwd>electronic health record</kwd><kwd>patient tracking system</kwd><kwd>patient monitoring</kwd><kwd>EHR</kwd><kwd>primary care data</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>The digitalization of health care organizations has made it possible to automatically collect and reuse data from electronic health records (EHRs) for care, administrative, and research purposes [<xref ref-type="bibr" rid="ref1">1</xref>]. Data reuse generally relies on extracting data from source databases, formatting and normalizing it in a data warehouse [<xref ref-type="bibr" rid="ref2">2</xref>-<xref ref-type="bibr" rid="ref5">5</xref>]. Over the last few years, hospital-based data warehouses have started to provide comprehensive overviews of patient management during a hospital stay or on a hospital ward. However, these data warehouses do not contain data on primary care or other data not related to the hospital stay. These data cover first-line services&#x2014;outpatient care provided in local practices, including general practice, community pharmacy, dental care, and optometry [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref7">7</xref>]. Additionally, data from all individuals covered by the French national health insurance scheme are anonymously and prospectively included in the national claims database [<xref ref-type="bibr" rid="ref8">8</xref>]. These data are used for reimbursement purposes and are not clinical.</p><p>The reuse of EHR data is now a major topic of interest for hospital care [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>] and primary care [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref11">11</xref>]. Several research groups have retrospectively reused primary care data on patients with neuromuscular diseases [<xref ref-type="bibr" rid="ref12">12</xref>], diabetes [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref13">13</xref>], dermatological diseases [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref15">15</xref>], lung diseases [<xref ref-type="bibr" rid="ref16">16</xref>], cancer [<xref ref-type="bibr" rid="ref17">17</xref>], or urinary tract infections [<xref ref-type="bibr" rid="ref18">18</xref>] or on older adult patients [<xref ref-type="bibr" rid="ref19">19</xref>]. Several national projects aim to collect primary care data on a routine basis. The main primary care projects are the Clinical Practice Research Datalink and The Health Improvement Network in the United Kingdom [<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref21">21</xref>], the Veterans Administration data warehouses in the United States [<xref ref-type="bibr" rid="ref22">22</xref>], and the Canadian Primary Care Sentinel Surveillance Network in Canada [<xref ref-type="bibr" rid="ref23">23</xref>]. Nevertheless, the reuse of health care data (and especially primary care data) faces many challenges [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref24">24</xref>-<xref ref-type="bibr" rid="ref27">27</xref>]. The abovementioned projects collect data from millions of patients by implementing local data models. A UK project uses a national database (BioBank) to standardize vaccination data into a common data model (CDM) format [<xref ref-type="bibr" rid="ref28">28</xref>].</p><p>The heterogeneous structure of the data and the use of country- and facility-specific vocabularies create barriers to the implementation of multicenter studies and the sharing of data, methods, and results. Initiatives such as those proposed by the Observational Health Data Sciences and Informatics (OHDSI) consortium seek to (1) standardize data structure and vocabularies; (2) promote reproducible research and collaboration; and (3) share methods, tools, and results [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref30">30</xref>]. The OHDSI has notably developed the Observational Medical Outcomes Partnership (OMOP) CDM [<xref ref-type="bibr" rid="ref31">31</xref>] and provides standard data structures and vocabularies that are independent of individual software developers and countries [<xref ref-type="bibr" rid="ref32">32</xref>].</p><p>Hospital and claims databases have already undergone the mapping process to adopt the OMOP CDM format [<xref ref-type="bibr" rid="ref33">33</xref>-<xref ref-type="bibr" rid="ref35">35</xref>]. Nevertheless, primary care data, specifically general practice data, which serve as a valuable addition to hospital and claims databases, are still rarely being integrated into the OMOP CDM format.</p><p>Data standardization might facilitate the development of common tools for health care professionals, such as activity dashboards and software for managing multicenter research projects. Hence, the primary objective of this study (part of the Primary Care Data Warehouse [PriCaDa] project) was to transform primary care data into the OMOP CDM format.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Overview</title><p>The goal of the PriCaDa project is to reuse primary care data and to provide an overview of the practices of health care professionals working in primary care (family physicians, nurses, and pharmacists).</p><p>In this study, we used primary care data from a multidisciplinary health center (MHC) located in the town of Wattrelos, France, in collaboration with the software company that produced the MHC&#x2019;s EHR software (Weda). Weda ranks third in terms of sales volume, boasting over 20,000 health care professionals in France as users [<xref ref-type="bibr" rid="ref36">36</xref>]. We used an extract-transform-load (ETL) process to create a data warehouse (<xref ref-type="fig" rid="figure1">Figure 1</xref>), using Python and SQL scripts. The data warehouse was stored in a PostgreSQL database, using version 5.4 of the OMOP CDM [<xref ref-type="bibr" rid="ref31">31</xref>]. The first step in the ETL process was to extract, classify, and normalize entities from the XML files. The database was then scanned and assessed with the OHDSI tool White Rabbit [<xref ref-type="bibr" rid="ref37">37</xref>] to create a report on each raw table, attribute, and data type. The OHDSI tool Rabbit In A Hat was then used to implement the specifications of the structural mapping, which aims to associate each local table and local column to the corresponding OMOP nomenclature [<xref ref-type="bibr" rid="ref38">38</xref>]. Then, transformation steps normalize the structure and the semantic of the data source to the OMOP CDM format. The final step is to load the data into the OMOP CDM. The development of a dashboard was proposed for a practical application.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Pipeline of the primary care data transformation into the OMOP CDM. CDM: Common Data Model; ETL: extract-transform-load; OMOP: Observational Medical Outcomes Partnership.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v12i1e49542_fig01.png"/></fig></sec><sec id="s2-2"><title>Ethical Considerations</title><p>The study was approved by the staff at the MHC in Wattrelos and the management of the Weda software house. Furthermore, the study was registered with the French National Data Protection Commission (<italic>Commission nationale de l&#x2019;informatique et des libert&#x00E9;s</italic>; reference 2022&#x2010;203). In line with the French legislation on retrospective studies of anonymized data from routine clinical practice, approval by an institutional review board was not required [<xref ref-type="bibr" rid="ref39">39</xref>]. All the data collection and analysis methods complied with relevant guidelines and regulations. Patient confidentiality was maintained at all times, and all the data were anonymized before extraction. The Weda software exports data with an identifier for each patient and consultation. This identifier is replaced during the transformations with a unique artificial ID. For this unique ID, sequences provided by the database management system (ie, PostgreSQL) were generally used to create an autoincrement primary key.</p></sec><sec id="s2-3"><title>Data Extraction</title><p>Following approval by the MHC&#x2019;s staff, Weda exported an XML-based hierarchical structure file for each patient. A primary care consultation occurs in 4 steps. At each step, the family physician collects data on the patient&#x2019;s health status. In step one (arrival), the reason for consultation is recorded as free text. In step two (the interview), the physician records clinical signs and symptoms as free text. In step three (the examination), the physician makes biometric measurements and enters the data in a structured way in the appropriate fields of the software (variables, values, and units). Step four (the outcome) includes the diagnosis (if made, as free text), any drug prescriptions (documented with the <italic>Code Identifiant de Sp&#x00E9;cialit&#x00E9;</italic> [CIP; the French national drug code]), any referrals (as free text in a PDF letter), and information on vaccinations. The parts of the Weda software dedicated to these steps depend on the physician&#x2019;s habits; some physicians put all observations into a single field.</p><p>Furthermore, the family physician receives laboratory test results from medical laboratories and clinical reports from other specialist physicians. The test variables differ from one medical laboratory to another. For example, one laboratory might use the term &#x201C;creatinine&#x201D; and a specific unit, whereas another might use &#x201C;create&#x201D; and a different unit for the same variable. These reports were documented as free text.</p></sec><sec id="s2-4"><title>Transformation Steps</title><sec id="s2-4-1"><title>Semantic Mapping</title><p>The goal of semantic mapping was to link local vocabularies to standard vocabularies that have been defined by the OHDSI community and are available in an web-based tool [<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref40">40</xref>]. The difficulty of the mapping depends on the vocabularies available in the source data. We defined four difficulty levels: level 1 for local vocabulary items that already belonged to the standard OHDSI vocabulary; level 2 for local, nonstandard vocabulary items for which the mappings to the standard OHDSI vocabulary already existed; level 3 for local vocabulary items that did not correspond to the OHDSI vocabulary but were in a structured format (manual mapping was necessary); and level 4 for local vocabulary items that did not correspond to the OHDSI vocabulary and were in an unstructured format (free text). Natural language processing (NLP) techniques, such as fuzzy matching algorithms, SpaCy tools, and regular expressions, can be used for concept identification and information extraction. The free text (eg, reasons for consultation, symptoms, diagnosis, and clinical reports) was sometimes heterogeneous and unstructured. Indeed, a single free-text record can consolidate various types of information, including the reason for a consultation, the patient&#x2019;s clinical signs, and their diagnosis, all of which may vary based on the practices of the individual family physician.</p><p>For difficulty levels 2 and 3, the data were mapped manually and independently by two experts (MF and CJ). A &#x03BA; score was computed as a statistical metric for assessing the degree of consensus among the annotators tasked with assigning labels to data. It gauges the degree to which the annotators&#x2019; assessments align, while also considering the potential for chance agreement. The score ranges from 0 to 1 (1 for perfect agreement among annotators). A &#x03BA; score below 0.4 indicates weak agreement, a &#x03BA; score above 0.6 (60%) suggests moderate agreement, and a &#x03BA; score exceeding 0.8 (80%) signifies strong agreement [<xref ref-type="bibr" rid="ref41">41</xref>]. Any disagreements were settled by a third expert (PQ). This mapping provided correspondences between the local vocabulary items and standard vocabulary items. When necessary, new primary care concepts not available in the OHDSI vocabularies were loaded into the CONCEPT table. The Logical Observation Identifiers Names and Codes vocabulary was used to map laboratory test variables. The source laboratory test concepts contained the name of the laboratory test variable used by the laboratory, together with the unit. The text referencing the laboratory test variables was cleaned up by grouping equivalent source concepts. Punctuation and special characters were removed, and abbreviations or spelling differences were replaced and grouped under the full name (eg &#x201C;CRP&#x201D; was replaced with &#x201C;C-reactive protein&#x201D;). Chapter numbers or line numbers at the beginning of a line were removed. Multiple spaces were replaced by a single space, and stop words (eg, &#x201C;of,&#x201D; &#x201C;to,&#x201D; or &#x201C;an&#x201D;) were removed. The Systematized Nomenclature of Medicine was used to map biometric variables, with the Unified Code for Units of Measure for units of measurement and the <italic>International Classification of Diseases, 10th Revision</italic> (<italic>ICD-10</italic>) for the patient&#x2019;s medical history. Drug prescriptions were recorded using CIP drug name codes. The CIP code was extracted from the Weda EHR software and mapped to the Anatomical Therapeutic Chemical (ATC) code and then the RxNorm code (ATC to RxNorm mapping is already available in the OMOP CDM).</p><p>The new concepts were integrated into the CONCEPT table with a concept identifier greater than 2,000,000,000. When a local concept is mapped, the correspondence with a standard OMOP concept is loaded into the CONCEPT_RELATIONSHIP table (resulting in a link between a local concept identifier and a OMOP standard concept identifier). As a result, the identifiers of standard concepts can be loaded into the x_concept_id column of the corresponding table for the local concept (eg, new local concepts in the MEASUREMENT table that are mapped are associated with the standard concepts loaded into the measurement_concept_id column).</p></sec><sec id="s2-4-2"><title>Structural Mapping</title><p>The goal of structural mapping was to transform the source structure into the OMOP CDM structure. The mapping comprised two steps. In the first step, the relevant variables required for the OMOP model were selected and normalized in a table format. In the second step, the variables and table structures were transformed to match the OMOP CDM nomenclature. We observed that most of the medical histories were coded as free text, rather than nomenclature items. The DIAGNOSIS source table contained the information from the patient interview (clinical signs), the clinical examination (measurements), and the &#x201C;outcome&#x201D; parts of the consultation. However, this field contained data related to several types of medical information in text format. The MEASUREMENT table contained information from the &#x201C;laboratory data&#x201D; and &#x201C;biometrics&#x201D; source tables. Outliers were removed, and primary and foreign keys were identified. New artificial identifiers were created for the primary key in each table.</p></sec></sec><sec id="s2-5"><title>Data Loading and Quality Assessment</title><p>After the semantic and structural transformations, the data were loaded into the OMOP model. We used Achilles, a data quality assessment and visualization tool developed by the OHDSI community. Achilles reports the compliance of the mapping with the constraints of the OMOP CDM (the primary and foreign keys), the vocabulary (ie, the correct choice of concepts corresponding to each table), and the business rules (ie, rules that ensure data consistency, for example, data chronology respects real life). Based on the Achilles analysis tables, the Atlas server summarizes the results of the data quality assessment in a dashboard [<xref ref-type="bibr" rid="ref42">42</xref>]. Kahn et al [<xref ref-type="bibr" rid="ref43">43</xref>] have developed a data quality framework for the secondary use of EHR data integrated into the Atlas quality assessment dashboard. <italic>Conformance</italic> describes &#x201C;the compliance of the representation of data against internal or external formatting, relational, or computational definitions.&#x201D; <italic>Completeness</italic> computes &#x201C;features that describe the frequencies of data attributes present in a data set without reference to data values.&#x201D; <italic>Plausibility</italic> describes &#x201C;the believability or truthfulness of data values.&#x201D; The data quality assessment context <italic>verification</italic> is a strategy &#x201C;for the source of expectations or comparisons of EHR data based on internal characteristics&#x201D; [<xref ref-type="bibr" rid="ref43">43</xref>].</p><p>To test the relevance and usability of primary care data in the OMOP CDM, we compared the results of several queries of the OMOP CDM with the results obtained directly from the Weda software. The queries were run by a physician (CJ) who used the software in his clinical practice. To ensure that the patient records could be checked manually, the queries were chosen to keep the resulting number of patients low. Two queries corresponded to the MHC&#x2019;s general activity (eg, the number of patients per family physician), two corresponded to prescription data, and a fifth query corresponded to laboratory test data.</p></sec><sec id="s2-6"><title>Practical Application</title><p>Using RShiny and the <italic>shiny</italic>, <italic>shinyBS</italic>, <italic>shinycssloaders</italic>, <italic>shinydashboard</italic>, <italic>shinyjs,</italic> and <italic>shinyWidgets</italic> libraries, we implemented a dashboard to report the MHC&#x2019;s general activity, prescriptions, and the distribution of the laboratory test results [<xref ref-type="bibr" rid="ref44">44</xref>].</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Data Extraction</title><p>The data were extracted in July 2021. The available patient profiles dated back to 1997, and data on clinical measurements, drug prescriptions, and laboratory tests were available from 2013 onward. The extracted data contained 18,395 patient files. Each patient&#x2019;s file contained anonymized demographic information (ie, sex, year of birth, the town or city of residence, and the country of residence), the date of the first consultation, and the name of the family physician with whom the patient was registered. It also contained the patient&#x2019;s medical history (documented with <italic>ICD-10</italic> codes or as free text), information related to the consultation, laboratory test results, and clinical reports from other physicians (also as free text).</p></sec><sec id="s3-2"><title>Transformation</title><sec id="s3-2-1"><title>Semantic Mapping</title><p>In all, 17 vocabularies were mapped (<xref ref-type="table" rid="table1">Table 1</xref>).</p><p>All the new concepts were added to the CONCEPT table (n=10,221). These primary care concepts were added alongside the existing concepts in the OMOP model developed by OHDSI. The mapping between local concepts and standard concepts was integrated into the CONCEPT_RELATIONSHIP table (n=9432).</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>The concept mapping. When a local vocabulary is not given, it means that the concept had to be created.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Feature</td><td align="left" valign="bottom">Local vocabulary</td><td align="left" valign="bottom">OMOP<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup> vocabulary</td><td align="left" valign="bottom">Level of mapping difficulty</td><td align="left" valign="bottom">Concepts, n</td><td align="left" valign="bottom">Mapped concepts, n/N (%)</td><td align="left" valign="bottom">Associated records, n/N (%)</td></tr></thead><tbody><tr><td align="left" valign="top">Care site</td><td align="left" valign="top">&#x2014;<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup></td><td align="left" valign="top">Care site</td><td align="left" valign="top">Level 1</td><td align="left" valign="top">1</td><td align="left" valign="top">1/1 (100)</td><td align="left" valign="top">1/1 (100)</td></tr><tr><td align="left" valign="top">Medical histories</td><td align="left" valign="top"><italic>ICD-10</italic><sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup></td><td align="left" valign="top"><italic>ICD-10</italic></td><td align="left" valign="top">Level 1</td><td align="left" valign="top">83</td><td align="left" valign="top">80/83 (96.4)</td><td align="left" valign="top">2252/2315 (97.3)</td></tr><tr><td align="left" valign="top">Visit</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Visit</td><td align="left" valign="top">Level 1</td><td align="left" valign="top">2</td><td align="left" valign="top">2/2 (100)</td><td align="left" valign="top">592,226/592,226 (100)</td></tr><tr><td align="left" valign="top">Drug</td><td align="left" valign="top">ATC<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td><td align="left" valign="top">RxNorm</td><td align="left" valign="top">Level 2</td><td align="left" valign="top">9070</td><td align="left" valign="top">9100/9100 (100)</td><td align="left" valign="top">684,805/684,805 (100)</td></tr><tr><td align="left" valign="top">Drug</td><td align="left" valign="top">CIP<sup><xref ref-type="table-fn" rid="table1fn5">e</xref></sup> code</td><td align="left" valign="top">ATC</td><td align="left" valign="top">Level 3</td><td align="left" valign="top">9946</td><td align="left" valign="top">9100/9946 (91.5)</td><td align="left" valign="top">684,805/814,772 (84)</td></tr><tr><td align="left" valign="top">Biometric variables</td><td align="left" valign="top">Free text in structured fields</td><td align="left" valign="top">SNOMED<sup><xref ref-type="table-fn" rid="table1fn6">f</xref></sup></td><td align="left" valign="top">Level 3</td><td align="left" valign="top">243</td><td align="left" valign="top">12/243 (4.9)</td><td align="left" valign="top">172,549/179,337 (96.2)</td></tr><tr><td align="left" valign="top">Laboratory test variables</td><td align="left" valign="top">Free text in structured fields</td><td align="left" valign="top">LOINC<sup><xref ref-type="table-fn" rid="table1fn7">g</xref></sup></td><td align="left" valign="top">Level 3</td><td align="left" valign="top">2312</td><td align="left" valign="top">170/2312 (7.4)</td><td align="left" valign="top">829,498/941,522 (88.1)</td></tr><tr><td align="left" valign="top">Measurement units</td><td align="left" valign="top">Free text in structured fields</td><td align="left" valign="top">UCUM<sup><xref ref-type="table-fn" rid="table1fn8">h</xref></sup></td><td align="left" valign="top">Level 3</td><td align="left" valign="top">217</td><td align="left" valign="top">65/217 (30)</td><td align="left" valign="top">863,259/1,120,859 (77)<sup><xref ref-type="table-fn" rid="table1fn9">i</xref></sup></td></tr><tr><td align="left" valign="top">Patient characteristics</td><td align="left" valign="top">Free text in structured fields</td><td align="left" valign="top">Sex</td><td align="left" valign="top">Level 3</td><td align="left" valign="top">2</td><td align="left" valign="top">2/2 (100)</td><td align="left" valign="top">18,395/18,395 (100)</td></tr><tr><td align="left" valign="top">Outcome (diagnosis)</td><td align="left" valign="top">Free text</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Level 4</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Consultation (reason)</td><td align="left" valign="top">Free text</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Level 4</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Examination (measure taken)</td><td align="left" valign="top">Free text</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Level 4</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Clinical report by another physician</td><td align="left" valign="top">Free text</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Level 4</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Medical history</td><td align="left" valign="top">Free text</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Level 4</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Referrals</td><td align="left" valign="top">Free text</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Level 4</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Supplementary information</td><td align="left" valign="top">Free text</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Level 4</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Vaccine prescription</td><td align="left" valign="top">Free text</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Level 4</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Vaccination</td><td align="left" valign="top">Free text</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Level 4</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>OMOP: Observational Medical Outcomes Partnership.</p></fn><fn id="table1fn2"><p><sup>b</sup>Not applicable.</p></fn><fn id="table1fn3"><p><sup>c</sup><italic>ICD-10: International Classification of Diseases, 10th Revision.</italic></p></fn><fn id="table1fn4"><p><sup>d</sup>ATC: Anatomical Therapeutic Chemical.</p></fn><fn id="table1fn5"><p><sup>e</sup>CIP: <italic>Code Identifiant de Sp&#x00E9;cialit&#x00E9;</italic> (the French national drug code).</p></fn><fn id="table1fn6"><p><sup>f</sup>SNOMED: Systematized Nomenclature of Medicine.</p></fn><fn id="table1fn7"><p><sup>g</sup>LOINC: Logical Observation Identifiers Names and Codes.</p></fn><fn id="table1fn8"><p><sup>h</sup>UCUM: Unified Code for Units of Measure.</p></fn><fn id="table1fn9"><p><sup>i</sup>23% (257,801/1,120,859) not available.</p></fn></table-wrap-foot></table-wrap><p>More than 80% (9100/9946, 91.5%) of the drug records and more than 90% (80/83, 96.4%) of the <italic>ICD-10</italic>&#x2013;coded medical history records were mapped. Less than 4.9% (12/243) of the biometric measurement concepts were mapped; the latter accounted for 96.2% (172,549/179,337) of the records because a small number of concepts were used (eg, weight, height, and heart rate; <xref ref-type="table" rid="table1">Table 1</xref>). The remaining records were free-text and family physician&#x2013;dependent variables. The writing style can vary and the same variable can be asked in several ways. For example, to find out whether the patient is a smoker, the family physician can input the information in the family physician&#x2013;dependent variable &#x201C;does my patient smoke?&#x201D; &#x201C;is he a smoker?&#x201D; or &#x201C;do you smoke?&#x201D;</p><p>For level 3 mapping difficulties, drug-related concepts (coded as CIP codes) were mapped in two steps. RxNorm is the standard classification chosen by OHDSI for the OMOP model, and therefore, we had to map our local terminology (ie, CIP) to RxNorm. First, the CIP codes were mapped to the ATC codes. Second, the ATC codes were mapped to the RxNorm codes, using the correspondences already implemented in the CONCEPT_RELATIONSHIP table.</p><p>With regard to the laboratory test variables, the cleaning step reduced the number of concepts from 3003 to 2312. We restricted the mapping to the most frequently cited laboratory test concepts in the MEASUREMENT table, with the aim of covering more than 80% of the records. Disagreements over laboratory test concept mapping by experts were resolved by consensus and the involvement of a third annotator. The experts disagreed about 24.3% (37/152) of the mapped concepts, which corresponds to a &#x03BA; score of 75%.</p></sec><sec id="s3-2-2"><title>Structural Mapping</title><p>Several XML tables in the source model corresponded to tables in the OMOP CDM format (<xref ref-type="fig" rid="figure2">Figure 2</xref>). Information about the patient, the family physician, the profile creation date, and the health care center was stored in the PERSON, PROVIDER, OBSERVATION_PERIOD, and CARE_SITE tables, respectively. The medical history (documented with <italic>ICD-10</italic> codes) was stored in the OBSERVATION table. Each consultation at the health care center corresponded to a record in the VISIT_OCCURRENCE table, identified by a visit_concept_id (A<italic>mbulatory Primary Care Clinic/Center</italic>; concept_id=38004247). Biometric measurements were stored in the MEASUREMENT table, with a concept type corresponding to <italic>EHR physical examination</italic>. Laboratory test results were stored in the MEASUREMENT table, with a concept type <italic>Lab</italic> (concept_id=32,856). The feature measurement_source_type_id distinguishes each source table (laboratory data or biometrics measurements). Each drug prescription was stored in the DRUG_EXPOSURE table. Free-text information collected during the consultation was stored in the NOTE table with an appropriate source vocabulary concept identifier (eg, a note of clinical signs; the reason for the consultation; medical histories; the outcome of the consultation; and, in some cases, the associated diagnosis). Medical reports from a specialist physician not based in the MHC were recorded in the NOTE table (<xref ref-type="fig" rid="figure2">Figure 2</xref>).</p><p>All the standard concept types used to identify information in the various source tables are detailed in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>; for example, the NOTE table contains information about the reason for the consultation, the patient&#x2019;s medical history, and other medical reports.</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Structural mapping of each source variable to the OMOP CDM format. Common Data Model; OMOP: Observational Medical Outcomes Partnership.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v12i1e49542_fig02.png"/></fig></sec></sec><sec id="s3-3"><title>Data Loading and Quality Assessments</title><p>Records spanning 20 years (592,226 consultations by 18,395 patients) were integrated into the OMOP CDM. The numbers of records per OMOP table before and after the ETL process and the related computing time are reported (<xref ref-type="table" rid="table2">Table 2</xref>). The CARE_SITE and DRUG_ERA tables were implemented using data transformed into the OMOP format.</p><p>The Atlas Server dashboard produced the data distributions for each table. An example of the distribution of blood potassium concentrations is shown in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>.</p><p>The Atlas dashboard&#x2019;s overview tab provided a top-level summary of the total number of passes and failures by Kahn category (<xref ref-type="fig" rid="figure3">Figure 3</xref>). We found 28 <italic>Conformance</italic> failures that did not respect the specifications of the OMOP CDM. There were 21 <italic>Completeness</italic> failures related to potentially missing data and 23 failures related to <italic>Plausibility</italic> for implausible dates or measurement values. For each of these failures, the results tab (<xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>) displayed one line per <italic>verification</italic>.</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>The volume of each table before and after the ETL<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup> process and the associated computing time.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">OMOP<sup><xref ref-type="table-fn" rid="table2fn2">b</xref></sup> tables</td><td align="left" valign="bottom">Records before the ETL process, n</td><td align="left" valign="bottom">Records after ETL process, n</td><td align="left" valign="bottom">Computing time (s)</td><td align="left" valign="bottom">Local tables</td></tr></thead><tbody><tr><td align="left" valign="top">CARE_SITE</td><td align="left" valign="top">&#x2014;<sup><xref ref-type="table-fn" rid="table2fn3">c</xref></sup></td><td align="left" valign="top">1</td><td align="left" valign="top">&#x003C;0.001</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">DEATH</td><td align="left" valign="top">419</td><td align="left" valign="top">419</td><td align="left" valign="top">&#x003C;0.001</td><td align="left" valign="top">Death</td></tr><tr><td align="left" valign="top">DRUG_ERA</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">1,084,012</td><td align="left" valign="top">3.75</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">DRUG_EXPOSURE</td><td align="left" valign="top">924,216</td><td align="left" valign="top">814,772</td><td align="left" valign="top">4.54</td><td align="left" valign="top">Drug</td></tr><tr><td align="left" valign="top">LOCATION</td><td align="left" valign="top">19,662</td><td align="left" valign="top">11,433</td><td align="left" valign="top">0.01</td><td align="left" valign="top">Address</td></tr><tr><td align="left" valign="top">MEASUREMENT</td><td align="left" valign="top">1,120,859</td><td align="left" valign="top">1,120,859</td><td align="left" valign="top">225.76</td><td align="left" valign="top">Biometrics and laboratory test</td></tr><tr><td align="left" valign="top">NOTE</td><td align="left" valign="top">2,772,809</td><td align="left" valign="top">2,091,705</td><td align="left" valign="top">4.57</td><td align="left" valign="top">Referrals, consultations, diagnoses, clinical reports from outside the MHC<sup><xref ref-type="table-fn" rid="table2fn4">d</xref></sup>, medical history, additional information, and vaccination status</td></tr><tr><td align="left" valign="top">OBSERVATION</td><td align="left" valign="top">64,669</td><td align="left" valign="top">2315</td><td align="left" valign="top">0.16</td><td align="left" valign="top">Medical history</td></tr><tr><td align="left" valign="top">OBSERVATION_PERIOD</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">18,256</td><td align="left" valign="top">0.01</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">PERSON</td><td align="left" valign="top">18,395</td><td align="left" valign="top">18,395</td><td align="left" valign="top">0.04</td><td align="left" valign="top">Patient</td></tr><tr><td align="left" valign="top">PROVIDER</td><td align="left" valign="top">8</td><td align="left" valign="top">8</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Patient</td></tr><tr><td align="left" valign="top">VISIT_OCCURRENCE</td><td align="left" valign="top">592,227</td><td align="left" valign="top">592,226</td><td align="left" valign="top">1.54</td><td align="left" valign="top">Consultation</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>ETL: extract-transform-load.</p></fn><fn id="table2fn2"><p><sup>b</sup>OMOP: Observational Medical Outcomes Partnership.</p></fn><fn id="table2fn3"><p><sup>c</sup>Not applicable.</p></fn><fn id="table2fn4"><p><sup>d</sup>MHC: multidisciplinary health center.</p></fn></table-wrap-foot></table-wrap><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>The data quality assessment dashboard. NA: not available.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v12i1e49542_fig03.png"/></fig><p>The concordance of results obtained from data quality evaluation queries between the source EHRs and the data warehouse&#x2019;s records proved that the process was reliable (<xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>). In the event of a difference between the two (results obtained from the data warehouse in OMOP format and results from the Weda software), we had to check the patient records in the software to identify what the correct figure was. Patients whose profile had been created after 2021 had to be removed from the results produced by the Weda software because the extraction data (stored in the data warehouse) goes up to June 2021 at the latest, and queries on the software interface allow filtering for the entire year. The family physician must declare when he or she became the patient&#x2019;s referring family physician. This family physician declaration is dated in the Weda software. This date is not found in the data warehouse. The date of the patient&#x2019;s registration with the family physician was also taken into account in the queries; registrations after the extraction date were removed. Queries concerning the laboratory test results were checked manually by one of the MHC&#x2019;s family physicians (CJ). Some laboratory test results were saved in the &#x201C;reports&#x201D; part and others were saved in the &#x201C;consultations&#x201D; part on the software.</p></sec><sec id="s3-4"><title>Practical Application</title><p>A 3-tab prototype dashboard was implemented (<xref ref-type="fig" rid="figure4">Figure 4</xref>). The first tab concerned the MHC&#x2019;s activity, the second concerned drug prescriptions, and the third concerned laboratory test results.</p><fig position="float" id="figure4"><label>Figure 4.</label><caption><p>The prototype primary care dashboard. PriCaDa: Primary Care Data Warehouse.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v12i1e49542_fig04.png"/></fig></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>In this study, we implemented primary care data into the OMOP CDM format from a French health care facility. Five concepts related to the consultation (reason for the consultation, diagnosis, and comments), the clinical report by another physician, some medical histories, referrals, and vaccination data in free text were stored in the NOTE table, and three structured free-text concepts were mapped to standard concepts (laboratory test results, biometrics, and measurement units). Overall, we included 592,226 consultations and 10,221 concepts over 20 years, including 9432 mappings between local concepts and standard concepts. The concept mapping was validated by three experts, including a family physician. We then used queries to validated the design of the OMOP CDM by comparing the results obtained in our data warehouse with those obtained in the source software.</p><p>The OMOP model was originally developed to answer pharmaco-epidemiologic questions by reference to hospital databases or claims databases. New types of data have since been integrated, such as those in the fields of cancer, microbiology, and anesthesia [<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref45">45</xref>]. Integrating these new data types might present difficulties not foreseen in the original CDM. Integrating primary care data required the addition of 10,221 new concepts. Through the sharing of tools and methods, the OMOP model enables reproducible analyses of decentralized data [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref46">46</xref>].</p></sec><sec id="s4-2"><title>Comparison With Previous Work</title><p>This work stands out for its integration of out-of-hospital clinical data over a long time period. In contrast to the French national health care database (<italic>Syst&#x00E8;me National des Donn&#x00E9;es de Sant&#x00E9;</italic>), we included clinical data. Similarly, the data produced by French hospital included test results from the hospital&#x2019;s laboratory only. We were able to load data from outpatient treatments and out-of-hospital medical laboratories into the OMOP model; in France, these data are not documented in claims and hospital databases. We also have data on drug prescriptions and associated dosage (duration of treatment, number of refills, number of drugs per dose, and dosing period), whereas the <italic>Syst&#x00E8;me National des Donn&#x00E9;es de Sant&#x00E9;</italic> only contains data on prescription fulfillment.</p><p>By using a CDM, we will be able to share our work with other primary care data reuse initiatives [<xref ref-type="bibr" rid="ref28">28</xref>].</p><p>This study had a number of strengths. First, it was based on collaboration between data scientists and family physicians. Each data transformation step was approved by the MHC&#x2019;s family physicians. Second, working with the EHR software&#x2019;s developer enabled us to understand the software&#x2019;s structure and export format. The involvement of the software developer in the study expedited the data extraction process. This collaboration with the software developer allowed us to retrieve the data in XML format, comprehend each of the XML tags, and discern the origin of the XML information within the software. Third, our development of a dashboard gave health care professionals an overview of their practice in terms of the number of patients followed and the number of consultations carried out over a defined period.</p></sec><sec id="s4-3"><title>Limitations</title><p>The first limitation is that a large proportion of the extracted primary care data had been entered as free text and required NLP methods or manual examination to be used secondarily. Moreover, the primary care EHR software provides information on drug prescriptions but not on filling or patient compliance.</p><p>The free text was difficult to map. Although the most frequent codes were mapped, further mapping and information extraction are needed. NLP methods might be able to recover the free-text information on the diagnosis established during the consultation and the symptoms mentioned.</p></sec><sec id="s4-4"><title>Perspective</title><p>The next step in the project will involve sharing the ETL process with other health care facilities equipped with Weda software or other software. A qualitative study during the presentation of the dashboard to the health care professionals might improve the prototype dashboard and identify unmet needs for further development. This extension will provide us with an opportunity to conduct multicenter studies and to integrate data from other professions working in primary care (such as nurses, midwives, physiotherapists, and pharmacists).</p></sec><sec id="s4-5"><title>Conclusion</title><p>We implemented primary care data from a French health care facility into the OMOP CDM format. Data concerning demographics, units, measurements, and primary care consultation steps were already available in the OHDSI vocabularies. Laboratory test results and drug prescription data were mapped with the available vocabulary and structured in the final model. However, the free text in the primary care EHR software complicates the reuse of additional clinical information such as diagnoses, symptoms, clinical reports, and reasons for consultation. A dashboard application provided health care professionals with feedback on their practice.</p></sec></sec></body><back><ack><p>We thank Dr David Fraser (Biotech Communication SARL, Ploudalm&#x00E9;zeau, France) for editorial assistance and helpful advice. The research was funded by the French government through the GIRCI Nord-Ouest program (GIRCI is a French abbreviation for "interregional groups for clinical research and innovation"; project: &#x201C;REsP-IR&#x201D;). The funding bodies did not participate in the design of this study; its execution, analyses, interpretation of the data; or the decision to submit the results.</p></ack><fn-group><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">ATC</term><def><p>Anatomical Therapeutic Chemical</p></def></def-item><def-item><term id="abb2">CDM</term><def><p>common data model</p></def></def-item><def-item><term id="abb3">CIP</term><def><p><italic>Code Identifiant de Sp&#x00E9;cialit&#x00E9;</italic> (the French national drug code)</p></def></def-item><def-item><term id="abb4">EHR</term><def><p>electronic health record</p></def></def-item><def-item><term id="abb5">ETL</term><def><p>extract-transform-load</p></def></def-item><def-item><term id="abb6"><italic>ICD-10</italic></term><def><p><italic>International Classification of Diseases, 10th Revision</italic></p></def></def-item><def-item><term id="abb7">MHC</term><def><p>multidisciplinary health center</p></def></def-item><def-item><term id="abb8">NLP</term><def><p>natural language processing</p></def></def-item><def-item><term id="abb9">OHDSI</term><def><p>Observational Health Data Sciences and Informatics</p></def></def-item><def-item><term id="abb10">OMOP</term><def><p>Observational Medical Outcomes Partnership</p></def></def-item><def-item><term id="abb11">PriCaDa</term><def><p>Primary Care Data Warehouse</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Schoen</surname><given-names>C</given-names> </name><name name-style="western"><surname>Osborn</surname><given-names>R</given-names> </name><name name-style="western"><surname>Squires</surname><given-names>D</given-names> </name><etal/></person-group><article-title>A survey of primary care doctors in ten countries shows progress in use of health information technology, less in other areas</article-title><source>Health Aff (Millwood)</source><year>2012</year><month>12</month><volume>31</volume><issue>12</issue><fpage>2805</fpage><lpage>2816</lpage><pub-id pub-id-type="doi">10.1377/hlthaff.2012.0884</pub-id><pub-id pub-id-type="medline">23154997</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Meystre</surname><given-names>SM</given-names> </name><name name-style="western"><surname>Lovis</surname><given-names>C</given-names> </name><name name-style="western"><surname>B&#x00FC;rkle</surname><given-names>T</given-names> </name><name name-style="western"><surname>Tognola</surname><given-names>G</given-names> </name><name name-style="western"><surname>Budrionis</surname><given-names>A</given-names> </name><name name-style="western"><surname>Lehmann</surname><given-names>CU</given-names> </name></person-group><article-title>Clinical data reuse or secondary use: current status and potential future progress</article-title><source>Yearb Med Inform</source><year>2017</year><month>08</month><volume>26</volume><issue>1</issue><fpage>38</fpage><lpage>52</lpage><pub-id pub-id-type="doi">10.15265/IY-2017-007</pub-id><pub-id pub-id-type="medline">28480475</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jannot</surname><given-names>AS</given-names> </name><name name-style="western"><surname>Zapletal</surname><given-names>E</given-names> </name><name name-style="western"><surname>Avillach</surname><given-names>P</given-names> </name><name name-style="western"><surname>Mamzer</surname><given-names>MF</given-names> </name><name name-style="western"><surname>Burgun</surname><given-names>A</given-names> </name><name name-style="western"><surname>Degoulet</surname><given-names>P</given-names> </name></person-group><article-title>The Georges Pompidou University Hospital clinical data warehouse: a 8-years follow-up experience</article-title><source>Int J Med Inform</source><year>2017</year><month>06</month><volume>102</volume><fpage>21</fpage><lpage>28</lpage><pub-id pub-id-type="doi">10.1016/j.ijmedinf.2017.02.006</pub-id><pub-id pub-id-type="medline">28495345</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Men&#x00E9;ndez Torre</surname><given-names>EL</given-names> </name><name name-style="western"><surname>Ares Blanco</surname><given-names>J</given-names> </name><name name-style="western"><surname>Conde Barreiro</surname><given-names>S</given-names> </name><name name-style="western"><surname>Rojo Mart&#x00ED;nez</surname><given-names>G</given-names> </name><name name-style="western"><surname>Delgado Alvarez</surname><given-names>E</given-names> </name><collab>en representaci&#x00F3;n del Grupo de Epidemiolog&#x00ED;a de la Sociedad Espa&#x00F1;ola de Diabetes (SED)</collab></person-group><article-title>Prevalence of diabetes mellitus in Spain in 2016 according to the Primary Care Clinical Database (BDCAP)</article-title><source>Endocrinol Diabetes Nutr (Engl Ed)</source><year>2021</year><month>02</month><volume>68</volume><issue>2</issue><fpage>109</fpage><lpage>115</lpage><pub-id pub-id-type="doi">10.1016/j.endinu.2019.12.004</pub-id><pub-id pub-id-type="medline">32988801</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lamer</surname><given-names>A</given-names> </name><name name-style="western"><surname>Moussa</surname><given-names>MD</given-names> </name><name name-style="western"><surname>Marcilly</surname><given-names>R</given-names> </name><name name-style="western"><surname>Logier</surname><given-names>R</given-names> </name><name name-style="western"><surname>Vallet</surname><given-names>B</given-names> </name><name name-style="western"><surname>Tavernier</surname><given-names>B</given-names> </name></person-group><article-title>Development and usage of an anesthesia data warehouse: lessons learnt from a 10-year project</article-title><source>J Clin Monit Comput</source><year>2023</year><month>04</month><volume>37</volume><issue>2</issue><fpage>461</fpage><lpage>472</lpage><pub-id pub-id-type="doi">10.1007/s10877-022-00898-y</pub-id><pub-id pub-id-type="medline">35933465</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="web"><article-title>Primary care</article-title><source>NHS Digital</source><access-date>2023-07-31</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://digital.nhs.uk/data-and-information/areas-of-interest/primary-care">https://digital.nhs.uk/data-and-information/areas-of-interest/primary-care</ext-link></comment></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="book"><person-group person-group-type="author"><collab>Institute of Medicine (US) Committee on the Future of Primary Care</collab></person-group><person-group person-group-type="editor"><name name-style="western"><surname>Donaldson</surname><given-names>MS</given-names> </name><name name-style="western"><surname>Yordy</surname><given-names>KD</given-names> </name><name name-style="western"><surname>Lohr</surname><given-names>KN</given-names> </name><etal/></person-group><article-title>Defining primary care</article-title><source>Primary Care: America&#x2019;s Health in a New Era</source><year>1996</year><access-date>2023-07-31</access-date><publisher-name>National Academies Press (US)</publisher-name><comment><ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/books/NBK232631/">https://www.ncbi.nlm.nih.gov/books/NBK232631/</ext-link></comment></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gentil</surname><given-names>ML</given-names> </name><name name-style="western"><surname>Cuggia</surname><given-names>M</given-names> </name><name name-style="western"><surname>Fiquet</surname><given-names>L</given-names> </name><etal/></person-group><article-title>Factors influencing the development of primary care data collection projects from electronic health records: a systematic review of the literature</article-title><source>BMC Med Inform Decis Mak</source><year>2017</year><month>09</month><day>25</day><volume>17</volume><issue>1</issue><fpage>139</fpage><pub-id pub-id-type="doi">10.1186/s12911-017-0538-x</pub-id><pub-id pub-id-type="medline">28946908</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Danciu</surname><given-names>I</given-names> </name><name name-style="western"><surname>Cowan</surname><given-names>JD</given-names> </name><name name-style="western"><surname>Basford</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Secondary use of clinical data: the Vanderbilt approach</article-title><source>J Biomed Inform</source><year>2014</year><month>12</month><volume>52</volume><fpage>28</fpage><lpage>35</lpage><pub-id pub-id-type="doi">10.1016/j.jbi.2014.02.003</pub-id><pub-id pub-id-type="medline">24534443</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Coorevits</surname><given-names>P</given-names> </name><name name-style="western"><surname>Sundgren</surname><given-names>M</given-names> </name><name name-style="western"><surname>Klein</surname><given-names>GO</given-names> </name><etal/></person-group><article-title>Electronic health records: new opportunities for clinical research</article-title><source>J Intern Med</source><year>2013</year><month>12</month><volume>274</volume><issue>6</issue><fpage>547</fpage><lpage>560</lpage><pub-id pub-id-type="doi">10.1111/joim.12119</pub-id><pub-id pub-id-type="medline">23952476</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Muller</surname><given-names>S</given-names> </name></person-group><article-title>Electronic medical records: the way forward for primary care research?</article-title><source>Fam Pract</source><year>2014</year><month>04</month><volume>31</volume><issue>2</issue><fpage>127</fpage><lpage>129</lpage><pub-id pub-id-type="doi">10.1093/fampra/cmu009</pub-id><pub-id pub-id-type="medline">24627543</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Carey</surname><given-names>IM</given-names> </name><name name-style="western"><surname>Banchoff</surname><given-names>E</given-names> </name><name name-style="western"><surname>Nirmalananthan</surname><given-names>N</given-names> </name><etal/></person-group><article-title>Prevalence and incidence of neuromuscular conditions in the UK between 2000 and 2019: a retrospective study using primary care data</article-title><source>PLoS One</source><year>2021</year><month>12</month><day>31</day><volume>16</volume><issue>12</issue><fpage>e0261983</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0261983</pub-id><pub-id pub-id-type="medline">34972157</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Boullenger</surname><given-names>L</given-names> </name><name name-style="western"><surname>Quindroit</surname><given-names>P</given-names> </name><name name-style="western"><surname>Legrand</surname><given-names>B</given-names> </name><etal/></person-group><article-title>Type 2 diabetics followed up by family physicians: treatment sequences and changes over time in weight and glycated hemoglobin, prim</article-title><source>Prim Care Diabetes</source><year>2022</year><month>10</month><volume>16</volume><issue>5</issue><fpage>670</fpage><lpage>676</lpage><pub-id pub-id-type="doi">10.1016/j.pcd.2022.07.002</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Loadsman</surname><given-names>MEN</given-names> </name><name name-style="western"><surname>Verheij</surname><given-names>TJM</given-names> </name><name name-style="western"><surname>van der Velden</surname><given-names>AW</given-names> </name></person-group><article-title>Impetigo incidence and treatment: a retrospective study of Dutch routine primary care data</article-title><source>Fam Pract</source><year>2019</year><month>07</month><day>31</day><volume>36</volume><issue>4</issue><fpage>410</fpage><lpage>416</lpage><pub-id pub-id-type="doi">10.1093/fampra/cmy104</pub-id><pub-id pub-id-type="medline">30346521</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Marwaha</surname><given-names>S</given-names> </name><name name-style="western"><surname>Dusendang</surname><given-names>JR</given-names> </name><name name-style="western"><surname>Alexeeff</surname><given-names>SE</given-names> </name><etal/></person-group><article-title>Comanagement of rashes by primary care providers and dermatologists: a retrospective study</article-title><source>Perm J</source><year>2021</year><month>12</month><day>13</day><volume>25</volume><fpage>20.320</fpage><pub-id pub-id-type="doi">10.7812/TPP/20.320</pub-id><pub-id pub-id-type="medline">35348083</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Milea</surname><given-names>D</given-names> </name><name name-style="western"><surname>Yeo</surname><given-names>SH</given-names> </name><name name-style="western"><surname>Nam</surname><given-names>Y</given-names> </name><etal/></person-group><article-title>Long-acting bronchodilator use in chronic obstructive pulmonary disease in primary care in New Zealand: a retrospective study of treatment patterns and evolution using the HealthStat database</article-title><source>Int J Chron Obstruct Pulmon Dis</source><year>2021</year><month>04</month><day>20</day><volume>16</volume><fpage>1075</fpage><lpage>1091</lpage><pub-id pub-id-type="doi">10.2147/COPD.S290887</pub-id><pub-id pub-id-type="medline">33907394</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sollie</surname><given-names>A</given-names> </name><name name-style="western"><surname>Sijmons</surname><given-names>RH</given-names> </name><name name-style="western"><surname>Helsper</surname><given-names>C</given-names> </name><name name-style="western"><surname>Numans</surname><given-names>ME</given-names> </name></person-group><article-title>Reusability of coded data in the primary care electronic medical record: a dynamic cohort study concerning cancer diagnoses</article-title><source>Int J Med Inform</source><year>2017</year><month>03</month><volume>99</volume><fpage>45</fpage><lpage>52</lpage><pub-id pub-id-type="doi">10.1016/j.ijmedinf.2016.08.004</pub-id><pub-id pub-id-type="medline">28118921</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kornf&#x00E4;lt Isberg</surname><given-names>H</given-names> </name><name name-style="western"><surname>Hedin</surname><given-names>K</given-names> </name><name name-style="western"><surname>Melander</surname><given-names>E</given-names> </name><name name-style="western"><surname>M&#x00F6;lstad</surname><given-names>S</given-names> </name><name name-style="western"><surname>Beckman</surname><given-names>A</given-names> </name></person-group><article-title>Increased adherence to treatment guidelines in patients with urinary tract infection in primary care: a retrospective study</article-title><source>PLoS One</source><year>2019</year><month>03</month><day>28</day><volume>14</volume><issue>3</issue><fpage>e0214572</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0214572</pub-id><pub-id pub-id-type="medline">30921411</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Fruchart</surname><given-names>M</given-names> </name><name name-style="western"><surname>Quindroit</surname><given-names>P</given-names> </name><name name-style="western"><surname>Patel</surname><given-names>H</given-names> </name><name name-style="western"><surname>Beuscart</surname><given-names>JB</given-names> </name><name name-style="western"><surname>Calafiore</surname><given-names>M</given-names> </name><name name-style="western"><surname>Lamer</surname><given-names>A</given-names> </name></person-group><article-title>Implementation of a data warehouse in primary care: first analyses with elderly patients</article-title><source>Stud Health Technol Inform</source><year>2022</year><month>05</month><day>25</day><volume>294</volume><fpage>505</fpage><lpage>509</lpage><pub-id pub-id-type="doi">10.3233/SHTI220510</pub-id><pub-id pub-id-type="medline">35612131</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="web"><source>Clinical Practice Research Datalink (CPRD)</source><access-date>2023-05-04</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.cprd.com/node/120">https://www.cprd.com/node/120</ext-link></comment></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="web"><source>The Health Improvement Network (THIN)</source><access-date>2023-05-04</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.the-health-improvement-network.com">https://www.the-health-improvement-network.com</ext-link></comment></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="web"><article-title>Corporate Data Warehouse (CDW)</article-title><source>US Department of Veterans Affairs</source><access-date>2023-05-04</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.hsrd.research.va.gov/for_researchers/cdw.cfm">https://www.hsrd.research.va.gov/for_researchers/cdw.cfm</ext-link></comment></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="web"><source>Canadian Primary Care Sentinel Surveillance Network (CPCSSN)</source><access-date>2023-05-04</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://cpcssn.ca/">https://cpcssn.ca/</ext-link></comment></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Safran</surname><given-names>C</given-names> </name></person-group><article-title>Reuse of clinical data</article-title><source>Yearb Med Inform</source><year>2014</year><month>08</month><day>15</day><volume>9</volume><issue>1</issue><fpage>52</fpage><lpage>54</lpage><pub-id pub-id-type="doi">10.15265/IY-2014-0013</pub-id><pub-id pub-id-type="medline">25123722</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Weiskopf</surname><given-names>NG</given-names> </name><name name-style="western"><surname>Weng</surname><given-names>C</given-names> </name></person-group><article-title>Methods and dimensions of electronic health record data quality assessment: enabling reuse for clinical research</article-title><source>J Am Med Inform Assoc</source><year>2013</year><month>01</month><day>1</day><volume>20</volume><issue>1</issue><fpage>144</fpage><lpage>151</lpage><pub-id pub-id-type="doi">10.1136/amiajnl-2011-000681</pub-id><pub-id pub-id-type="medline">22733976</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Pascoe</surname><given-names>SW</given-names> </name><name name-style="western"><surname>Neal</surname><given-names>RD</given-names> </name><name name-style="western"><surname>Heywood</surname><given-names>PL</given-names> </name><name name-style="western"><surname>Allgar</surname><given-names>VL</given-names> </name><name name-style="western"><surname>Miles</surname><given-names>JN</given-names> </name><name name-style="western"><surname>Stefoski-Mikeljevic</surname><given-names>J</given-names> </name></person-group><article-title>Identifying patients with a cancer diagnosis using general practice medical records and cancer registry data</article-title><source>Fam Pract</source><year>2008</year><month>08</month><volume>25</volume><issue>4</issue><fpage>215</fpage><lpage>220</lpage><pub-id pub-id-type="doi">10.1093/fampra/cmn023</pub-id><pub-id pub-id-type="medline">18550895</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Terry</surname><given-names>AL</given-names> </name><name name-style="western"><surname>Stewart</surname><given-names>M</given-names> </name><name name-style="western"><surname>Cejic</surname><given-names>S</given-names> </name><etal/></person-group><article-title>A basic model for assessing primary health care electronic medical record data quality</article-title><source>BMC Med Inform Decis Mak</source><year>2019</year><month>02</month><day>12</day><volume>19</volume><issue>1</issue><fpage>30</fpage><pub-id pub-id-type="doi">10.1186/s12911-019-0740-0</pub-id><pub-id pub-id-type="medline">30755205</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Papez</surname><given-names>V</given-names> </name><name name-style="western"><surname>Moinat</surname><given-names>M</given-names> </name><name name-style="western"><surname>Voss</surname><given-names>EA</given-names> </name><etal/></person-group><article-title>Transforming and evaluating the UK Biobank to the OMOP common data model for COVID-19 research and beyond</article-title><source>J Am Med Inform Assoc</source><year>2022</year><month>12</month><day>13</day><volume>30</volume><issue>1</issue><fpage>103</fpage><lpage>111</lpage><pub-id pub-id-type="doi">10.1093/jamia/ocac203</pub-id><pub-id pub-id-type="medline">36227072</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hripcsak</surname><given-names>G</given-names> </name><name name-style="western"><surname>Duke</surname><given-names>JD</given-names> </name><name name-style="western"><surname>Shah</surname><given-names>NH</given-names> </name><etal/></person-group><article-title>Observational Health Data Sciences and Informatics (OHDSI): opportunities for observational researchers</article-title><source>Stud Health Technol Inform</source><year>2015</year><volume>216</volume><fpage>574</fpage><lpage>578</lpage><pub-id pub-id-type="medline">26262116</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="web"><source>Observational Health Data Sciences and Informatics (OHDSI)</source><access-date>2023-02-13</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.ohdsi.org/">https://www.ohdsi.org/</ext-link></comment></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="web"><article-title>OMOP CDM v5.4</article-title><source>OHDSI GitHub</source><access-date>2023-02-13</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://ohdsi.github.io/CommonDataModel/cdm54.html">https://ohdsi.github.io/CommonDataModel/cdm54.html</ext-link></comment></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="web"><article-title>OMOP Standardized Vocabulary V5.0</article-title><source>Observational Health Data Sciences and Informatics (OHDSI)</source><access-date>2022-07-13</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.ohdsi.org/web/wiki/doku.php?id=documentation:vocabulary">https://www.ohdsi.org/web/wiki/doku.php?id=documentation:vocabulary</ext-link></comment></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lamer</surname><given-names>A</given-names> </name><name name-style="western"><surname>Abou-Arab</surname><given-names>O</given-names> </name><name name-style="western"><surname>Bourgeois</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Transforming anesthesia data into the Observational Medical Outcomes Partnership common data model: development and usability study</article-title><source>J Med Internet Res</source><year>2021</year><month>10</month><day>29</day><volume>23</volume><issue>10</issue><fpage>e29259</fpage><pub-id pub-id-type="doi">10.2196/29259</pub-id><pub-id pub-id-type="medline">34714250</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Paris</surname><given-names>N</given-names> </name><name name-style="western"><surname>Lamer</surname><given-names>A</given-names> </name><name name-style="western"><surname>Parrot</surname><given-names>A</given-names> </name></person-group><article-title>Transformation and evaluation of the MIMIC database in the OMOP common data model: development and usability study</article-title><source>JMIR Med Inform</source><year>2021</year><month>12</month><day>14</day><volume>9</volume><issue>12</issue><fpage>e30970</fpage><pub-id pub-id-type="doi">10.2196/30970</pub-id><pub-id pub-id-type="medline">34904958</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Haberson</surname><given-names>A</given-names> </name><name name-style="western"><surname>Rinner</surname><given-names>C</given-names> </name><name name-style="western"><surname>Sch&#x00F6;berl</surname><given-names>A</given-names> </name><name name-style="western"><surname>Gall</surname><given-names>W</given-names> </name></person-group><article-title>Feasibility of mapping Austrian health claims data to the OMOP common data model</article-title><source>J Med Syst</source><year>2019</year><month>09</month><day>7</day><volume>43</volume><issue>10</issue><fpage>314</fpage><pub-id pub-id-type="doi">10.1007/s10916-019-1436-9</pub-id><pub-id pub-id-type="medline">31494719</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="web"><source>Weda</source><access-date>2023-09-14</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://weda.fr/">https://weda.fr/</ext-link></comment></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="web"><article-title>White Rabbit</article-title><source>OHDSI GitHub</source><access-date>2023-02-13</access-date><comment><ext-link ext-link-type="uri" xlink:href="http://ohdsi.github.io/WhiteRabbit/WhiteRabbit.html">http://ohdsi.github.io/WhiteRabbit/WhiteRabbit.html</ext-link></comment></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="web"><article-title>Rabbit in a Hat</article-title><source>OHDSI GitHub</source><access-date>2023-02-13</access-date><comment><ext-link ext-link-type="uri" xlink:href="http://ohdsi.github.io/WhiteRabbit/RabbitInAHat.html">http://ohdsi.github.io/WhiteRabbit/RabbitInAHat.html</ext-link></comment></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lemaire</surname><given-names>F</given-names> </name></person-group><article-title>The Jard&#x00E9; law: what does change [Article in French]</article-title><source>Presse Med</source><year>2019</year><month>03</month><volume>48</volume><issue>3 Pt 1</issue><fpage>238</fpage><lpage>242</lpage><pub-id pub-id-type="doi">10.1016/j.lpm.2019.01.006</pub-id><pub-id pub-id-type="medline">30853280</pub-id></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="web"><article-title>Athena</article-title><source>Observational Health Data Sciences and Informatics (OHDSI)</source><access-date>2023-02-13</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://athena.ohdsi.org/search-terms/start">https://athena.ohdsi.org/search-terms/start</ext-link></comment></nlm-citation></ref><ref id="ref41"><label>41</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cohen</surname><given-names>J</given-names> </name></person-group><article-title>A coefficient of agreement for nominal scales</article-title><source>Educ Psychol Meas</source><year>1960</year><month>04</month><volume>20</volume><issue>1</issue><fpage>37</fpage><lpage>46</lpage><pub-id pub-id-type="doi">10.1177/001316446002000104</pub-id></nlm-citation></ref><ref id="ref42"><label>42</label><nlm-citation citation-type="web"><article-title>ATLAS</article-title><source>Observational Health Data Sciences and Informatics (OHDSI)</source><access-date>2023-02-13</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://atlas-demo.ohdsi.org/">https://atlas-demo.ohdsi.org/</ext-link></comment></nlm-citation></ref><ref id="ref43"><label>43</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kahn</surname><given-names>MG</given-names> </name><name name-style="western"><surname>Callahan</surname><given-names>TJ</given-names> </name><name name-style="western"><surname>Barnard</surname><given-names>J</given-names> </name><etal/></person-group><article-title>A harmonized data quality assessment terminology and framework for the secondary use of electronic health record data</article-title><source>EGEMS (Wash DC)</source><year>2016</year><month>09</month><day>11</day><volume>4</volume><issue>1</issue><fpage>1244</fpage><pub-id pub-id-type="doi">10.13063/2327-9214.1244</pub-id><pub-id pub-id-type="medline">27713905</pub-id></nlm-citation></ref><ref id="ref44"><label>44</label><nlm-citation citation-type="web"><article-title>Shinydashboard</article-title><source>Rstudio GitHub</source><access-date>2023-02-13</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://rstudio.github.io/shinydashboard/">https://rstudio.github.io/shinydashboard/</ext-link></comment></nlm-citation></ref><ref id="ref45"><label>45</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yoo</surname><given-names>S</given-names> </name><name name-style="western"><surname>Yoon</surname><given-names>E</given-names> </name><name name-style="western"><surname>Boo</surname><given-names>D</given-names> </name><etal/></person-group><article-title>Transforming thyroid cancer diagnosis and staging information from unstructured reports to the Observational Medical Outcome Partnership Common Data Model</article-title><source>Appl Clin Inform</source><year>2022</year><month>05</month><volume>13</volume><issue>3</issue><fpage>521</fpage><lpage>531</lpage><pub-id pub-id-type="medline">35705182</pub-id></nlm-citation></ref><ref id="ref46"><label>46</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Delanerolle</surname><given-names>G</given-names> </name><name name-style="western"><surname>Williams</surname><given-names>R</given-names> </name><name name-style="western"><surname>Stipancic</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Methodological issues in using a common data model of COVID-19 vaccine uptake and important adverse events of interest: feasibility study of data and connectivity COVID-19 vaccines pharmacovigilance in the United Kingdom</article-title><source>JMIR Form Res</source><year>2022</year><month>08</month><day>22</day><volume>6</volume><issue>8</issue><fpage>e37821</fpage><pub-id pub-id-type="doi">10.2196/37821</pub-id><pub-id pub-id-type="medline">35786634</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Standard concept types for each source table.</p><media xlink:href="medinform_v12i1e49542_app1.doc" xlink:title="DOC File, 39 KB"/></supplementary-material><supplementary-material id="app2"><label>Multimedia Appendix 2</label><p>The distribution of the blood potassium concentration values on the Achilles dashboard on the Atlas server.</p><media xlink:href="medinform_v12i1e49542_app2.png" xlink:title="PNG File, 139 KB"/></supplementary-material><supplementary-material id="app3"><label>Multimedia Appendix 3</label><p>Results of the data quality assessment dashboard for each feature.</p><media xlink:href="medinform_v12i1e49542_app3.png" xlink:title="PNG File, 149 KB"/></supplementary-material><supplementary-material id="app4"><label>Multimedia Appendix 4</label><p>List of quality requests and the associated SQL codes.</p><media xlink:href="medinform_v12i1e49542_app4.doc" xlink:title="DOC File, 27 KB"/></supplementary-material></app-group></back></article>