<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.0" xmlns:xlink="http://www.w3.org/1999/xlink">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id>
      <journal-title>JMIR Medical Informatics</journal-title>
      <issn pub-type="epub">2291-9694</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v14i1e81254</article-id>
      <article-id pub-id-type="pmid">41802234</article-id>
      <article-id pub-id-type="doi">10.2196/81254</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Harmonizing Logical Observation Identifiers Names and Codes (LOINC) Codes and Units in Real-World Oncology Data: Method Development and Evaluation</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Benis</surname>
            <given-names>Arriel</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Famotire</surname>
            <given-names>Akinwale</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Dixon</surname>
            <given-names>Brian</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Naliyatthaliyazchayil</surname>
            <given-names>Parvati</given-names>
          </name>
          <degrees>PharmD, MS</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution/>
            <institution>ConcertAI, LLC</institution>
            <addr-line>1120 Massachusetts Ave.</addr-line>
            <addr-line>Cambridge, MA, 02138</addr-line>
            <country>United States</country>
            <phone>1 317 985 7429</phone>
            <email>parumenon.pm@gmail.com</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0003-5917-4558</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Stenerson</surname>
            <given-names>Travis</given-names>
          </name>
          <degrees>MHI, MD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0003-5128-7574</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>ConcertAI, LLC</institution>
        <addr-line>Cambridge, MA</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Parvati Naliyatthaliyazchayil <email>parumenon.pm@gmail.com</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2026</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>9</day>
        <month>3</month>
        <year>2026</year>
      </pub-date>
      <volume>14</volume>
      <elocation-id>e81254</elocation-id>
      <history>
        <date date-type="received">
          <day>25</day>
          <month>7</month>
          <year>2025</year>
        </date>
        <date date-type="rev-request">
          <day>11</day>
          <month>11</month>
          <year>2025</year>
        </date>
        <date date-type="rev-recd">
          <day>23</day>
          <month>1</month>
          <year>2026</year>
        </date>
        <date date-type="accepted">
          <day>17</day>
          <month>2</month>
          <year>2026</year>
        </date>
      </history>
      <copyright-statement>©Parvati Naliyatthaliyazchayil, Travis Stenerson. Originally published in JMIR Medical Informatics (https://medinform.jmir.org), 09.03.2026.</copyright-statement>
      <copyright-year>2026</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on https://medinform.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://medinform.jmir.org/2026/1/e81254" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>The expanding use of multisource real-world electronic health record (EHR) and claims data offers major opportunities for research, drug discovery, and clinical decision support. While standards such as Logical Observation Identifiers Names and Codes (LOINC) can ensure semantic interoperability for laboratory observations, clinical documents, and other clinical terms, properly assigning these concepts remains a challenge. Studies show that 6% to 19% of laboratory tests cannot be accurately mapped to LOINC. Existing systems try to address this challenge but often depend on source data strings and other input features that may be absent, null, or incorrect. This underscores the need for a scalable approach to correct LOINC code assignments, standardize units, and ensure data integrity across multisource laboratory data.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This paper presents a universally applicable framework that identifies and corrects observable errors in quantitative laboratory results coded to LOINC and the Systematized Nomenclature of Medicine for the unit of measure without relying on raw source data strings. The process seeks to improve the accuracy, conformance, consistency, and completeness of laboratory data while maintaining complete provenance.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>The proposed framework uses a 2-step process. First, LOINC codes are corrected using the associated unit of measure. Second, units are adjusted or populated to match a preferred unit for that LOINC code. In both steps, the quantitative result is checked against a predefined acceptable range to determine validity. The process is driven by 3 knowledge tables. The framework is applied to datasets derived from the ConcertAI database of approximately 10 million patients with cancer, evaluating improvements in LOINC code–unit conformance and unit completeness. Analyses are performed on 4 independently LOINC-coded datasets: the full ConcertAI dataset and 3 high-volume diverse subsets grouped by data source or EHR vendor.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>A total of 428 LOINC codes were observed across 6.34 billion records in the ConcertAI database. All 4 datasets were processed using the proposed framework. Before applying the framework, 73.1% (4,634,610,173/6,337,101,453) of records in the ConcertAI dataset had correctly assigned units based on the laboratory reasonable range table; after application, this increased to 99.7% (6,322,375,200/6,341,230,213). Similar improvements were observed across the 3 EHR-specific datasets, increasing from 78.5% (691,315,390/880,250,137) to 99.8% (879,626,472/881,157,852; source 1), 71.4% (2,132,455,936/2,985,465,124) to 99.8% (2,982,319,644/2,988,173,959; source 2), and 63.3% (2,936,710,502/4,640,432,294) to 99.6% (4,618,714,114/4,638,862,412; source 3). Unit completeness also improved substantially, increasing from 92.7% (5,879,071,858/6,341,230,213) to 99.8% (6,331,923,060/6,341,230,213) in the ConcertAI dataset and from 92.5% (814,867,241/881,157,852) to 100% (880,816,133/881,157,852), 94.4% (2,822,107,252/2,988,173,959) to 99.9% (2,986,624,027/2,988,173,959), and 91.7% (4,254,054,966/4,638,862,412) to 99.8% (4,632,935,919/4,638,862,412) in sources 1 to 3, respectively.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Laboratory data quality is crucial in oncology systems for therapy selection, monitoring, and disease progression assessment. This proposed solution is a first-of-its-kind, system-agnostic, and scalable normalization process that addresses key gaps in laboratory data quality across multiple dimensions.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>real-world data</kwd>
        <kwd>laboratory data</kwd>
        <kwd>harmonization</kwd>
        <kwd>standardization</kwd>
        <kwd>oncology</kwd>
        <kwd>health care system</kwd>
        <kwd>electronic health record</kwd>
        <kwd>multisourced data</kwd>
        <kwd>structured data</kwd>
        <kwd>mapping</kwd>
        <kwd>Fast Healthcare Interoperability Resources</kwd>
        <kwd>FHIR</kwd>
        <kwd>Logical Observation Identifiers Names and Codes</kwd>
        <kwd>LOINC</kwd>
        <kwd>Systematized Nomenclature of Medicine</kwd>
        <kwd>SNOMED</kwd>
        <kwd>unit conversion</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background: Real-World Data in Health Care</title>
        <p>Multisourced, comprehensive patient health data have seen a recent rise in prominence and utility in supporting research, drug discovery, pharmacovigilance, and clinical decision support [<xref ref-type="bibr" rid="ref1">1</xref>]. These real-world data (RWD) are collected for individual patient care and reimbursement in often unconnected systems such as electronic health records (EHRs) and claims clearing houses [<xref ref-type="bibr" rid="ref2">2</xref>]. Secondary use of RWD holds immense potential for improving health due to its volume, variety, and ubiquity [<xref ref-type="bibr" rid="ref3">3</xref>].</p>
        <p>The different source systems producing RWD bring individual challenges and opportunities, and it is often necessary to stitch together disparate sources to cover a complete patient journey [<xref ref-type="bibr" rid="ref3">3</xref>]. For instance, medical claims may contain procedures and tests performed on a patient and their associated costs, but the results of those tests are only present in the EHR [<xref ref-type="bibr" rid="ref4">4</xref>].</p>
      </sec>
      <sec>
        <title>Data Quality and Semantic Interoperability Challenges</title>
        <p>The path to a usable RWD dataset is fraught with challenges [<xref ref-type="bibr" rid="ref2">2</xref>]. Errors can arise from any system or actor that generates, transmits, transforms, or persists the data during its lifetime [<xref ref-type="bibr" rid="ref5">5</xref>]. Errors can be discernible from patterns observed in the data or can be hidden from downstream users when information is lost [<xref ref-type="bibr" rid="ref6">6</xref>]. Information loss can result in incorrectness or missingness of variables, records, tables, or complete data sources [<xref ref-type="bibr" rid="ref7">7</xref>]. Monitoring and minimizing information loss is a critical requirement of an RWD pipeline.</p>
        <p>Semantic interoperability (SI), or the ability to ensure the same meaning and interpretation of data shared between systems [<xref ref-type="bibr" rid="ref8">8</xref>], is a well-established and ongoing challenge in RWD [<xref ref-type="bibr" rid="ref5">5</xref>]. It can manifest as redundant representations of the same concept, such as one EHR using the <italic>International Classification of Diseases, 10th Revision, Clinical Modification</italic>, and another using the Systematized Nomenclature of Medicine (SNOMED) to represent the same disease. Use of data standards and common ontologies can alleviate SI challenges but can also introduce errors if used incorrectly [<xref ref-type="bibr" rid="ref5">5</xref>], which can commonly occur when a concept is assigned to a string by either a human or machine [<xref ref-type="bibr" rid="ref9">9</xref>]. As health care data systems continue to evolve, the importance of SI is underscored by the increasing adoption of standards such as Fast Healthcare Interoperability Resources (FHIR) [<xref ref-type="bibr" rid="ref10">10</xref>] with its associated code system bindings supported by the Food and Drug Administration, which are designed to ensure consistent data interpretation and improve interoperability across systems. Even FHIR-based representations may fall short in fully addressing semantic mismatches, particularly for complex domains such as laboratory data, in which variability in coding, units, and local conventions persists despite standardization efforts [<xref ref-type="bibr" rid="ref11">11</xref>].</p>
      </sec>
      <sec>
        <title>Laboratory Data and Logical Observation Identifiers Names and Codes Mapping Challenges</title>
        <p>Laboratory result data are both valuable and particularly challenging in RWD [<xref ref-type="bibr" rid="ref9">9</xref>]. To address SI, laboratory data primarily rely on codes from the Logical Observation Identifiers Names and Codes (LOINC) code system [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>]. LOINC is the dominant global coding system for laboratory concepts but also extends to a broader range of clinical terms, including clinical questions and documents [<xref ref-type="bibr" rid="ref12">12</xref>-<xref ref-type="bibr" rid="ref15">15</xref>]. LOINC consists of concepts that have 6 attributes each. These include the analyte tested, how it is observed, the duration of observation, and the sample type that the observation is performed on [<xref ref-type="bibr" rid="ref13">13</xref>]. Precoordinating that much information into a single concept makes it convenient for transmission by reducing the potential for misinterpretation but also makes it difficult to use when mapping to LOINC [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref15">15</xref>]. The complete information for LOINC mapping is rarely present in a single string, column, or record [<xref ref-type="bibr" rid="ref15">15</xref>]. Relevant information may be spread across one or more fields in a record or laboratory information system, such as the observation’s display string (eg, glucose), the data type of the result (numeric or categorical), the unit of measure (mass over volume or molarity), the associated order name or panel name (complete blood count or urinalysis), the associated sample (urine or blood), the device or equipment used to make the observation (urine dipstick or continuous glucose monitor), or other observations that occurred as part of the same panel of tests (Is the patient fasting?). Despite the abundance of resources, accurately translating these fields to the correct LOINC code remains a challenge.</p>
        <p>This semantic and translational complexity means that laboratory results in RWD can frequently present with errors introduced during terminology binding to LOINC [<xref ref-type="bibr" rid="ref16">16</xref>]. Prior studies have shown that LOINC codes could not be assigned for 6% to 19% of laboratory tests due to incomplete or incorrect information [<xref ref-type="bibr" rid="ref17">17</xref>]. Systems have been proposed to reduce this error by coding via automated means in RWD [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref18">18</xref>] and clinical trial data [<xref ref-type="bibr" rid="ref19">19</xref>]. These algorithms rely on source data strings and other input features that may be absent, null, or observably incorrect.</p>
      </sec>
      <sec>
        <title>Unit of Measure and Normalization Challenges</title>
        <p>The diversity of information required for LOINC mapping increases the likelihood of mapping difficulty [<xref ref-type="bibr" rid="ref20">20</xref>] and significant information loss. If a result’s unit of measure is absent or recorded in the wrong place or the associated panel name, order name, or sample type is missing from the data, it can mean insufficient information to properly assign the LOINC code [<xref ref-type="bibr" rid="ref15">15</xref>]. Contextually appropriate filling in of absent units of measure has been shown to be effective in a system that extracts logical expressions from clinical trial inclusion criteria pertaining to quantitative laboratory results but not within RWD [<xref ref-type="bibr" rid="ref21">21</xref>].</p>
        <p>A laboratory result may present with a correct concept code, but it is possible to represent the same result using multiple scales (g or mg), and certain units are used interchangeably between sources (mg per day or mg per 24 hours). Unit normalization is necessary to ensure comparable results during data analysis and aggregation, and the variety of representation, the missingness, and the level of incorrectness can all lead to loss of utility of RWD. Even with a correct LOINC code, missing or inconsistent units have been shown to affect as much as 14% of laboratory records in some systems [<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref23">23</xref>]. Mechanisms to normalize synonymous units exist, but these techniques do not handle situations in which the unit is incomplete, incorrect, or completely absent [<xref ref-type="bibr" rid="ref24">24</xref>].</p>
      </sec>
      <sec>
        <title>Proposed Framework and Objective: Correcting Quantitative Laboratory Results</title>
        <p>In this paper, we present a framework to identify and correct observable errors in quantitative laboratory results that have already been coded to LOINC for the observation and SNOMED for the unit of measure without reliance on source data strings. This 2-step process first adjusts the LOINC code by using information contained in the associated unit of measure. Next, we use the quantitative result to inform whether we can safely populate a missing unit of measure or correct an erroneous unit of measure. Finally, all synonymous or related units are normalized to a single preselected unit for each LOINC code. We characterize the prevalence of these errors and then use this framework to correct laboratory results in a multisource RWD pipeline of oncology patient data from EHRs, laboratory information systems, and medical claims.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <p>This section outlines the data collection and study design used to develop this framework.</p>
      <sec>
        <title>Data Collection</title>
        <p>Laboratory result data were extracted from the ConcertAI database, a US-based, deidentified, patient-level dataset from approximately 10 million patients with cancer aged ≥18 years during the period from 2015 to 2025. The data used in this study were sourced from EHRs, including oncology practices, hospitals, and academic medical centers. To evaluate the framework, we analyzed 4 laboratory datasets: the full ConcertAI database and 3 subsets corresponding to the individual EHR sources (represented as source 1, source 2, and source 3) that transmitted data to ConcertAI. These 3 subsets were selected because they were the top contributors of laboratory data by volume and represented a broad diversity of laboratory tests. Specifically, the ConcertAI database accounted for 6.34 billion records, source 1 included 880 million records, source 2 included 2.98 billion records, and source 3 included 4.64 billion records.</p>
        <p>Data were contributed by multiple clinical sites and laboratories across the United States, representing a diverse group of care settings. Each dataset was standardized using LOINC codes for laboratory observations and SNOMED codes for units of measure. For records from the full ConcertAI database, LOINC codification was performed using ConcertAI’s internal system; for EHR or data source–derived subsets, the LOINC codes that were delivered with those data were used. Only records with a numeric value were used in this study. All datasets used ConcertAI’s unit codification that maps unit strings to SNOMED.</p>
      </sec>
      <sec>
        <title>System Design</title>
        <p>The laboratory correction framework was applied after standardization to LOINC and SNOMED. The laboratory correction system relies on 3 knowledge tables that have been manually created after careful examination of the ConcertAI laboratory data, as outlined below. Their role in supporting the logical framework is discussed later in this section. Below, we provide the formal definitions of these tables, including their constituent fields and primary keys. The procedures used to create each table and the column definitions are documented in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p>
        <p>The LOINC conversion map (LCM) relates a LOINC concept and unit concept that are incongruous to a new LOINC code that is compatible with the unit of measure. The table structure incorporates the following computable fields: “old_loinc_code,” “old_loinc_display,” “old_loinc_system,” “unit_code,” “unit_display,” “unit_system,” “new_loinc_code,” “new_loinc_display,” and “new_loinc_system.” The primary key for the table is defined as the composite of “old_loinc_code” and “unit_code.” Examples are shown in <xref ref-type="table" rid="table1">Table 1</xref>, which has been formatted for readability. The complete computable version is available in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> and in the accompanying GitHub repository to support transparency and reproducibility.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Logical Observation Identifiers Names and Codes (LOINC) conversion map.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="420"/>
            <col width="200"/>
            <col width="380"/>
            <thead>
              <tr valign="bottom">
                <td>LOINC code</td>
                <td>Unit (SNOMED<sup>a</sup>)</td>
                <td>Corrected LOINC code</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Platelets (#/volume) in blood (26515-7)</td>
                <td>fL (258775009)</td>
                <td>Platelet (entitic mean volume) in blood (28542-9)</td>
              </tr>
              <tr valign="top">
                <td>Glucose (mass/volume) in blood (26515-7)</td>
                <td>mEq/L (258865000)</td>
                <td>Glucose (moles/volume) in blood (15074-8)</td>
              </tr>
              <tr valign="top">
                <td>Glucose (mass/volume) in blood (26515-7)</td>
                <td>mmol/L (258813002)</td>
                <td>Glucose (moles/volume) in blood (15074-8)</td>
              </tr>
              <tr valign="top">
                <td>Kappa light chains (mass/volume) in serum or plasma (11050-2)</td>
                <td>Percentage (118582008)</td>
                <td>Kappa lymphocytes/lymphocytes in blood (17096-9)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>SNOMED: Systematized Nomenclature of Medicine.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>The reasonable range map defines metadata about a single LOINC code, including its assigned correct unit of measure, a minimum and maximum value that the laboratory test can reasonably take, and the mean and median of records with that LOINC code and unit across all 4 datasets. The correct unit of measure for each LOINC code was determined using the “example_unit” supplied in the official LOINC distribution. These units were mapped to the corresponding SNOMED codes. For LOINC codes that listed more than one example unit, we examined the empirical distribution of units observed in our dataset and selected the unit with the highest frequency. This made the choice of the correct unit data driven and ensured that the process could be consistently reproduced in any system. If Unified Code for Units of Measure (UCUM) units are preferred, LOINC also provides “example_ucum_units,” which can be incorporated similarly. Minimum and maximum reasonable values for each LOINC code were defined by estimating the empirical distribution of the data through quantiles of 0.005, 0.025, 0.16, 0.5 (median), 0.84, 0.975, and 0.995. The range was set at or near the highest and lowest of those quantiles, providing broad yet data-anchored thresholds for plausibility checking.</p>
        <p>This knowledge table includes the following computable fields: “loinc_code, loinc_name,” “unit_code,” “unit_name,” “min_reasonable,” “max_reasonable,” “mean,” and “median.” The primary key for this table is the “loinc_code.” A readability-optimized version is shown in <xref ref-type="table" rid="table2">Table 2</xref>, whereas the complete computable version is provided in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> and the GitHub repository.</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Reasonable range map.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="380"/>
            <col width="250"/>
            <col width="170"/>
            <col width="100"/>
            <col width="100"/>
            <thead>
              <tr valign="bottom">
                <td>LOINC<sup>a</sup> code</td>
                <td>Unit (SNOMED<sup>b</sup>)</td>
                <td>Reasonable range</td>
                <td>Median</td>
                <td>Mean</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Platelets (#/volume) in blood (26515-7)</td>
                <td>×10(3)/mcL (1287856009)</td>
                <td>1-800</td>
                <td>223.5</td>
                <td>215.0</td>
              </tr>
              <tr valign="top">
                <td>Glucose (mass/volume) in blood (2339-0)</td>
                <td>mg/dL (258797006)</td>
                <td>40-400</td>
                <td>138.8</td>
                <td>121</td>
              </tr>
              <tr valign="top">
                <td>Kappa light chains (mass/volume) in serum or plasma (11050-2)</td>
                <td>mg/L (258796002)</td>
                <td>0.1-5000</td>
                <td>68.7</td>
                <td>25.9</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>LOINC: Logical Observation Identifiers Names and Codes.</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>SNOMED: Systematized Nomenclature of Medicine.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>The unit multiplier map relates a correct unit to a synonymous, convertible, or incorrect unit along with a multiplier value, an additive scalar value, and a description of the relationship between the 2 units (eg, incorrect, synonym, or convertible). The scalar value is only used for temperature conversions. An empty “incorrect unit” represents a null unit field and is used to populate absent units. This knowledge table includes the following computable fields: “incorrect_unit_code,” “incorrect_unit_name,” “correct_unit_code,” “correct_unit_name,” “multiplier,” “scalar_constant,” and “multiplier_type.” The primary key is the composite of “incorrect_unit_code,” “correct_unit_code,” and “multiplier_type.” A readability-optimized version is shown in <xref ref-type="table" rid="table3">Table 3</xref>, with the full computable version available in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> and the GitHub repository.</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Unit multiplier map.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="230"/>
            <col width="250"/>
            <col width="130"/>
            <col width="90"/>
            <col width="300"/>
            <thead>
              <tr valign="bottom">
                <td>Incorrect unit (SNOMED<sup>a</sup>)</td>
                <td>Correct unit (SNOMED)</td>
                <td>Multiplier</td>
                <td>Scalar</td>
                <td>Multiplier type (description)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>&lt;null&gt;</td>
                <td>×10(3)/mcL (1287856009)</td>
                <td>1</td>
                <td>0</td>
                <td>“nullfill” (unit absent)</td>
              </tr>
              <tr valign="top">
                <td>10*9/L (277288007)</td>
                <td>×10(3)/mcL (1287856009)</td>
                <td>1</td>
                <td>0</td>
                <td>“synonym”</td>
              </tr>
              <tr valign="top">
                <td>cells/µL (258878000)</td>
                <td>×10(3)/mcL (1287856009)</td>
                <td>0.001</td>
                <td>0</td>
                <td>“unit_conversion” (convertible unit)</td>
              </tr>
              <tr valign="top">
                <td>cells/µL (258878000)</td>
                <td>×10(3)/mcL (1287856009)</td>
                <td>1</td>
                <td>0</td>
                <td>“unit_typo” (known unit error)</td>
              </tr>
              <tr valign="top">
                <td>g/dL (258795003)</td>
                <td>mg/dL (258797006)</td>
                <td>1000</td>
                <td>0</td>
                <td>“unit_conversion” (convertible unit)</td>
              </tr>
              <tr valign="top">
                <td>g/dL (258795003)</td>
                <td>mg/dL (258797006)</td>
                <td>1</td>
                <td>0</td>
                <td>“unit_typo” (known unit error)</td>
              </tr>
              <tr valign="top">
                <td>g/L (258794004)</td>
                <td>mg/dL (258797006)</td>
                <td>1</td>
                <td>0</td>
                <td>“unit_conversion” (convertible unit)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>SNOMED: Systematized Nomenclature of Medicine.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>The framework logic is shown in <xref rid="figure1" ref-type="fig">Figure 1</xref>. Conformance to the selected “correct” unit is checked against the laboratory reasonable range (LRR) table entry. If the unit does not conform, the LCM provides a better LOINC code if one is known for the unit that is present in the record. In the second transformation, the unit is altered according to the unit multiplier map, normalized if it is a synonym, converted using a multiplier value, or swapped for the correct unit if it is a known error pattern or absent altogether. For example, the LOINC code 1920-8 (glucose [mass/volume] in blood) has the correct unit “mg/dL.” If a record with this LOINC code has the unit “mmol/L,” the LOINC code is changed using the LCM to 15074-8 (glucose [moles/volume] in blood). The process is only 2 steps, although not all records require both. Records may begin with LOINC code–unit conformance and skip the process altogether. Some require only LOINC conversion, some require only unit normalization, and many require LOINC conversion and then unit normalization.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Framework logic and knowledge table use. LCM: Logical Observation Identifiers Names and Codes (LOINC) conversion map; LRR: laboratory reasonable range; SNOMED: Systematized Nomenclature of Medicine; UMM: unit multiplier map.</p>
          </caption>
          <graphic xlink:href="medinform_v14i1e81254_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>Each of these transformations only proceeds when the record’s result value falls within the reasonable range associated with the LOINC code–unit pair that would appear in the transformed record. These ranges were selected using known correct data and designed to capture most possible values in that laboratory’s value distribution.</p>
        <p>In rare instances, the system must select between 2 possible transformations for the same record. This might occur in the situation visible in rows 5 and 6 in <xref ref-type="table" rid="table3">Table 3</xref> when trying to convert from g/dL to mg/dL. We identified a common error in many records in which a unit’s prefix was absent. A g/dL unit might be a simple data entry error at the source, or it may, in fact, require conversion by multiplying the result by 1000. The system uses the reasonable ranges to determine which of these 2 situations is more likely. If the reasonable ranges are not disparate enough to discern which transformation is required, proximity to the median of the target LOINC code–unit’s distribution is compared. The transformation resulting in a record closer to that median is selected. If the compared laboratory results have medians of 0, distance from the mean is used.</p>
        <p>To evaluate the success of each transformation, the value distribution of the output for any individual transformation was compared with the value distribution of known correct data with that LOINC code–unit pair. If the distribution of the numeric result of the transformed data matched that of known correct data, it was considered successful. If the distribution did not match, the discrepancy was investigated. These investigations led to the discovery of common error patterns that could then be accounted for in the next iteration by adding to the 3 knowledge tables.</p>
        <p>To summarize, the precedence of the rules described above is as follows:</p>
        <list list-type="order">
          <list-item>
            <p>LRR conformance check—if the LOINC code–unit pair conforms to the LRR table, no transformation is applied.</p>
          </list-item>
          <list-item>
            <p>LOINC conversion (LCM)—if the unit is incompatible with the LOINC code, the framework first selects the appropriate LOINC code.</p>
          </list-item>
          <list-item>
            <p>Unit normalization or conversion (unit multiplier map)—after the LOINC code is finalized, unit normalization or conversion is applied.</p>
          </list-item>
          <list-item>
            <p>Range validation—a transformation is only accepted if the resulting value falls within the target LOINC code’s reasonable range.</p>
          </list-item>
          <list-item>
            <p>Conflict resolution—when more than one unit transformation falls within the reasonable range, the system resolves this by checking proximity to the median of the known correct distribution or proximity to the mean when the distribution median is 0.</p>
          </list-item>
        </list>
        <p>A few examples of LOINC code–unit incongruencies and framework processing are outlined in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p>
        <p>Provenance is maintained within each transformed record in an attribute that acts as a ledger of each transformation that alters that record. This attribute is an array of objects that includes a descriptive string that details what features of the record were adjusted and what features were used to justify that adjustment for human readability. For computability, “object” includes the adjusted attribute names and preadjustment values for those attributes, ensuring transparency to downstream users and reversibility if necessary.</p>
        <p>A summary of the steps for this framework is illustrated in <xref rid="figure2" ref-type="fig">Figure 2</xref>.</p>
        <p><xref rid="figure3" ref-type="fig">Figure 3</xref> shows an example of LOINC code–unit pairs before transformation, each step of the transformation, and the final output after transformation.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Summary of the framework. LOINC: Logical Observation Identifiers Names and Codes; SNOMED: Systematized Nomenclature of Medicine.</p>
          </caption>
          <graphic xlink:href="medinform_v14i1e81254_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Example of Logical Observation Identifiers Names and Codes (LOINC) code–unit pairs before and after transformation.</p>
          </caption>
          <graphic xlink:href="medinform_v14i1e81254_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Ethical Considerations</title>
        <p>This study used retrospective, deidentified data collected for clinical purposes. All data were fully anonymized before analysis, and unique patient identifiers were removed. Analysis of deidentified secondary data does not constitute human subjects research and does not require formal review or approval by an institutional review board, and thus, no institutional review board approval number was sought. Because only deidentified data were used, informed consent from individual patients was not required. Privacy and confidentiality were maintained throughout the study in accordance with all applicable regulations.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Dataset Collection: Overview and LOINC Coverage</title>
        <p>All 4 sets of laboratory data underwent the LOINC code and unit correction process, and the proportion of records exhibiting each LOINC code–unit pattern was calculated both before and after the framework execution. A total of 428 LOINC codes were included in this study, chosen based on their prevalence in the ConcertAI database. Not all datasets contained all 428 LOINC codes. These LOINC codes accounted for 6.34 billion records in the ConcertAI database and 880 million, 2.98 billion, and 4.64 billion records in the source-specific datasets from sources 1, 2, and 3, respectively.</p>
      </sec>
      <sec>
        <title>System Design</title>
        <sec>
          <title>Impact of Framework on Unit Correction</title>
          <p>Before the application of the framework, 73.1% (4,634,610,173/6,337,101,453) records in the ConcertAI dataset with these LOINC codes had the correct unit as assigned by the LRR table. Following the application, this increased to 99.7% (6,322,375,200/6,341,230,213) of records. A similar trend was observed in each of the EHR-specific datasets: 78.5% (691,315,390/880,250,137) to 99.8% (879,626,472/881,157,852), 71.4% (2,132,455,936/2,985,465,124) to 99.8% (2,982,319,644/2,988,173,959), and 63.3% (2,936,710,502/4,640,432,294) to 99.6% (4,618,714,114/4,638,862,412) for sources 1, 2, and 3, respectively. The system increased the completion rate of units, defined as the proportion of records with nonmissing units, from 92.7% (5,879,071,858/6,341,230,213) to 99.8% (6,331,923,060/6,341,230,213) in the ConcertAI dataset and similarly in the other 3 datasets: 92.5% (814,867,241/881,157,852) to 100.0% (880,816,133/881,157,852), 94.4% (2,822,107,252/2,988,173,959) to 99.9% (2,986,624,027/2,988,173,959), and 91.7% (4,254,054,966/4,638,862,412) to 99.9% (4,632,935,919/4,638,862,412) for sources 1, 2, and 3, respectively. Because the framework assigns validated units to previously missing values, improvements in the correct unit rate reflect both corrections to misassigned units and the assignment of correct units to previously missing entries. As a result, the correct unit and completion rate metrics are related but not redundant: the correct unit rate captures accuracy among all populated units, whereas the completion rate captures overall presence of any unit.</p>
        </sec>
        <sec>
          <title>LOINC-Level Quality Threshold</title>
          <p>Not all LOINC codes start with the same degree of incorrectness. To evaluate the proportion of LOINC codes that reached specific data quality thresholds before and after framework application, records with each LOINC code were evaluated for unit correctness, and the number of LOINC codes passing certain unit correctness proportion thresholds was counted. These counts for each dataset are shown in <xref rid="figure4" ref-type="fig">Figure 4</xref>. Of the 428 LOINC codes, the number meeting the 99% threshold of unit correctness in the full ConcertAI dataset increased from 125 (29.2%) to 370 (86.4%). Similar improvements were observed across the 3 source datasets, which contained different total proportions of evaluated LOINC codes: 83.9% (359/428) of LOINC codes in source 1, a total of 93.2% (399/428) of LOINC codes in source 2, and 88.6% (379/428) of LOINC codes in source 3. In source 1, the proportion meeting the 99% threshold increased from 42.9% (154/359) to 86.4% (310/359); in source 2, it increased from 30.8% (123/399) to 87.7% (350/399); and in source 3, it increased from 16.9% (64/379) to 79.7% (302/379).</p>
          <fig id="figure4" position="float">
            <label>Figure 4</label>
            <caption>
              <p>Number of Logical Observation Identifiers Names and Codes (LOINC)–coded records meeting unit correctness thresholds.</p>
            </caption>
            <graphic xlink:href="medinform_v14i1e81254_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Illustrative Subset Analysis</title>
          <p>To provide a more detailed view of the framework’s impact, <xref rid="figure5" ref-type="fig">Figure 5</xref> presents a closer look at 20 specific LOINC codes. These codes were selected for their varied domains and types of incongruencies in the starting data.</p>
          <p>Records with each of these 20 LOINC codes had their unit classified as correct, synonymous to correct, absent, or incorrect. Incorrect units were subclassified as incorrect and suggestive of a LOINC change, incorrect but convertible to the correct unit through a multiplier, or incorrect but not convertible. These unit categories represent the types of errors that this system is designed to correct. The proportions in each category were calculated before and after the framework application and are shown in <xref rid="figure5" ref-type="fig">Figure 5</xref> for each system.</p>
          <p>A detailed report showing the proportion of correctness for each LOINC code across all 4 datasets before and after the framework application is available in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>.</p>
          <fig id="figure5" position="float">
            <label>Figure 5</label>
            <caption>
              <p>Error type proportions for specific Logical Observation Identifiers Names and Codes (LOINC) codes. GFR: glomerular filtration rate; HPF: high power field; MDRD: Modification of Diet in Renal Disease; SA: surface area; WBC: white blood cell.</p>
            </caption>
            <graphic xlink:href="medinform_v14i1e81254_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>The proposed normalization framework significantly improved LOINC code–unit congruence and unit absentia across all evaluated datasets, demonstrating generalizability to any clinical data system using standard medical terminologies for observation and unit representation. The method improved LOINC code–unit congruence overall in the ConcertAI laboratory dataset from 73.1% (4,634,610,173/6,337,101,453) to 99.7% (6,322,375,200/6,341,230,213), with similar trends in the other 3 data sources. The method and knowledge tables were developed using the ConcertAI data and applied to these independent datasets to demonstrate generalizability. To the best of our knowledge, this framework is the first of its kind to address 2 key gaps: the absence of a system-agnostic process for cleaning multisource laboratory data for secondary use [<xref ref-type="bibr" rid="ref18">18</xref>] and an approach tailored to RWD. RWD, where data quality is both challenging [<xref ref-type="bibr" rid="ref25">25</xref>] and critical to data usability, may lack source-specific semantics such as the local observation concept display name. This would impede the use of a standardization process designed to take advantage of those strings [<xref ref-type="bibr" rid="ref18">18</xref>].</p>
      </sec>
      <sec>
        <title>Mechanism of Framework</title>
        <p>The process, driven by 3 small, shareable knowledge tables, uses the observation concept (LOINC), the unit concept (SNOMED), and the numeric result as input. It first adjusts the LOINC code if the unit suggests a better LOINC code. It then normalizes the unit to a predetermined preferred unit for that LOINC code by filling null units, converting related units, or correcting units with overt errors. All transformations only proceed when the numeric result aligns with the predetermined distribution for the target LOINC code–unit pair. This “reasonable range” constraint addresses a shortcoming in existing proposed methodologies [<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref21">21</xref>] that handle units without consideration of the numeric result. This range can be used to flag records that fall outside the reasonable distribution for exclusion from analysis or closer review.</p>
      </sec>
      <sec>
        <title>Impact on Data Quality Dimensions</title>
        <p>Ensuring that laboratory values fall within a reasonable distribution contributes to accuracy, or the degree to which the data represent the true value of what is intended to be measured, and plausibility, 2 prominent dimensions [<xref ref-type="bibr" rid="ref25">25</xref>] of RWD quality. The results demonstrate improvements across a number of established quality dimensions [<xref ref-type="bibr" rid="ref25">25</xref>] other than accuracy and plausibility, including conformance, consistency, completeness, and provenance [<xref ref-type="bibr" rid="ref25">25</xref>-<xref ref-type="bibr" rid="ref29">29</xref>]. The technique primarily addresses conformance to the approved LOINC code–unit pair set by the LRR table and consistency of semantic representation regardless of data source. Completeness is improved by populating the unit when null. This contextually appropriate population of absent units has not been addressed in prior studies of similar techniques [<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref21">21</xref>].</p>
      </sec>
      <sec>
        <title>Data Provenance</title>
        <p>Data provenance is recognized as critical metadata for systems transmitting, storing, or using health data [<xref ref-type="bibr" rid="ref30">30</xref>]. Records in RWD pipelines may undergo many transformations on their path to integration into a single dataset, and these transformations must all be tracked to enable error correction and improve trustworthiness with downstream consumers. Data provenance has been defined in many ways [<xref ref-type="bibr" rid="ref31">31</xref>], and there are established specifications for recording provenance in health care data, such as the FHIR Provenance resource [<xref ref-type="bibr" rid="ref32">32</xref>] based on the World Wide Web Consortium provenance specification [<xref ref-type="bibr" rid="ref33">33</xref>]. Establishing the best method for provenance tracking within a system requires an assessment of the stakeholders for those data. The stakeholders for the transformations described in this paper were internal data analysts, informaticists, and quality assurance engineers. Provenance is maintained within each transformed record in an attribute that acts as a ledger of each transformation that altered that record. This attribute is an array of structures that include a descriptive, human-readable string detailing the transformation, as well as the altered attributes and preadjustment values that those attributes took. By consulting this array, transformations are fully reversible, original values are preserved, and a complete audit trail is available to support transparency and verification by downstream users.</p>
      </sec>
      <sec>
        <title>Clinical and Research Relevance</title>
        <p>Laboratory data quality and usability are critical in systems handling oncology data, where these results are used to select and monitor therapies and assess disease severity and progression [<xref ref-type="bibr" rid="ref34">34</xref>]. LOINC code–unit incongruence, unit absentia, and lack of unit standardization put an undue burden on any analyst or application attempting to use laboratory data for clinical decision support, retrospective studies, or clinical trial eligibility [<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref36">36</xref>]. Improving unit completeness at the source is challenging because units are often inconsistently documented or transmitted in EHR systems [<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref38">38</xref>]. Potential upstream improvements could include enforcing unit capture at the point of entry, not allowing free-text entry of units, ensuring consistent transmission in Health Level Seven and FHIR messages, or applying unit standardization at the health system level before data export. However, such approaches depend on local workflows and vendor configurations and cannot be guaranteed for multisource RWD. Consequently, postcodification harmonization frameworks such as the one described in this paper provide a practical and reproducible solution. The technique outlined in this paper presents a minimal set of logical steps to correct these problems within the pipeline of a multisourced data system handling RWD. Enforcing semantic consistency between LOINC and unit improves data usability [<xref ref-type="bibr" rid="ref24">24</xref>] but can also foster better data exchange [<xref ref-type="bibr" rid="ref39">39</xref>] between systems by reducing semantic differences. Ultimately, this framework ensures that laboratory data are both accurate and complete, enabling faster data-driven decisions that can enhance patient care, data exchange, clinical trials, and RWD analysis.</p>
      </sec>
      <sec>
        <title>Limitations and Future Work</title>
        <p>The technique is presently limited by its capacity to correct the body system, which will reduce effectiveness for laboratory tests in which the potential body systems are relatively evenly distributed and share similar units when tested in either sample type. Information related to the body system can be present in the observation name but also in the panel name, the order name, discretely in another attribute in the laboratory result, or in other observations related to the result in question. Efforts are currently underway to evolve the process by incorporating panel or order-related information. The choice of SNOMED for unit may have been less ideal than UCUM [<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref41">41</xref>], which is more flexible and more closely aligned with LOINC [<xref ref-type="bibr" rid="ref42">42</xref>], which suggests a UCUM unit for some of its concepts. The FHIR [<xref ref-type="bibr" rid="ref43">43</xref>] and Interoperability Standards Platform [<xref ref-type="bibr" rid="ref44">44</xref>] also suggest that UCUM be used to represent units. However, the framework is easily adaptable by simply replacing the SNOMED codes used in the knowledge tables with UCUM codes without requiring any further changes in script. In addition, the steps described in this paper specifically address quantitative LOINC codes and require modification to be applicable to qualitative scale–type LOINC codes. Another limitation is that the creation of the knowledge tables requires clinical and terminologist expertise to recognize errors and prepare the tables, as well as a large dataset to prepare laboratory value distributions. This framework is designed for secondary use in RWD, where inconsistencies, missing values, and heterogeneous coding practices complicate analysis, and is not intended for integration into direct point-of-care clinical decision-making. Therefore, its use does not pose any direct safety risk to patients. The harmonization of LOINC code–unit combinations and the potential flagging of outlier values can influence downstream analyses such as cohort definitions or outlier detection. It enables data analysts to use laboratory data that would otherwise have required a significant time investment to clean. The primary aim of these corrections is to reduce inconsistencies and facilitate reliable data aggregation for secondary research purposes. Future work will focus on integrating the framework with emerging technologies such as artificial intelligence.</p>
      </sec>
      <sec>
        <title>Practical Implementation</title>
        <p>To support practical implementation, we have released a starter kit supporting normalization of 146 LOINC codes from blood or serum, covering the “Hematology and cell counts” class and “Chemistry” glucose codes. It has 3 knowledge tables and an accompanying Python script available via a public GitHub repository [<xref ref-type="bibr" rid="ref45">45</xref>]. The knowledge tables incorporate LOINC and SNOMED, which are maintained in multiple languages, allowing the tables to be used with datasets in different linguistic contexts. The numeric values in the tables are language independent and do not require conversion, supporting their generalizability to different languages. The Python script executing the rules takes FHIR Observation resources as input, and 6 example resources are provided.</p>
        <p>Currently, the framework leverages SNOMED codes for units. However, the design is adaptable: implementers preferring UCUM codes can replace SNOMED codes with UCUM codes in the tables without any modification to the transformation script, allowing for seamless adoption of alternative unit standards. This flexibility ensures that the framework can be applied in diverse institutional or research contexts with minimal overhead.</p>
        <p>A key component of the framework is its structured provenance tracking, which records all transformations applied to each laboratory record in a way that allows the original data to be reconstructed if needed. For each modification, information such as the applied rule, details of the transformation, which fields were changed, the original values, and the reference values used in the conversion is systematically captured. Collectively, these elements enable full traceability, providing a clear lineage from the transformed value back to the original measurement. This approach not only supports reproducibility and auditing but also ensures transparency, allowing researchers and data analysts to confidently interpret and validate the standardized data while retaining the ability to recover the source information.</p>
        <p>By combining reproducible tables, adaptable unit standards, and robust provenance tracking, the framework provides a practical pathway for implementing consistent laboratory data harmonization in diverse settings while maintaining the transparency and traceability of each transformation.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>As the demand for multisourced RWD datasets grows, ensuring data quality and semantic consistency becomes increasingly vital. Persistent challenges regarding SI in laboratory data continue to limit the full potential of these data assets. Common issues include missing or incorrect units and misassigned LOINC codes, all of which can hinder integration and analysis. This framework addresses these challenges by systematically identifying and correcting discrepancies in quantitative laboratory data and has been shown to improve unit accuracy to above 99% for all evaluated datasets. It enables scalable, system-agnostic normalization of laboratory data, addressing critical gaps in several data quality dimensions. By improving laboratory data quality at the foundational level, it strengthens the reliability of RWD for data analysis, insight generation, and utility in software applications.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Detailed process for building the 3 knowledge tables described in system design, that is, the reasonable range map, unit multiplier map, and Logical Observation Identifiers Names and Codes conversion map.</p>
        <media xlink:href="medinform_v14i1e81254_app1.docx" xlink:title="DOCX File , 91 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>Detailed report on the proportion of correct units before and after application of the framework, stratified by Logical Observation Identifiers Names and Codes code and by data source.</p>
        <media xlink:href="medinform_v14i1e81254_app2.xlsx" xlink:title="XLSX File  (Microsoft Excel File), 112 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">EHR</term>
          <def>
            <p>electronic health record</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">FHIR</term>
          <def>
            <p>Fast Healthcare Interoperability Resources</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">LCM</term>
          <def>
            <p>Logical Observation Identifiers Names and Codes conversion map</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">LOINC</term>
          <def>
            <p>Logical Observation Identifiers Names and Codes</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">LRR</term>
          <def>
            <p>laboratory reasonable range</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">RWD</term>
          <def>
            <p>real-world data</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">SI</term>
          <def>
            <p>semantic interoperability</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">SNOMED</term>
          <def>
            <p>Systematized Nomenclature of Medicine</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">UCUM</term>
          <def>
            <p>Unified Code for Units of Measure</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>The authors would like to express their sincere gratitude to the ConcertAI reviewers Sheenu Chandwani, Jannette Hanna, Jennifer Rider, and Jocelyn Benson for their constructive feedback and insightful comments, which greatly enhanced the quality of this paper.</p>
    </ack>
    <notes>
      <sec>
        <title>Funding</title>
        <p>ConcertAI, LLC, sponsored this study and provided financial support for the conduct of this research and preparation of this paper.</p>
      </sec>
    </notes>
    <notes>
      <sec>
        <title>Data Availability</title>
        <p>The datasets generated or analyzed during this study are not publicly available due to proprietary and licensing restrictions but may be available from ConcertAI, LLC, upon reasonable request and subject to applicable data use agreements and approval processes [<xref ref-type="bibr" rid="ref46">46</xref>].</p>
      </sec>
    </notes>
    <fn-group>
      <fn fn-type="conflict">
        <p>PN and TS are employed by ConcertAI, LLC.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Cheng</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Di</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zeng</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Jin</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Han</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Zeng</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Multimodal integration in health care: development with applications in disease management</article-title>
          <source>J Med Internet Res</source>
          <year>2025</year>
          <month>08</month>
          <day>21</day>
          <volume>27</volume>
          <fpage>e76557</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2025//e76557/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/76557</pub-id>
          <pub-id pub-id-type="medline">40840463</pub-id>
          <pub-id pub-id-type="pii">v27i1e76557</pub-id>
          <pub-id pub-id-type="pmcid">PMC12370271</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Panagiotakos</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Real-world data: a brief review of the methods, applications, challenges and opportunities</article-title>
          <source>BMC Med Res Methodol</source>
          <year>2022</year>
          <month>11</month>
          <day>05</day>
          <volume>22</volume>
          <issue>1</issue>
          <fpage>287</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedresmethodol.biomedcentral.com/articles/10.1186/s12874-022-01768-6"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12874-022-01768-6</pub-id>
          <pub-id pub-id-type="medline">36335315</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12874-022-01768-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC9636688</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dang</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Real-world evidence: a primer</article-title>
          <source>Pharmaceut Med</source>
          <year>2023</year>
          <month>01</month>
          <day>05</day>
          <volume>37</volume>
          <issue>1</issue>
          <fpage>25</fpage>
          <lpage>36</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/36604368"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s40290-022-00456-6</pub-id>
          <pub-id pub-id-type="medline">36604368</pub-id>
          <pub-id pub-id-type="pii">10.1007/s40290-022-00456-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC9815890</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wilson</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bock</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>The benefit of using both claims data and electronic medical record data in health care analysis</article-title>
          <source>OPTUM</source>
          <year>2025</year>
          <access-date>2025-04-29</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.optum.com/content/dam/optum/resources/whitePapers/Benefits-of-using-both-claims-and-EMR-data-in-HC-analysis-WhitePaper-ACS.pdf">https://www.optum.com/content/dam/optum/resources/whitePapers/Benefits-of-using-both-claims-and-EMR-data-in-HC-analysis-WhitePaper-ACS.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>An</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Lim</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Challenges for data quality in the clinical data life cycle: systematic review</article-title>
          <source>J Med Internet Res</source>
          <year>2025</year>
          <month>04</month>
          <day>23</day>
          <volume>27</volume>
          <fpage>e60709</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2025//e60709/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/60709</pub-id>
          <pub-id pub-id-type="medline">40266662</pub-id>
          <pub-id pub-id-type="pii">v27i1e60709</pub-id>
          <pub-id pub-id-type="pmcid">PMC12059509</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Abedjan</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Chu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Deng</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Fernandez</surname>
              <given-names>RC</given-names>
            </name>
            <name name-style="western">
              <surname>Ilyas</surname>
              <given-names>IF</given-names>
            </name>
            <name name-style="western">
              <surname>Ouzzani</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Papotti</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Stonebraker</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Detecting data errors: where are we and what needs to be done?</article-title>
          <source>Proc VLDB Endow</source>
          <year>2016</year>
          <month>08</month>
          <day>1</day>
          <volume>9</volume>
          <issue>12</issue>
          <fpage>993</fpage>
          <lpage>1004</lpage>
          <pub-id pub-id-type="doi">10.14778/2994509.2994518</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Munappy</surname>
              <given-names>AR</given-names>
            </name>
            <name name-style="western">
              <surname>Bosch</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Olsson</surname>
              <given-names>HH</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Morisio</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Torchiano</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Jedlitschka</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Data pipeline management in practice: challenges and opportunities</article-title>
          <source>Product-Focused Software Process Improvement</source>
          <year>2020</year>
          <publisher-loc>Cham, Switzerland</publisher-loc>
          <publisher-name>Springer</publisher-name>
          <fpage>168</fpage>
          <lpage>84</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>de Mello</surname>
              <given-names>BH</given-names>
            </name>
            <name name-style="western">
              <surname>Rigo</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>da Costa</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>da Rosa Righi</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Donida</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Bez</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Schunke</surname>
              <given-names>LC</given-names>
            </name>
          </person-group>
          <article-title>Semantic interoperability in health records standards: a systematic literature review</article-title>
          <source>Health Technol (Berl)</source>
          <year>2022</year>
          <volume>12</volume>
          <issue>2</issue>
          <fpage>255</fpage>
          <lpage>72</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35103230"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s12553-022-00639-w</pub-id>
          <pub-id pub-id-type="medline">35103230</pub-id>
          <pub-id pub-id-type="pii">639</pub-id>
          <pub-id pub-id-type="pmcid">PMC8791650</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kelly</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Das</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ren</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Warnekar</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Automated mapping of real-world oncology laboratory data to LOINC</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2021</year>
          <volume>2021</volume>
          <fpage>611</fpage>
          <lpage>20</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35308998"/>
          </comment>
          <pub-id pub-id-type="medline">35308998</pub-id>
          <pub-id pub-id-type="pii">3576978</pub-id>
          <pub-id pub-id-type="pmcid">PMC8861721</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="web">
          <article-title>FHIR® - Fast Healthcare Interoperability Resources®</article-title>
          <source>eCQI Resource Center</source>
          <access-date>2025-04-30</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ecqi.healthit.gov/fhir?qt-tabs_fhir=about">https://ecqi.healthit.gov/fhir?qt-tabs_fhir=about</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vorisek</surname>
              <given-names>CN</given-names>
            </name>
            <name name-style="western">
              <surname>Lehne</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Klopfenstein</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Mayer</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Bartschke</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Haese</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Thun</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Fast Healthcare Interoperability Resources (FHIR) for interoperability in health research: systematic review</article-title>
          <source>JMIR Med Inform</source>
          <year>2022</year>
          <month>07</month>
          <day>19</day>
          <volume>10</volume>
          <issue>7</issue>
          <fpage>e35724</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2022/7/e35724/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/35724</pub-id>
          <pub-id pub-id-type="medline">35852842</pub-id>
          <pub-id pub-id-type="pii">v10i7e35724</pub-id>
          <pub-id pub-id-type="pmcid">PMC9346559</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Richesson</surname>
              <given-names>RL</given-names>
            </name>
            <name name-style="western">
              <surname>Campion</surname>
              <given-names>TR</given-names>
            </name>
            <name name-style="western">
              <surname>Knosp</surname>
              <given-names>BM</given-names>
            </name>
            <name name-style="western">
              <surname>Hanauer</surname>
              <given-names>DA</given-names>
            </name>
          </person-group>
          <article-title>LOINC implementation approaches in academic medical research centers - results from a survey of CTSA sites</article-title>
          <source>J Clin Transl Sci</source>
          <year>2025</year>
          <volume>9</volume>
          <issue>1</issue>
          <fpage>e223</fpage>
          <pub-id pub-id-type="doi">10.1017/cts.2025.10151</pub-id>
          <pub-id pub-id-type="medline">41111944</pub-id>
          <pub-id pub-id-type="pii">S2059866125101519</pub-id>
          <pub-id pub-id-type="pmcid">PMC12529624</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="web">
          <source>LOINC</source>
          <access-date>2025-04-29</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://loinc.org">https://loinc.org</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Drenkhahn</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Ingenerf</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>The LOINC content model and its limitations of usage in the laboratory domain</article-title>
          <source>Stud Health Technol Inform</source>
          <year>2020</year>
          <month>06</month>
          <day>16</day>
          <volume>270</volume>
          <fpage>437</fpage>
          <lpage>42</lpage>
          <pub-id pub-id-type="doi">10.3233/SHTI200198</pub-id>
          <pub-id pub-id-type="medline">32570422</pub-id>
          <pub-id pub-id-type="pii">SHTI200198</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>MC</given-names>
            </name>
            <name name-style="western">
              <surname>Vreeman</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Huff</surname>
              <given-names>SM</given-names>
            </name>
          </person-group>
          <article-title>Investigating the semantic interoperability of laboratory data exchanged using LOINC codes in three large institutions</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2011</year>
          <volume>2011</volume>
          <fpage>805</fpage>
          <lpage>14</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/22195138"/>
          </comment>
          <pub-id pub-id-type="medline">22195138</pub-id>
          <pub-id pub-id-type="pmcid">PMC3243154</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fidahussein</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Vreeman</surname>
              <given-names>DJ</given-names>
            </name>
          </person-group>
          <article-title>A corpus-based approach for automated LOINC mapping</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2014</year>
          <volume>21</volume>
          <issue>1</issue>
          <fpage>64</fpage>
          <lpage>72</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/23676247"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/amiajnl-2012-001159</pub-id>
          <pub-id pub-id-type="medline">23676247</pub-id>
          <pub-id pub-id-type="pii">amiajnl-2012-001159</pub-id>
          <pub-id pub-id-type="pmcid">PMC3912728</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Khan</surname>
              <given-names>AN</given-names>
            </name>
            <name name-style="western">
              <surname>Griffith</surname>
              <given-names>SP</given-names>
            </name>
            <name name-style="western">
              <surname>Moore</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Russell</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Rosario</surname>
              <given-names>AC Jr</given-names>
            </name>
            <name name-style="western">
              <surname>Bertolli</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Standardizing laboratory data by mapping to LOINC</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2006</year>
          <volume>13</volume>
          <issue>3</issue>
          <fpage>353</fpage>
          <lpage>5</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/16501183"/>
          </comment>
          <pub-id pub-id-type="doi">10.1197/jamia.M1935</pub-id>
          <pub-id pub-id-type="medline">16501183</pub-id>
          <pub-id pub-id-type="pii">M1935</pub-id>
          <pub-id pub-id-type="pmcid">PMC1513656</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Parr</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Shotwell</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Jeffery</surname>
              <given-names>AD</given-names>
            </name>
            <name name-style="western">
              <surname>Lasko</surname>
              <given-names>TA</given-names>
            </name>
            <name name-style="western">
              <surname>Matheny</surname>
              <given-names>ME</given-names>
            </name>
          </person-group>
          <article-title>Automated mapping of laboratory tests to LOINC codes using noisy labels in a national electronic health record system database</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2018</year>
          <month>10</month>
          <day>01</day>
          <volume>25</volume>
          <issue>10</issue>
          <fpage>1292</fpage>
          <lpage>300</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/30137378"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocy110</pub-id>
          <pub-id pub-id-type="medline">30137378</pub-id>
          <pub-id pub-id-type="pii">5075874</pub-id>
          <pub-id pub-id-type="pmcid">PMC7646911</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>CZ</given-names>
            </name>
            <name name-style="western">
              <surname>Wales</surname>
              <given-names>DL</given-names>
            </name>
          </person-group>
          <article-title>Laboratory data standardization with SAS</article-title>
          <source>PharmaSUG</source>
          <year>2017</year>
          <access-date>2025-04-30</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://pharmasug.org/proceedings/2017/AD/PharmaSUG-2017-AD10.pdf">https://pharmasug.org/proceedings/2017/AD/PharmaSUG-2017-AD10.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vreeman</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Hook</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dixon</surname>
              <given-names>BE</given-names>
            </name>
          </person-group>
          <article-title>Learning from the crowd while mapping to LOINC</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2015</year>
          <month>11</month>
          <volume>22</volume>
          <issue>6</issue>
          <fpage>1205</fpage>
          <lpage>11</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/26224334"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocv098</pub-id>
          <pub-id pub-id-type="medline">26224334</pub-id>
          <pub-id pub-id-type="pii">ocv098</pub-id>
          <pub-id pub-id-type="pmcid">PMC4795577</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hao</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Valx: a system for extracting and structuring numeric lab test comparison statements from text</article-title>
          <source>Methods Inf Med</source>
          <year>2016</year>
          <month>05</month>
          <day>17</day>
          <volume>55</volume>
          <issue>3</issue>
          <fpage>266</fpage>
          <lpage>75</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/26940748"/>
          </comment>
          <pub-id pub-id-type="doi">10.3414/ME15-01-0112</pub-id>
          <pub-id pub-id-type="medline">26940748</pub-id>
          <pub-id pub-id-type="pii">15-01-0112</pub-id>
          <pub-id pub-id-type="pmcid">PMC5573874</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="web">
          <article-title>Results final report</article-title>
          <source>AHRQ HCUP</source>
          <access-date>2025-04-29</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://hcup-us.ahrq.gov/datainnovations/clinicaldata/3MSummaryResultsReportFinal.jsp">https://hcup-us.ahrq.gov/datainnovations/clinicaldata/3MSummaryResultsReportFinal.jsp</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Abhyankar</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Demner-Fushman</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>McDonald</surname>
              <given-names>CJ</given-names>
            </name>
          </person-group>
          <article-title>Standardizing clinical laboratory data for secondary use</article-title>
          <source>J Biomed Inform</source>
          <year>2012</year>
          <month>08</month>
          <volume>45</volume>
          <issue>4</issue>
          <fpage>642</fpage>
          <lpage>50</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(12)00065-2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2012.04.012</pub-id>
          <pub-id pub-id-type="medline">22561944</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(12)00065-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC3419308</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hauser</surname>
              <given-names>RG</given-names>
            </name>
            <name name-style="western">
              <surname>Quine</surname>
              <given-names>DB</given-names>
            </name>
            <name name-style="western">
              <surname>Ryder</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Campbell</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Unit conversions between LOINC codes</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2018</year>
          <month>02</month>
          <day>01</day>
          <volume>25</volume>
          <issue>2</issue>
          <fpage>192</fpage>
          <lpage>6</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/28637208"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocx056</pub-id>
          <pub-id pub-id-type="medline">28637208</pub-id>
          <pub-id pub-id-type="pii">3871185</pub-id>
          <pub-id pub-id-type="pmcid">PMC6251580</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Castellanos</surname>
              <given-names>EH</given-names>
            </name>
            <name name-style="western">
              <surname>Wittmershaus</surname>
              <given-names>BK</given-names>
            </name>
            <name name-style="western">
              <surname>Chandwani</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Raising the bar for real-world data in oncology: approaches to quality across multiple dimensions</article-title>
          <source>JCO Clin Cancer Inform</source>
          <year>2024</year>
          <month>01</month>
          <volume>8</volume>
          <fpage>e2300046</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/38241599"/>
          </comment>
          <pub-id pub-id-type="doi">10.1200/CCI.23.00046</pub-id>
          <pub-id pub-id-type="medline">38241599</pub-id>
          <pub-id pub-id-type="pmcid">PMC10807898</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="web">
          <article-title>Data quality framework for EU medicines regulation</article-title>
          <source>European Medicines Agency</source>
          <year>2023</year>
          <access-date>2025-04-30</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.ema.europa.eu/en/documents/regulatory-procedural-guideline/data-quality-framework-eu-medicines-regulation_en.pdf">https://www.ema.europa.eu/en/documents/regulatory-procedural-guideline/data-quality-framework-eu-medicines-regulation_en.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="web">
          <article-title>Real-world data: assessing electronic health records and medical claims data to support regulatory decision-making for drug and biological products</article-title>
          <source>U.S. Food &amp; Drug Administration</source>
          <year>2024</year>
          <month>7</month>
          <access-date>2025-04-30</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.fda.gov/regulatory-information/search-fda-guidance-documents/real-world-data-assessing-electronic-health-records-and-medical-claims-data-support-regulatory">https://www.fda.gov/regulatory-information/search-fda-guidance-documents/real-world-data-assessing-electronic-health-records-and-medical-claims-data-support-regulatory</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="web">
          <article-title>NICE real-world evidence framework</article-title>
          <source>National Institute for Health and Care Excellence</source>
          <year>2022</year>
          <access-date>2025-04-30</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.nice.org.uk/corporate/ecd9/chapter/assessing-data-suitability#assessing-data-suitability">https://www.nice.org.uk/corporate/ecd9/chapter/assessing-data-suitability#assessing-data-suitability</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Daniel</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Silcox</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Bryan</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Characterizing RWD quality and relevancy for regulatory purposes</article-title>
          <source>Duke-Margolis Center for Health Policy</source>
          <year>2018</year>
          <month>10</month>
          <day>1</day>
          <access-date>2025-04-28</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://healthpolicy.duke.edu/sites/default/files/2020-03/characterizing_rwd.pdf">https://healthpolicy.duke.edu/sites/default/files/2020-03/characterizing_rwd.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ahmed</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Dar</surname>
              <given-names>AR</given-names>
            </name>
            <name name-style="western">
              <surname>Helfert</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Khan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Data provenance in healthcare: approaches, challenges, and future directions</article-title>
          <source>Sensors (Basel)</source>
          <year>2023</year>
          <month>07</month>
          <day>18</day>
          <volume>23</volume>
          <issue>14</issue>
          <fpage>6495</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=s23146495"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/s23146495</pub-id>
          <pub-id pub-id-type="medline">37514788</pub-id>
          <pub-id pub-id-type="pii">s23146495</pub-id>
          <pub-id pub-id-type="pmcid">PMC10384601</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ram</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>A new perspective on semantics of data provenance</article-title>
          <source>Proceedings of the First International Conference on Semantic Web in Provenance Management</source>
          <year>2009</year>
          <conf-name>SWPM'09</conf-name>
          <conf-date>October 25, 2009</conf-date>
          <conf-loc>Washington, DC</conf-loc>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ceur-ws.org/Vol-526/InvitedPaper_1.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="web">
          <article-title>Provenance</article-title>
          <source>HL7 FHIR</source>
          <access-date>2025-11-30</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://hl7.org/fhir/provenance.html">https://hl7.org/fhir/provenance.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Groth</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Moreau</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>PROV-overview: an overview of the PROV family of documents</article-title>
          <source>W3C Working Group Note</source>
          <year>2013</year>
          <access-date>2025-11-30</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.w3.org/TR/2013/NOTE-prov-overview-20130430/">https://www.w3.org/TR/2013/NOTE-prov-overview-20130430/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cabalar</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Le</surname>
              <given-names>TH</given-names>
            </name>
            <name name-style="western">
              <surname>Silber</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>O'Hara</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Abdallah</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Parikh</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Busch</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>The role of blood testing in prevention, diagnosis, and management of chronic diseases: a review</article-title>
          <source>Am J Med Sci</source>
          <year>2024</year>
          <month>10</month>
          <volume>368</volume>
          <issue>4</issue>
          <fpage>274</fpage>
          <lpage>86</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0002-9629(24)01169-8"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.amjms.2024.04.009</pub-id>
          <pub-id pub-id-type="medline">38636653</pub-id>
          <pub-id pub-id-type="pii">S0002-9629(24)01169-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vesper</surname>
              <given-names>HW</given-names>
            </name>
            <name name-style="western">
              <surname>Myers</surname>
              <given-names>GL</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>WG</given-names>
            </name>
          </person-group>
          <article-title>Current practices and challenges in the standardization and harmonization of clinical laboratory tests</article-title>
          <source>Am J Clin Nutr</source>
          <year>2016</year>
          <month>09</month>
          <volume>104 Suppl 3</volume>
          <issue>Suppl 3</issue>
          <fpage>907S</fpage>
          <lpage>12S</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0002-9165(22)04947-4"/>
          </comment>
          <pub-id pub-id-type="doi">10.3945/ajcn.115.110387</pub-id>
          <pub-id pub-id-type="medline">27534625</pub-id>
          <pub-id pub-id-type="pii">S0002-9165(22)04947-4</pub-id>
          <pub-id pub-id-type="pmcid">PMC5004491</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Muñoz Monjas</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Rubio Ruiz</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Pérez Del Rey</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Palchuk</surname>
              <given-names>MB</given-names>
            </name>
          </person-group>
          <article-title>Enhancing real world data interoperability in healthcare: a methodological approach to laboratory unit harmonization</article-title>
          <source>Int J Med Inform</source>
          <year>2025</year>
          <month>01</month>
          <volume>193</volume>
          <fpage>105665</fpage>
          <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2024.105665</pub-id>
          <pub-id pub-id-type="medline">39500036</pub-id>
          <pub-id pub-id-type="pii">S1386-5056(24)00328-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hajia</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Secondary use of laboratory data: potentialities and limitations</article-title>
          <source>Iran J Pathol</source>
          <year>2019</year>
          <volume>14</volume>
          <issue>3</issue>
          <fpage>188</fpage>
          <lpage>92</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/31582994"/>
          </comment>
          <pub-id pub-id-type="doi">10.30699/ijp.2019.95692.1942</pub-id>
          <pub-id pub-id-type="medline">31582994</pub-id>
          <pub-id pub-id-type="pmcid">PMC6742739</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Khela</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Khalil</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Daxon</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Neilson</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Shahrokhi</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Chung</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Real world challenges in maintaining data integrity in electronic health records in a cancer program</article-title>
          <source>Tech Innov Patient Support Radiat Oncol</source>
          <year>2024</year>
          <month>03</month>
          <volume>29</volume>
          <fpage>100233</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2405-6324(23)00033-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.tipsro.2023.100233</pub-id>
          <pub-id pub-id-type="medline">38293266</pub-id>
          <pub-id pub-id-type="pii">S2405-6324(23)00033-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC10824972</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zayed</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Sarikakis</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Delvaux</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Automated standardization and harmonization of laboratory units in large-scale clinical data using open-source R functions</article-title>
          <source>Int J Med Inform</source>
          <year>2026</year>
          <month>01</month>
          <volume>205</volume>
          <fpage>106131</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1386-5056(25)00348-X"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2025.106131</pub-id>
          <pub-id pub-id-type="medline">41061385</pub-id>
          <pub-id pub-id-type="pii">S1386-5056(25)00348-X</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bietenbeck</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Boeker</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Schulz</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>NPU, LOINC, and SNOMED CT: a comparison of terminologies for laboratory results reveals individual advantages and a lack of possibilities to encode interpretive comments</article-title>
          <source>J Lab Med</source>
          <year>2018</year>
          <volume>42</volume>
          <issue>6</issue>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.degruyterbrill.com/document/doi/10.1515/labmed-2018-0103/html?lang=en&amp;srsltid=AfmBOopQEdfnlDAgyp1w00VOP5tVd-0pBWAnU1Hu5837cDY9cL6jLr9t"/>
          </comment>
          <pub-id pub-id-type="doi">10.1515/labmed-2018-0103</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schadow</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>McDonald</surname>
              <given-names>CJ</given-names>
            </name>
          </person-group>
          <article-title>The unified code for units of measure</article-title>
          <source>UCUM Organization</source>
          <year>2024</year>
          <access-date>2025-05-29</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ucum.org/ucum">https://ucum.org/ucum</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vogl</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Ingenerf</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kramer</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chantraine</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Drenkhahn</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>LUMA: a mapping assistant for standardizing the units of LOINC-coded laboratory tests</article-title>
          <source>Appl Sci</source>
          <year>2022</year>
          <month>06</month>
          <day>08</day>
          <volume>12</volume>
          <issue>12</issue>
          <fpage>5848</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/2076-3417/12/12/5848"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/app12125848</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="web">
          <article-title>Datatypes</article-title>
          <source>HL7 FHIR</source>
          <access-date>2025-05-29</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://hl7.org/fhir/datatypes.html#Quantity">https://hl7.org/fhir/datatypes.html#Quantity</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="web">
          <article-title>Representing units of measure (for use with numerical references and values)</article-title>
          <source>Assistant Secretary for Technology Policy</source>
          <access-date>2025-05-26</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.healthit.gov/isp/representing-units-measure-use-numerical-references-and-values">http://www.healthit.gov/isp/representing-units-measure-use-numerical-references-and-values</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="web">
          <article-title>PrecisionHealthIntelligence</article-title>
          <source>GitHub</source>
          <access-date>2026-03-02</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/PrecisionHealthIntelligence/loinc_unit_harmonization">https://github.com/PrecisionHealthIntelligence/loinc_unit_harmonization</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="web">
          <source>ConcerAI</source>
          <access-date>2026-03-02</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.concertai.com/contact-us/">https://www.concertai.com/contact-us/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
