<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id>
      <journal-title>JMIR Medical Informatics</journal-title>
      <issn pub-type="epub">2291-9694</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v14i1e83487</article-id>
      <article-id pub-id-type="pmid">41780922</article-id>
      <article-id pub-id-type="doi">10.2196/83487</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Scalable and Privacy-Conscious End-to-End Processing of Large-Scale Clinical Data for Precision Medicine: Empirical Evaluation Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Benis</surname>
            <given-names>Arriel</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Kalluchi</surname>
            <given-names>Achyuth</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>He</surname>
            <given-names>Yingnan</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author">
          <name name-style="western">
            <surname>Lee</surname>
            <given-names>Jungwoo</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0004-2983-4436</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Hwang</surname>
            <given-names>Sangwon</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8666-7479</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Lee</surname>
            <given-names>Kyu Hee</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <address>
            <institution>Department of Precision Medicine</institution>
            <institution>Yonsei University Wonju College of Medicine</institution>
            <addr-line>20 Ilsan-ro, Wonju-si, Gangwon-do</addr-line>
            <addr-line>Wonju, 26417</addr-line>
            <country>Republic of Korea</country>
            <phone>82 82 741 0466</phone>
            <email>powerpc@yonsei.ac.kr</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-7378-3697</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Artificial Intelligence Big Data Medical Center</institution>
        <institution>Yonsei University Wonju College of Medicine</institution>
        <addr-line>Wonju</addr-line>
        <country>Republic of Korea</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Department of Precision Medicine</institution>
        <institution>Yonsei University Wonju College of Medicine</institution>
        <addr-line>Wonju</addr-line>
        <country>Republic of Korea</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Kyu Hee Lee <email>powerpc@yonsei.ac.kr</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2026</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>4</day>
        <month>3</month>
        <year>2026</year>
      </pub-date>
      <volume>14</volume>
      <elocation-id>e83487</elocation-id>
      <history>
        <date date-type="received">
          <day>3</day>
          <month>9</month>
          <year>2025</year>
        </date>
        <date date-type="rev-request">
          <day>19</day>
          <month>1</month>
          <year>2026</year>
        </date>
        <date date-type="accepted">
          <day>5</day>
          <month>2</month>
          <year>2026</year>
        </date>
      </history>
      <copyright-statement>©Jungwoo Lee, Sangwon Hwang, Kyu Hee Lee. Originally published in JMIR Medical Informatics (https://medinform.jmir.org), 04.03.2026.</copyright-statement>
      <copyright-year>2026</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on https://medinform.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://medinform.jmir.org/2026/1/e83487" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>In large-scale clinical data analysis, CSV and traditional relational database management system–based approaches are widely used but impose substantial storage and processing constraints that delay research preparation and hinder multicenter collaboration. Although column-oriented storage formats such as Apache Parquet have gained attention in data science, systematic end-to-end evaluations in clinical environments remain limited, particularly regarding efficiency and scalability.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study aimed to empirically evaluate whether a Parquet-based end-to-end pipeline could improve computational efficiency and scalability in large-scale clinical data analysis while preserving predictive performance and protecting privacy.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>Electronic health record data comprising 13.76 million rows from a large academic medical center in Korea were analyzed using Parquet, CSV, PostgreSQL, and DuckDB environments. Standardized SQL workloads and multilabel classification models—implemented using graphics processing unit–accelerated Extreme Gradient Boosting and classifier chain (CC) ensembles to address class imbalance—were applied to evaluate storage efficiency, time to analysis, and predictive performance. Statistical equivalence testing with prespecified clinical margins and bootstrap resampling ensured rigorous comparison, while privacy risks were assessed through advanced membership inference attacks (MIA), including shadow MIA and likelihood ratio attacks.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Compared with CSV, Parquet demonstrated enhanced computational efficiency by lowering disk access from 940.2 to 44.2 seconds (95.3% reduction). End-to-end processing latency was substantially reduced across feature transformation (15.0 vs 9.3 s) and model training (8.1 vs 6.7 s). To address complex clinical correlations, we implemented CC and one-vs-rest architectures, which effectively captured interdependencies between disease labels. Classification performance remained statistically equivalent across area under the receiver operating characteristic curve, area under the precision-recall curve, accuracy, and <italic>F</italic><sub>1</sub>-score, with all differences falling within prespecified clinical equivalence margins (<italic>P</italic>&#60;.001). Notably, the CC ensemble demonstrated high technical rigor, minimizing Hamming loss (2.2×10<sup>–4</sup>) and ensuring robustness even in imbalanced cohorts. MIA performed at chance level (area under the curve=0.500), suggesting no measurable increase in privacy risk.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>By significantly mitigating data processing bottlenecks, a Parquet-based pipeline enabled high-throughput, large-scale clinical evidence generation without compromising model integrity or patient privacy. This framework provides a scalable and robust infrastructure for precision medicine, facilitating agile multicenter collaborations and real-world data analysis in resource-constrained clinical environments.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>electronic health records</kwd>
        <kwd>medical informatics</kwd>
        <kwd>predictive performance</kwd>
        <kwd>data privacy</kwd>
        <kwd>precision medicine</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Clinical data, including diagnostic reports, prescriptions, laboratory results, and imaging data, hold substantial potential for precision medicine, predictive modeling, and collaborative research. The volume of electronic health records (EHRs) generated in clinical practice has grown exponentially with the expansion of digital health systems [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref4">4</xref>]. However, as datasets expand, bottlenecks, such as storage overhead, transmission delays, and slow query execution, become increasingly common. These challenges cannot be resolved simply by expanding storage capacity; instead, they necessitate more efficient frameworks for data storage and processing.</p>
      <p>In medical informatics, data are most commonly stored in row-oriented formats, such as CSV files, spreadsheets, and relational databases. Although valued for their simplicity and interoperability, these approaches exhibit clear limitations in storage efficiency and analytic scalability. CSV files are uncompressed and large in size, restricting input and output throughput, while relational databases often underperform in column-level operations. In contrast, column-oriented formats offer high compression and selective input and output, making them well suited for high-volume and cloud-based environments. Among these, Apache Parquet is widely used as a standard solution owing to its scalability and interoperability [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref6">6</xref>]. However, few studies have systematically evaluated its end-to-end performance in clinical pipelines that incorporate deidentification procedures.</p>
      <p>A further challenge in clinical data use is balancing privacy protection with data utility. Deidentification is mandatory in multicenter research and machine learning, but it may affect statistical distributions or compromise predictive performance. Understanding how storage architectures interact with deidentification to influence analytic outcomes is therefore of both academic and practical importance [<xref ref-type="bibr" rid="ref7">7</xref>-<xref ref-type="bibr" rid="ref13">13</xref>].</p>
      <p>Unlike prior studies that focused solely on benchmarking computational efficiency, this work integrates privacy risk assessment and formal equivalence testing into a real-world end-to-end pipeline, thereby providing a clinically meaningful evaluation of Parquet as a foundation for precision medicine and collaborative research. Against this background, this study developed a scalable Parquet-based pipeline for high-volume clinical data and empirically assessed its storage efficiency, computational throughput, and preservation of predictive performance. This study also sought to establish a reliable infrastructure that enables cohort construction, secure data sharing, and clinical decision support in multicenter and precision medicine research [<xref ref-type="bibr" rid="ref14">14</xref>-<xref ref-type="bibr" rid="ref23">23</xref>].</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Ethical Considerations</title>
        <p>This retrospective observational study was conducted using real-world EHR data. The study protocol was approved by the institutional review board of Wonju Severance Christian Hospital (CR325065). The requirement for informed consent was waived by the institutional review board due to the retrospective nature of the study and the use of deidentified data. All data processing was performed within an independent honest broker system, and investigators had access only to deidentified data. No compensation was provided to the participants as there was no direct contact or intervention involved. The entire process complied with the Personal Information Protection Act of Korea, the Health Insurance Portability and Accountability Act Safe Harbor standard, and the General Data Protection Regulation [<xref ref-type="bibr" rid="ref24">24</xref>-<xref ref-type="bibr" rid="ref28">28</xref>].</p>
      </sec>
      <sec>
        <title>Integrated End-to-End Clinical Data Processing Workflow</title>
        <p>We developed an integrated pipeline connecting 5 core stages: raw EHR ingestion, privacy-preserving preprocessing (ISO 8601 and <italic>k</italic>-anonymity), scalable infrastructure using Apache Parquet, multilabel modeling via graphics processing unit (GPU)–accelerated Extreme Gradient Boosting (XGBoost), and rigorous statistical and privacy audits (<xref rid="figure1" ref-type="fig">Figure 1</xref>). To optimize analytic performance, we adopted a column-oriented storage format (Apache Parquet) over the traditional row-oriented structure (eg, CSV) [<xref ref-type="bibr" rid="ref6">6</xref>]. For comparative evaluation, the same dataset was also maintained in CSV format. While row-oriented structures excel in transactional tasks, columnar storage significantly reduces input and output overhead and enhances compression efficiency for complex analytic queries. This architectural choice is specifically tailored for the high dimensionality and sparse distribution of clinical datasets, ensuring both system scalability and robust privacy protection across the entire workflow.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Integrated workflow for scalable and privacy-preserving clinical data processing. AUROC: area under the receiver operating characteristic curve; AUPRC: area under the precision-recall curve; CC: classifier chains; EHR: electronic health record; GDPR: General Data Protection Regulation; GPU: graphics processing unit; HIPAA: Health Insurance Portability and Accountability Act; ICD-10: International Classification of Diseases, Tenth Revision; KCD: Korean Classification of Diseases, Eighth Revision; LiRA: Likelihood Ratio Attack; MIA: membership inference attack; OvR: one-vs-rest; PIPA: Personal Information Protection Act; TOST: two 1-sided tests; XGBoost: extreme gradient boosting.</p>
          </caption>
          <graphic xlink:href="medinform_v14i1e83487_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Data Preparation and Transformation</title>
        <p>The dataset included patient demographics, diagnostic codes based on the International Classification of Diseases, Tenth Revision (ICD-10) [<xref ref-type="bibr" rid="ref29">29</xref>-<xref ref-type="bibr" rid="ref35">35</xref>] and the Korean Classification of Diseases, Eighth Revision (KCD-8), visit type, and prescription records. In total, the dataset comprised approximately 13.76 million rows (43 columns, approximately 3.2 GB), as detailed in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. After replacing patient identifiers with randomly generated surrogate IDs, quasi-identifiers were generalized to satisfy <italic>k</italic>-anonymity (<italic>k</italic>=5). Data cleansing further ensured quality control by standardizing date fields into the ISO-compliant format (YYYY-MM-DD).</p>
      </sec>
      <sec>
        <title>Clinical Data Processing Pipeline</title>
        <p>Clinical data processing followed a stepwise pipeline designed to reflect clinical context. In preprocessing, we standardized date formats, removed records with missing sex, and normalized sex codes (eg, “men” to M and “women” to F). Duplicate entries were resolved by retaining only the most recent record for identical combinations of patient, date, and diagnosis code. Visits were segmented into episodes by department changes or temporal gaps, and each episode was assigned an episode identifier. Episode-level summaries included episode duration, event count, and primary diagnosis status. To capture temporal continuity, a 90-day rolling window was applied to compute diagnosis counts and code diversity per patient. Monthly aggregates were then derived, including patient counts, code diversity, and primary diagnosis counts, with patient-month statistics summarized using quantiles (eg, p50 and p90). The diagnostic records for the targeted conditions—including I10.9, E10-E14, and M48.06—were identified and extracted to construct the final summary tables, which were then stored in both CSV and Parquet formats for comparative analysis. The stepwise process is illustrated in <xref rid="figure2" ref-type="fig">Figure 2</xref>.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Stepwise scenario of the clinical data processing pipeline.</p>
          </caption>
          <graphic xlink:href="medinform_v14i1e83487_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Database Workload Benchmarking</title>
        <p>To evaluate the efficiency of storage formats, scenario-based workloads were executed in DuckDB (DuckDB Labs) [<xref ref-type="bibr" rid="ref36">36</xref>] and PostgreSQL (PostgreSQL Global Development Group) [<xref ref-type="bibr" rid="ref37">37</xref>] environments. Synthetic example data are provided in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>. Identical datasets were loaded into Parquet-based DuckDB and row-store PostgreSQL, and complex SQL queries—adapted from TPC-DS patterns [<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref39">39</xref>] (eg, window functions, multidimensional aggregation, and ROLLUP)—were applied to compare performance. Resource use was further examined by varying chunk sizes (10,000-50,000 records) with detailed results in <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>.</p>
      </sec>
      <sec>
        <title>Predictive Modeling and Multilabel Strategy</title>
        <p>Predictive modeling assessed the impact of storage formats on classification performance for hypertension (I10.9), spinal disorders (M48.06), and diabetes (E10-E14). Patient-level diagnostic histories were transformed into 2<sup>18</sup> dimensional sparse vectors (approximately 262,000 features) via FeatureHasher (scikit-learn; Python Software Foundation) [<xref ref-type="bibr" rid="ref40">40</xref>-<xref ref-type="bibr" rid="ref42">42</xref>]. The dataset was randomly partitioned into training (65%), validation (15%), and test (20%) subsets with a fixed seed of 42. Classification models were implemented using GPU-accelerated XGBoost with positive class weighting to address imbalance [<xref ref-type="bibr" rid="ref43">43</xref>-<xref ref-type="bibr" rid="ref45">45</xref>]. Hyperparameter details are provided in <xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>.</p>
        <p>For multilabel classification, we applied one-vs-rest (OvR) [<xref ref-type="bibr" rid="ref46">46</xref>] and classifier chains (CC) [<xref ref-type="bibr" rid="ref47">47</xref>]. To mitigate label-order dependence and evaluate interlabel dependencies, we constructed ensembles of 5 strategically ordered chains encompassing a prevalence gradient—from high-prevalence anchors (hypertension and diabetes) to the sparse target, spinal stenosis (M48.06, 0.50%; <xref ref-type="supplementary-material" rid="app5">Multimedia Appendix 5</xref>). Prioritizing M48.06, a domain-independent and sparse condition, served to demonstrate model robustness even without the clustering benefits of related disease families (eg, I-series codes). To ensure the rigorous prevention of label leakage and validate the integrity of the performance gains, all defining ICD-10 codes were strictly excluded from the feature space. This setup ensured that the model’s predictive capability relied solely on statistical associations across hundreds of thousands of nondiagnostic features. Model performance was evaluated using area under the receiver operating characteristic curve (AUROC), area under the precision-recall curve (AUPRC), accuracy, and <italic>F</italic><sub>1</sub>-score, calculated for each label as well as macroaverages and microaverages.</p>
      </sec>
      <sec>
        <title>Statistical Evaluation and Privacy Assessment</title>
        <p>Model performance was evaluated using AUROC, AUPRC, accuracy, and <italic>F</italic><sub>1</sub>-score. To assess model reliability, calibration was further evaluated using the Brier score and expected calibration error (ECE), with detailed results provided in <xref ref-type="supplementary-material" rid="app6">Multimedia Appendix 6</xref>. CSV and Parquet results were compared using paired runs with shared identifiers. Normality was assessed via the Shapiro-Wilk test, followed by paired 2-tailed <italic>t</italic> tests or Wilcoxon signed-rank tests with Bonferroni correction (<italic>P</italic>&#60;.05) [<xref ref-type="bibr" rid="ref48">48</xref>-<xref ref-type="bibr" rid="ref50">50</xref>].</p>
        <p>Equivalence was assessed via two 1-sided tests (TOST) [<xref ref-type="bibr" rid="ref51">51</xref>] and 95% bootstrap CIs. Equivalence margins (δ) were prespecified at 0.02 for AUROC or AUPRC and 0.01 for accuracy or <italic>F</italic><sub>1</sub>-score. These thresholds were selected to be narrower than the 0.05 margin commonly used in clinical equivalence trials [<xref ref-type="bibr" rid="ref52">52</xref>] and are more conservative than performance variances typically observed in the external validation of clinical artificial intelligence (AI) systems [<xref ref-type="bibr" rid="ref53">53</xref>]. Such strict margins were intended to constrain observed differences to ranges generally regarded as clinically negligible, particularly for high-performing models operating within an elevated accuracy range (0.98-1.00).</p>
        <p>To mitigate stochastic variation, a fixed random seed was applied across all experiments, ensuring that observed differences reflected data handling effects rather than algorithmic randomness. Privacy was further audited using membership inference attacks (MIA)—including confidence, entropy, loss-based (Yeom), shadow, and Likelihood Ratio Attack (LiRA) strategies—under patient-level stratified splits (train: 240,596; test: 240,597) to verify model robustness.</p>
      </sec>
      <sec>
        <title>Experimental Setup and Reproducibility</title>
        <p>All experiments were conducted on a Linux Ubuntu 22.04 server with a 24-core central processing unit (CPU), 128-GB memory, and an NVIDIA RTX 5090 GPU (CUDA 12.2, cuDNN 8.9, driver 550.54). Data processing used Python (version 3.10; Python Software Foundation) with Pandas 1.5.3, PyArrow 12.0.1, scikit-learn 1.3.2, and XGBoost 2.0.3 (GPU-hist). Multiprocessing was implemented using the standard Python multiprocessing module.</p>
        <p>As specified in the modeling strategy, XGBoost was configured with a learning rate of 0.08, maximum depth of 6, and 1000 estimators. To handle class imbalance, task-specific <italic>scale_pos_weight</italic> and an ensemble of 5 CCs were used. All random operations used a fixed seed of 42 for reproducibility. For robust performance evaluation, we conducted 20 independent experimental runs and used 5000-iteration bootstrap resampling to compute 95% CIs. Detailed hyperparameters and the statistical framework for equivalence testing are provided in <xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Storage and Pipeline Efficiency</title>
        <p>Conversion to Parquet substantially improved storage efficiency, reducing file size by nearly 6.9-fold relative to CSV. As summarized in <xref ref-type="table" rid="table1">Table 1</xref>, Parquet also consistently outperformed CSV across the end-to-end pipeline. File loading (input and output) time decreased by more than 95%, and both feature transformation (FeatureHasher) and model training (XGBoost) were faster under Parquet. Although peak CPU memory was about 1.3 GB higher, GPU memory consumption decreased by 326 MB, resulting in stable overall resource use. Resource consumption remained stable at 9 to 10 GB across chunk sizes, reflecting consistent scalability, with efficiency varying by chunk size. The values in <xref ref-type="table" rid="table1">Table 1</xref> represent peak use in end-to-end runs, with minor variations arising from measurement conditions, whereas CPU, memory, and disk input and output patterns remained consistent across chunk sizes (<xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>).</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>System performance comparison between CSV and Parquet formats.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="300"/>
            <col width="0"/>
            <col width="200"/>
            <col width="0"/>
            <col width="190"/>
            <col width="0"/>
            <col width="280"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Metric</td>
                <td colspan="2">CSV, mean (SD)</td>
                <td colspan="2">Parquet, mean (SD)</td>
                <td>Difference<sup>a</sup> (95% CI)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="8">
                  <bold>Time (s)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Input and output duration</td>
                <td colspan="2">940.2 (53.3)</td>
                <td colspan="2">44.2 (1.6)</td>
                <td colspan="2">−896.0 (−930.0 to −860.0)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Feature transformation</td>
                <td colspan="2">15.0 (0.9)</td>
                <td colspan="2">9.3 (0.7)</td>
                <td colspan="2">−5.7 (−7.0 to −4.5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Model training</td>
                <td colspan="2">8.1 (1.2)</td>
                <td colspan="2">6.7 (0.9)</td>
                <td colspan="2">−1.4 (−2.5 to −0.3)</td>
              </tr>
              <tr valign="top">
                <td colspan="8">
                  <bold>Resource use</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Memory maximum (GB)</td>
                <td colspan="2">21.2 (0.8)</td>
                <td colspan="2">22.5 (0.6)</td>
                <td colspan="2">1.3 (0.1 to 2.0)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>GPU<sup>b</sup> memory maximum (MB)</td>
                <td colspan="2">4873.0 (582.6)</td>
                <td colspan="2">4547.0 (596.9)</td>
                <td colspan="2">−326.0 (−450.0 to −200.0)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>Calculated as the Parquet mean minus CSV mean.</p>
            </fn>
            <fn id="table1fn2">
              <p><sup>b</sup>GPU: graphics processing unit.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Classification Performance and Calibration</title>
        <p>Single-label results are presented in <xref ref-type="table" rid="table2">Table 2</xref>. All 3 tasks achieved AUROC values above 0.920, with AUPRC ranging from 0.488 to 0.580. Hypertension (I10.9) yielded the highest <italic>F</italic><sub>1</sub>-score (0.599), followed by spinal disorders (M48.06, 0.536) and diabetes (E10-E14, 0.521). Macroaveraged performance reached an AUROC of 0.920, an AUPRC of 0.545, an accuracy of 0.934, and an <italic>F</italic><sub>1</sub>-score of 0.552. Calibration analyses [<xref ref-type="bibr" rid="ref54">54</xref>,<xref ref-type="bibr" rid="ref55">55</xref>], reported in <xref ref-type="supplementary-material" rid="app6">Multimedia Appendix 6</xref>, demonstrated excellent reliability for hypertension (Brier score 2.1×10<sup>–5</sup>; ECE 6.0×10<sup>–6</sup>), while spinal disorders (ECE=0.016) and diabetes (ECE=0.018) showed mild miscalibration but remained within recommended thresholds (ECE&#60;0.020).</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Per-label classification performance using extreme gradient boosting.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="200"/>
            <col width="200"/>
            <col width="200"/>
            <col width="200"/>
            <col width="200"/>
            <thead>
              <tr valign="top">
                <td>Labels</td>
                <td>AUROC<sup>a</sup></td>
                <td>AUPRC<sup>b</sup></td>
                <td>Accuracy</td>
                <td><italic>F</italic><sub>1</sub>-score</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Hypertension</td>
                <td>0.920</td>
                <td>0.580</td>
                <td>0.906</td>
                <td>0.599</td>
              </tr>
              <tr valign="top">
                <td>Spine disorder</td>
                <td>0.941</td>
                <td>0.488</td>
                <td>0.982</td>
                <td>0.536</td>
              </tr>
              <tr valign="top">
                <td>Diabetes<sup>c</sup></td>
                <td>0.899</td>
                <td>0.567</td>
                <td>0.915</td>
                <td>0.521</td>
              </tr>
              <tr valign="top">
                <td>Macroaverage</td>
                <td>0.920</td>
                <td>0.545</td>
                <td>0.934</td>
                <td>0.552</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>AUROC: area under the receiver operating characteristic curve.</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>AUPRC: area under the precision-recall curve.</p>
            </fn>
            <fn id="table2fn3">
              <p><sup>c</sup>Diabetes mellitus (International Classification of Diseases, Tenth Revision codes: E10-E14).</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p><xref ref-type="table" rid="table2">Table 2</xref> evaluates label-specific discrimination under substantial class imbalance, whereas <xref ref-type="table" rid="table3">Table 3</xref> summarizes overall multilabel prediction performance using microaveraged aggregation across all label–instance pairs. Specifically, <xref ref-type="table" rid="table2">Table 2</xref> focuses on the predictive performance of individual sparse labels, while <xref ref-type="table" rid="table3">Table 3</xref> reflects aggregated performance across all prediction events. Multilabel results in <xref ref-type="table" rid="table3">Table 3</xref> confirmed high-performance consistency for both OvR and CC, with AUROC &#62;0.999 and AUPRC &#62;0.998. Subset accuracy was identical (0.999), but CC showed slight improvements in Hamming loss and Jaccard index [<xref ref-type="bibr" rid="ref56">56</xref>], suggesting modest benefits from capturing label dependencies. A numerical gap was observed between per-label AUPRC (approximately 0.5; <xref ref-type="table" rid="table2">Table 2</xref>) and multilabel AUPRC (near 1.0; <xref ref-type="table" rid="table3">Table 3</xref>). This reflects the technical difference in aggregation: multilabel metrics were calculated using microaveraging to evaluate the overall model efficacy.</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Multilabel classification performance.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="200"/>
            <col width="0"/>
            <col width="120"/>
            <col width="0"/>
            <col width="120"/>
            <col width="0"/>
            <col width="170"/>
            <col width="0"/>
            <col width="190"/>
            <col width="0"/>
            <col width="170"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Models</td>
                <td colspan="2">AUROC<sup>a</sup></td>
                <td colspan="2">AUPRC<sup>b</sup></td>
                <td colspan="2">Hamming loss</td>
                <td colspan="2">Subset accuracy</td>
                <td>Jaccard index</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="12">
                  <bold>One-vs-rest</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Microaverage</td>
                <td colspan="2">0.999</td>
                <td colspan="2">0.998</td>
                <td colspan="2">2.4×10<sup>–4</sup></td>
                <td colspan="2">0.999</td>
                <td colspan="2">0.997</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Macroaverage</td>
                <td colspan="2">0.999</td>
                <td colspan="2">0.998</td>
                <td colspan="2">—<sup>c</sup></td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
              </tr>
              <tr valign="top">
                <td colspan="12">
                  <bold>Classifier chains</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Microaverage</td>
                <td colspan="2">0.999</td>
                <td colspan="2">0.998</td>
                <td colspan="2">2.2×10<sup>–4</sup></td>
                <td colspan="2">0.999</td>
                <td colspan="2">0.997</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Macroaverage</td>
                <td colspan="2">0.999</td>
                <td colspan="2">0.998</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>AUROC: area under the receiver operating characteristic curve.</p>
            </fn>
            <fn id="table3fn2">
              <p><sup>b</sup>AUPRC: area under the precision-recall curve.</p>
            </fn>
            <fn id="table3fn3">
              <p><sup>c</sup>Not applicable.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>Although discrimination remained high across all tasks, calibration analyses revealed modest overconfidence for diabetes and spinal disorder models. These deviations, while within accepted thresholds, emphasize the importance of calibration-aware adjustments when deploying predictive models in clinical workflows.</p>
      </sec>
      <sec>
        <title>Database Benchmarking</title>
        <p>As summarized in <xref ref-type="table" rid="table4">Table 4</xref>, DuckDB executed analytic workloads with an approximately 28-fold reduction in wall-clock time compared with PostgreSQL, which required 2546.4 seconds. DuckDB also exhibited higher CPU use (72.1% vs 39.6%), while memory consumption was comparable across systems.</p>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>Performance comparison of DuckDB and PostgreSQL in scenario-based SQL workloads.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="440"/>
            <col width="210"/>
            <col width="350"/>
            <thead>
              <tr valign="top">
                <td>Metrics</td>
                <td>DuckDB<sup>a</sup></td>
                <td>PostgreSQL<sup>b</sup></td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Wall-clock time (s)</td>
                <td>90.2</td>
                <td>2546.4</td>
              </tr>
              <tr valign="top">
                <td>CPU<sup>c</sup> use (%)</td>
                <td>72.1</td>
                <td>39.6</td>
              </tr>
              <tr valign="top">
                <td>Memory use (GB)</td>
                <td>13.7</td>
                <td>14.8</td>
              </tr>
              <tr valign="top">
                <td>Read throughput (MB/s)</td>
                <td>554.7</td>
                <td>365.2</td>
              </tr>
              <tr valign="top">
                <td>Write throughput (MB/s)</td>
                <td>1116.0</td>
                <td>998.0</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table4fn1">
              <p><sup>a</sup>DuckDB: column-oriented database optimized for analytical workloads.</p>
            </fn>
            <fn id="table4fn2">
              <p><sup>b</sup>PostgreSQL: row-oriented relational database primarily designed for transactional workloads, with support for analytical queries.</p>
            </fn>
            <fn id="table4fn3">
              <p><sup>c</sup>CPU: central processing unit.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Equivalence Analysis</title>
        <p>Paired experiments (20 runs per condition) were conducted using shared run identifiers, with median and IQR values provided in Table S1 in <xref ref-type="supplementary-material" rid="app7">Multimedia Appendix 7</xref>. Several metrics converged across all repetitions, producing zero IQR values and demonstrating high algorithmic stability. Overall, both formats achieved robust numerical consistency across all experimental iterations; for instance, mean AUROC was 1.000 for CSV and 0.984 for Parquet (Δ=−0.015). While other metrics (AUPRC, accuracy, and <italic>F</italic><sub>1</sub>-score) were slightly higher under the CSV format, paired <italic>t</italic> tests and Wilcoxon signed-rank tests confirmed statistical significance after Bonferroni correction (<italic>P</italic>&#60;.001; Table S2 in <xref ref-type="supplementary-material" rid="app7">Multimedia Appendix 7</xref>). However, these numerical variations remained minimal.</p>
        <p>Notably, all observed differences fell within the prespecified equivalence margins (δ=0.02 for AUROC and AUPRC and δ=0.01 for accuracy and <italic>F</italic><sub>1</sub>-score). TOST confirmed statistical equivalence (<italic>P</italic>&#60;.05) across all evaluated metrics, and bootstrap 95% CIs for AUROC Δ (−0.016 to −0.015) further reflected near-zero variability consistent with asymptotic performance stability (Table S3 in <xref ref-type="supplementary-material" rid="app7">Multimedia Appendix 7</xref>).</p>
      </sec>
      <sec>
        <title>Privacy Assessment</title>
        <p>The MIA evaluations, performed based on established methodologies [<xref ref-type="bibr" rid="ref57">57</xref>-<xref ref-type="bibr" rid="ref59">59</xref>] and summarized in <xref ref-type="table" rid="table5">Table 5</xref>, produced area under the curve (AUC) values of 0.501, 0.502, and 0.499 for confidence, entropy, and loss-based strategies, respectively. The maximum advantage did not exceed 0.007, and the gain over random guessing was ≤0.003. Attack performance was indistinguishable from random guessing, indicating no additional privacy risk. Additional shadow and LiRA [<xref ref-type="bibr" rid="ref60">60</xref>,<xref ref-type="bibr" rid="ref61">61</xref>] results are available in <xref ref-type="supplementary-material" rid="app8">Multimedia Appendix 8</xref>, corroborating these findings.</p>
        <table-wrap position="float" id="table5">
          <label>Table 5</label>
          <caption>
            <p>Membership inference attack results across different attack strategies.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="200"/>
            <col width="220"/>
            <col width="150"/>
            <col width="190"/>
            <col width="240"/>
            <thead>
              <tr valign="top">
                <td>Attack strategy</td>
                <td>Attack AUC<sup>a</sup> (95% CI)</td>
                <td>Advantage</td>
                <td>Best accuracy</td>
                <td>Gain vs baseline</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Confidence</td>
                <td>0.501 (0.501-0.503)</td>
                <td>0.006</td>
                <td>0.503</td>
                <td>0.003</td>
              </tr>
              <tr valign="top">
                <td>Entropy</td>
                <td>0.502 (0.502-0.503)</td>
                <td>0.007</td>
                <td>0.503</td>
                <td>0.003</td>
              </tr>
              <tr valign="top">
                <td>Loss (Yeom)</td>
                <td>0.499 (0.498-0.499)</td>
                <td>0.002</td>
                <td>0.500</td>
                <td>0.001</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table5fn1">
              <p><sup>a</sup>AUC: area under the curve.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>This study successfully implemented an integrated end-to-end pipeline (<xref rid="figure1" ref-type="fig">Figure 1</xref>) that ensures a seamless transition from raw EHR data ingestion to predictive modeling. By leveraging Apache Parquet, the framework effectively addressed storage and processing bottlenecks—specifically, input and output latency—inherent in traditional row-oriented workflows, substantially enhancing data throughput and accelerating the analytic preparatory phase while maintaining high predictive fidelity. Furthermore, our findings indicate that the minor performance discrepancies between formats are attributable to systematic data handling effects under a strictly controlled environment. Beyond these computational efficiencies, privacy evaluations demonstrated that the optimized workflow maintains rigorous data protection standards, providing a secure foundation for multicenter research operations without introducing additional vulnerabilities.</p>
        <p>Although paired statistical tests yielded highly significant <italic>P</italic> values (<italic>P</italic>&#60;.001), this result reflects the sensitivity of paired testing under large-scale data and repeated bootstrap evaluation rather than clinically meaningful divergence. From an equivalence perspective, all performance differences remained well within the prespecified margins, confirming that the Parquet-based pipeline achieves practical performance equivalence to the traditional CSV workflow.</p>
        <p>The substantial improvement in multilabel AUPRC compared with per-label performance highlights the system-level predictive advantage gained by explicitly modeling interlabel dependencies. While individual disease prediction remains challenging under substantial class imbalance, the multilabel formulation enables the model to capture clinically meaningful comorbidity structures, thereby reframing the observed performance gap as a reflection of holistic predictive efficacy rather than a metric artifact. This gap was also driven by the extreme class imbalance inherent in clinical datasets (eg, 0.50% prevalence for spinal disorders), where high AUROCs can coexist with lower <italic>F</italic><sub>1</sub>-scores. By integrating these dependencies within the CC architecture, the model leveraged frequent clinical co-occurrence patterns—such as hypertension and diabetes—to stabilize predictions for sparse conditions, including spinal stenosis. Importantly, the consistent performance observed despite the strict exclusion of all defining ICD-10 codes provided strong evidence against label leakage and underscored the model’s reliance on nondiagnostic clinical associations.</p>
      </sec>
      <sec>
        <title>Clinical Implications and Research Operations</title>
        <p>The clinical implications were considerable. By substantially shortening preparatory phases and enabling analyses to be completed within hours rather than days, Parquet-based pipelines allowed investigators to progress more rapidly from raw data to actionable evidence. Such improvements not only accelerated study initiation but also facilitated the integration of predictive models into research and clinical workflows. In multicenter settings, scalability supported the efficient integration of heterogeneous patient populations without excessive computational cost, thereby enhancing reproducibility and advancing precision medicine initiatives. These efficiencies were directly relevant to clinical workflows and regulatory-grade analyses. They enabled interim analyses and timely regulatory submissions, supporting more responsive and efficient research operations.</p>
      </sec>
      <sec>
        <title>Privacy and Security Safeguards</title>
        <p>Privacy evaluation reinforced the suitability of this approach. Deidentification procedures satisfied k-anonymity, and MIA yielded chance-level performance. The chance-level performance of multiple MIA methods confirmed that computational gains do not compromise patient confidentiality, a prerequisite for secure collaboration across institutions. Patient-level stratification and consistent pipeline design acted as effective safeguards. While residual risks remain inherent to secondary data use, our findings suggested that Parquet does not introduce additional vulnerabilities. For collaborative research networks—where privacy assurances are essential for sharing—these results provide practical reassurance.</p>
      </sec>
      <sec>
        <title>Interpretation of Predictive Performance and Label Dependencies</title>
        <p>Classification analyses revealed stable performance for common conditions such as hypertension, whereas imbalanced disorders such as diabetes and spinal disease yielded lower scores. This pattern highlights the need to account for dataset structure and interlabel dependencies when interpreting predictive outputs. The elevated AUROC values likely reflect the combination of high-prevalence conditions and extensive diagnostic feature sets. Consistent with the modeling strategy, defining codes were excluded from the feature space; however, correlated diagnostic features may still have influenced performance estimates.</p>
        <p>While performance convergence at elevated levels constrained the sensitivity to subtle comparative differences, it underscored the robustness and reproducibility of the pipeline, supporting its suitability for large-scale clinical research, where stability and reliability are critical. Predictive reliability was not compromised by storage structure, supporting Parquet as a dependable option for secondary use of EHR data in diverse research settings.</p>
      </sec>
      <sec>
        <title>Model Reliability and Calibration</title>
        <p>Calibration analyses further showed that hypertension models were well aligned with observed risks, whereas diabetes and spinal disorder tasks exhibited modest miscalibration. These results underscore that even high-performing classifiers may generate overconfident probability estimates, a limitation directly relevant to clinical decision support. Future studies should evaluate calibration-aware techniques, such as temperature scaling or isotonic regression, to improve the reliability of probability estimates (<xref ref-type="supplementary-material" rid="app6">Multimedia Appendix 6</xref>).</p>
        <p>Beyond technical validation, the findings demonstrated practical value for clinical research operations. Large-scale trials and observational studies often face delays in cohort assembly and iterative validation; Parquet-based pipelines shorten these steps, enabling more adaptive study designs. In multicenter collaborations, they promote secure and efficient data exchange, reducing delays that commonly impede cooperative studies.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>Several limitations should be acknowledged. First, the datasets analyzed were derived from specific institutional cohorts, which may constrain generalizability to other health care systems. Second, the elevated performance baseline of the predictive models limited the sensitivity to subtle differences between CSV and Parquet formats. Third, while MIA offered a widely accepted proxy for privacy risk, broader adversarial evaluations were not included. Fourth, the evaluation was primarily conducted in on-premise settings, so the scalability of findings in distributed or cloud-based environments remains to be established. Finally, despite the clear efficiency advantages of Parquet, its adoption may introduce a technical learning curve for clinical researchers who are less familiar with column-oriented storage formats or big-data frameworks. Transitioning from traditional row-oriented workflows to optimized columnar architectures requires initial investments in technical training and infrastructure adjustment. However, these upfront efforts are likely to be offset by the long-term gains in scalability and processing speed demonstrated in our results, ultimately supporting more efficient and reproducible clinical evidence generation.</p>
      </sec>
      <sec>
        <title>Future Work</title>
        <p>Future research should extend the evaluation of Parquet-based pipelines to distributed and cloud-based environments, focusing on both scalability and cost-effectiveness. In addition, validation across hybrid and federated architectures will be important to confirm applicability in multicenter collaborations where data cannot be centralized. Beyond structured EHR data, future studies should also investigate applications to unstructured modalities, such as clinical narratives, imaging metadata, and time-series signals. Such efforts would test the versatility of Parquet-based pipelines in supporting multimodal learning and integrative analyses. Privacy assessments should likewise be expanded to encompass attribute inference, linkage, and other adversarial scenarios, ideally within federated or privacy-preserving analytic frameworks. Moreover, interoperability across international coding standards should be validated using external multicenter datasets to ensure global applicability. Pursuing these directions will enhance the technical robustness of Parquet-based infrastructures while reinforcing their clinical relevance, ultimately enabling secure collaboration and more efficient integration of evidence into patient care.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>This study demonstrated that Parquet-based end-to-end processing effectively alleviated the storage and computational bottlenecks inherent in traditional row-oriented and relational database workflows while maintaining predictive fidelity and privacy safeguards. By improving computational efficiency and enabling the rapid preparation of analysis-ready cohorts, Parquet reduces the resources required for large-scale clinical data handling. These efficiencies translate into tangible research benefits, enabling earlier study initiation and more adaptive study designs across diverse clinical research settings.</p>
        <p>The integration of efficiency with privacy safeguards further ensures that accelerated workflows remain suitable for secure data sharing across institutions. In parallel, these capabilities support regulatory-grade analyses and health technology assessments, where timely and reproducible evidence is critical. For clinicians and researchers, the central implication is that Parquet-based pipelines reduce the manual effort and computational overhead required to transform raw EHR data into analysis-ready cohorts. This capability not only strengthens multicenter collaboration but also facilitates the timely translation of evidence into clinical decision support.</p>
        <p>Ultimately, by aligning computational efficiency with privacy-conscious infrastructure, Parquet-based pipelines reinforce the evidence base that informs clinical decision-making, positioning this approach as a robust foundation for sustainable precision medicine.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Column definitions for the structured clinical data table.</p>
        <media xlink:href="medinform_v14i1e83487_app1.xlsx" xlink:title="XLSX File  (Microsoft Excel File), 10 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>Synthetic example data used for scenario-based workload evaluation.</p>
        <media xlink:href="medinform_v14i1e83487_app2.xlsx" xlink:title="XLSX File  (Microsoft Excel File), 24 KB"/>
      </supplementary-material>
      <supplementary-material id="app3">
        <label>Multimedia Appendix 3</label>
        <p>Resource use profiles during Parquet-based data processing across different chunk sizes.</p>
        <media xlink:href="medinform_v14i1e83487_app3.docx" xlink:title="DOCX File , 252 KB"/>
      </supplementary-material>
      <supplementary-material id="app4">
        <label>Multimedia Appendix 4</label>
        <p>Hyperparameter configurations and the formal statistical framework for equivalence testing.</p>
        <media xlink:href="medinform_v14i1e83487_app4.docx" xlink:title="DOCX File , 16 KB"/>
      </supplementary-material>
      <supplementary-material id="app5">
        <label>Multimedia Appendix 5</label>
        <p>Detailed demographic characteristics and visit statistics of the study cohort.</p>
        <media xlink:href="medinform_v14i1e83487_app5.png" xlink:title="PNG File , 235 KB"/>
      </supplementary-material>
      <supplementary-material id="app6">
        <label>Multimedia Appendix 6</label>
        <p>Calibration metrics (Brier score and expected calibration error [ECE] and ECE) for each binary classification task.</p>
        <media xlink:href="medinform_v14i1e83487_app6.docx" xlink:title="DOCX File , 14 KB"/>
      </supplementary-material>
      <supplementary-material id="app7">
        <label>Multimedia Appendix 7</label>
        <p>Integrated statistical performance and equivalence analysis.</p>
        <media xlink:href="medinform_v14i1e83487_app7.docx" xlink:title="DOCX File , 18 KB"/>
      </supplementary-material>
      <supplementary-material id="app8">
        <label>Multimedia Appendix 8</label>
        <p>Membership inference results with shadow and Likelihood Ratio Attack attackers.</p>
        <media xlink:href="medinform_v14i1e83487_app8.docx" xlink:title="DOCX File , 15 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AI</term>
          <def>
            <p>artificial intelligence</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">AUC</term>
          <def>
            <p>area under the curve</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">AUPRC</term>
          <def>
            <p>area under the precision-recall curve</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">AUROC</term>
          <def>
            <p>area under the receiver operating characteristic curve</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">CC</term>
          <def>
            <p>classifier chains</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">CPU</term>
          <def>
            <p>central processing unit</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">ECE</term>
          <def>
            <p>expected calibration error</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">EHR</term>
          <def>
            <p>electronic health record</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">GPU</term>
          <def>
            <p>graphics processing unit</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">ICD-10</term>
          <def>
            <p>International Classification of Diseases, Tenth Revision</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">KCD-8</term>
          <def>
            <p>Korean Classification of Diseases, Eighth Revision</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb12">LiRA</term>
          <def>
            <p>Likelihood Ratio Attack</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb13">MIA</term>
          <def>
            <p>membership inference attack</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb14">OvR</term>
          <def>
            <p>one-vs-rest</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb15">TOST</term>
          <def>
            <p>two 1-sided tests</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb16">XGBoost</term>
          <def>
            <p>extreme gradient boosting</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This work was supported by the National Research Foundation of Korea (NRF) grant funded by the Korea government (grant RS-2025-24683718). This research was supported by the Ministry of Trade, Industry and Energy, Republic of Korea, under the project titled “Research and Development on AI Standardization in the Healthcare Industry Based on Human Big Data and Artificial Intelligence” (grant RS-2025-13882968), funded through the Korea Evaluation Institute of Industrial Technology. This research was supported by a grant from the medical data-driven hospital support project through the Korea Health Information Service, funded by the Ministry of Health and Welfare, Republic of Korea. This research was supported by the Regional Innovation System and Education program through the Gangwon Regional Innovation System and Education Center, funded by the Ministry of Education and the Gangwon State, Republic of Korea (grant 2025-RISE-10-006).</p>
    </ack>
    <notes>
      <sec>
        <title>Funding</title>
        <p>This study was funded by the following grants: (1) the National Research Foundation of Korea (NRF) grant funded by the Korea government (grant RS-2025-24683718); (2) a grant from the medical data-driven hospital support project through the Korea Health Information Service, funded by the Ministry of Health and Welfare, Republic of Korea; and (3) the Regional Innovation System and Education program through the Gangwon Regional Innovation System and Education Center, funded by the Ministry of Education and the Gangwon State, Republic of Korea (grant 2025-RISE-10-006). The funders had no involvement in the study design, data collection, analysis, interpretation, or the writing of the manuscript.</p>
      </sec>
    </notes>
    <notes>
      <sec>
        <title>Data Availability</title>
        <p>The datasets generated or analyzed during this study are available from the corresponding author on reasonable request.</p>
      </sec>
    </notes>
    <fn-group>
      <fn fn-type="con">
        <p>Conceptualization: KHL</p>
        <p>Data curation: JL</p>
        <p>Formal analysis: JL, KHL</p>
        <p>Methodology: SH</p>
        <p>Project administration: KHL</p>
        <p>Resources: JL</p>
        <p>Writing – original draft: JL, SH</p>
        <p>Writing – review and editing: KHL</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jensen</surname>
              <given-names>PB</given-names>
            </name>
            <name name-style="western">
              <surname>Jensen</surname>
              <given-names>LJ</given-names>
            </name>
            <name name-style="western">
              <surname>Brunak</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Mining electronic health records: towards better research applications and clinical care</article-title>
          <source>Nat Rev Genet</source>
          <year>2012</year>
          <month>05</month>
          <day>02</day>
          <volume>13</volume>
          <issue>6</issue>
          <fpage>395</fpage>
          <lpage>405</lpage>
          <pub-id pub-id-type="doi">10.1038/nrg3208</pub-id>
          <pub-id pub-id-type="medline">22549152</pub-id>
          <pub-id pub-id-type="pii">nrg3208</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Weiskopf</surname>
              <given-names>NG</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Methods and dimensions of electronic health record data quality assessment: enabling reuse for clinical research</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2013</year>
          <month>01</month>
          <day>01</day>
          <volume>20</volume>
          <issue>1</issue>
          <fpage>144</fpage>
          <lpage>51</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/22733976"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/amiajnl-2011-000681</pub-id>
          <pub-id pub-id-type="medline">22733976</pub-id>
          <pub-id pub-id-type="pii">amiajnl-2011-000681</pub-id>
          <pub-id pub-id-type="pmcid">PMC3555312</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hripcsak</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Albers</surname>
              <given-names>DJ</given-names>
            </name>
          </person-group>
          <article-title>Next-generation phenotyping of electronic health records</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2013</year>
          <month>01</month>
          <day>01</day>
          <volume>20</volume>
          <issue>1</issue>
          <fpage>117</fpage>
          <lpage>21</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/22955496"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/amiajnl-2012-001145</pub-id>
          <pub-id pub-id-type="medline">22955496</pub-id>
          <pub-id pub-id-type="pii">amiajnl-2012-001145</pub-id>
          <pub-id pub-id-type="pmcid">PMC3555337</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Birkhead</surname>
              <given-names>GS</given-names>
            </name>
            <name name-style="western">
              <surname>Klompas</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>NR</given-names>
            </name>
          </person-group>
          <article-title>Uses of electronic health records for public health surveillance to advance public health</article-title>
          <source>Annu Rev Public Health</source>
          <year>2015</year>
          <month>03</month>
          <day>18</day>
          <volume>36</volume>
          <fpage>345</fpage>
          <lpage>59</lpage>
          <pub-id pub-id-type="doi">10.1146/annurev-publhealth-031914-122747</pub-id>
          <pub-id pub-id-type="medline">25581157</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vohra</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Apache Parquet</article-title>
          <source>Practical Hadoop Ecosystem: A Definitive Guide to Hadoop-Related Frameworks and Tools</source>
          <year>2016</year>
          <publisher-loc>Berkeley, CA</publisher-loc>
          <publisher-name>Apress</publisher-name>
          <fpage>325</fpage>
          <lpage>35</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="web">
          <article-title>Apache parquet documentation</article-title>
          <source>Apache Software Foundation</source>
          <access-date>2025-06-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://parquet.apache.org/">https://parquet.apache.org/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Meystre</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Friedlin</surname>
              <given-names>FJ</given-names>
            </name>
            <name name-style="western">
              <surname>South</surname>
              <given-names>BR</given-names>
            </name>
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Samore</surname>
              <given-names>MH</given-names>
            </name>
          </person-group>
          <article-title>Automatic de-identification of textual documents in the electronic health record: a review of recent research</article-title>
          <source>BMC Med Res Methodol</source>
          <year>2010</year>
          <month>08</month>
          <day>02</day>
          <volume>10</volume>
          <issue>1</issue>
          <fpage>70</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedresmethodol.biomedcentral.com/articles/10.1186/1471-2288-10-70"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1471-2288-10-70</pub-id>
          <pub-id pub-id-type="medline">20678228</pub-id>
          <pub-id pub-id-type="pii">1471-2288-10-70</pub-id>
          <pub-id pub-id-type="pmcid">PMC2923159</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Negash</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Katz</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Neilson</surname>
              <given-names>CJ</given-names>
            </name>
            <name name-style="western">
              <surname>Moni</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Nesca</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Singer</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Enns</surname>
              <given-names>JE</given-names>
            </name>
          </person-group>
          <article-title>De-identification of free text data containing personal health information: a scoping review of reviews</article-title>
          <source>Int J Popul Data Sci</source>
          <year>2023</year>
          <month>12</month>
          <day>12</day>
          <volume>8</volume>
          <issue>1</issue>
          <fpage>2153</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/38414537"/>
          </comment>
          <pub-id pub-id-type="doi">10.23889/ijpds.v8i1.2153</pub-id>
          <pub-id pub-id-type="medline">38414537</pub-id>
          <pub-id pub-id-type="pii">8:1:29</pub-id>
          <pub-id pub-id-type="pmcid">PMC10898315</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kushida</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Nichols</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Jadrnicek</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Walsh</surname>
              <given-names>JK</given-names>
            </name>
            <name name-style="western">
              <surname>Griffin</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Strategies for de-identification and anonymization of electronic health record data for use in multicenter research studies</article-title>
          <source>Med Care</source>
          <year>2012</year>
          <month>07</month>
          <volume>50 Suppl</volume>
          <issue>Suppl</issue>
          <fpage>S82</fpage>
          <lpage>101</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/22692265"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/MLR.0b013e3182585355</pub-id>
          <pub-id pub-id-type="medline">22692265</pub-id>
          <pub-id pub-id-type="pii">00005650-201207001-00017</pub-id>
          <pub-id pub-id-type="pmcid">PMC6502465</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>El-Hayek</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Barzegar</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Faux</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Doyle</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Pillai</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Mutch</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Vaisey</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ward</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Sanci</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Dunn</surname>
              <given-names>AG</given-names>
            </name>
            <name name-style="western">
              <surname>Hellard</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Hocking</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Verspoor</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Boyle</surname>
              <given-names>DI</given-names>
            </name>
          </person-group>
          <article-title>An evaluation of existing text de-identification tools for use with patient progress notes from Australian general practice</article-title>
          <source>Int J Med Inform</source>
          <year>2023</year>
          <month>05</month>
          <volume>173</volume>
          <fpage>105021</fpage>
          <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2023.105021</pub-id>
          <pub-id pub-id-type="medline">36870249</pub-id>
          <pub-id pub-id-type="pii">S1386-5056(23)00038-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Gupta</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>CK</given-names>
            </name>
            <name name-style="western">
              <surname>Mishra</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Dai</surname>
              <given-names>HJ</given-names>
            </name>
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>ZS</given-names>
            </name>
            <name name-style="western">
              <surname>Jonnagaddala</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>OpenDeID pipeline for unstructured electronic health record text notes based on rules and transformers: deidentification algorithm development and validation study</article-title>
          <source>J Med Internet Res</source>
          <year>2023</year>
          <month>12</month>
          <day>06</day>
          <volume>25</volume>
          <fpage>e48145</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2023//e48145/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/48145</pub-id>
          <pub-id pub-id-type="medline">38055317</pub-id>
          <pub-id pub-id-type="pii">v25i1e48145</pub-id>
          <pub-id pub-id-type="pmcid">PMC10733816</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jabet</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bérot</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Chiarabini</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Dellière</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bosshard</surname>
              <given-names>PP</given-names>
            </name>
            <name name-style="western">
              <surname>Siguier</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Tubiana</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Favier</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Canestri</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Makhloufi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Nouchi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>de Risi-Pugliese</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Boquel</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Crémer</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Khoury</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Sidali</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Hamane</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Benderdouche</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Palous</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Chasset</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Gräser</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Hubka</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Fekkar</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hennequin</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Piarroux</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Normand</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>Monsel</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Trichophyton mentagrophytes ITS genotype VII infections among men who have sex with men in France: an ongoing phenomenon</article-title>
          <source>J Eur Acad Dermatol Venereol</source>
          <year>2025</year>
          <month>02</month>
          <volume>39</volume>
          <issue>2</issue>
          <fpage>407</fpage>
          <lpage>15</lpage>
          <pub-id pub-id-type="doi">10.1111/jdv.20439</pub-id>
          <pub-id pub-id-type="medline">39587983</pub-id>
          <pub-id pub-id-type="pmcid">PMC11760687</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Crane</surname>
              <given-names>HM</given-names>
            </name>
            <name name-style="western">
              <surname>Nance</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Ruderman</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Drumright</surname>
              <given-names>LN</given-names>
            </name>
            <name name-style="western">
              <surname>Mixson</surname>
              <given-names>LS</given-names>
            </name>
            <name name-style="western">
              <surname>Heckbert</surname>
              <given-names>SR</given-names>
            </name>
            <name name-style="western">
              <surname>Feinstein</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Budoff</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Bamford</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Cachay</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Napravnik</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Moore</surname>
              <given-names>RD</given-names>
            </name>
            <name name-style="western">
              <surname>Keruly</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Willig</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Burkholder</surname>
              <given-names>GA</given-names>
            </name>
            <name name-style="western">
              <surname>Hahn</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Fredericksen</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Saag</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Chander</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Kitahata</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Crothers</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Mayer</surname>
              <given-names>KH</given-names>
            </name>
            <name name-style="western">
              <surname>O'Cleirigh</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Cropsey</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Whitney</surname>
              <given-names>BM</given-names>
            </name>
            <name name-style="western">
              <surname>Delaney</surname>
              <given-names>JA</given-names>
            </name>
          </person-group>
          <article-title>Smoking and type 1 versus type 2 myocardial infarction among people with HIV in the United States: results from the center for AIDS research network integrated clinical systems cohort</article-title>
          <source>J Assoc Nurses AIDS Care</source>
          <year>2024</year>
          <month>09</month>
          <day>6</day>
          <volume>35</volume>
          <issue>6</issue>
          <fpage>507</fpage>
          <lpage>18</lpage>
          <pub-id pub-id-type="doi">10.1097/JNC.0000000000000492</pub-id>
          <pub-id pub-id-type="medline">39241219</pub-id>
          <pub-id pub-id-type="pii">00001782-202412000-00005</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Solomon</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dauber-Decker</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Richardson</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Levy</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Khan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Coleman</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Persaud</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Chelico</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>King</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Spyropoulos</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>McGinn</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Integrating clinical decision support into electronic health record systems using a novel platform (EvidencePoint): developmental study</article-title>
          <source>JMIR Form Res</source>
          <year>2023</year>
          <month>10</month>
          <day>19</day>
          <volume>7</volume>
          <fpage>e44065</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://formative.jmir.org/2023//e44065/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/44065</pub-id>
          <pub-id pub-id-type="medline">37856193</pub-id>
          <pub-id pub-id-type="pii">v7i1e44065</pub-id>
          <pub-id pub-id-type="pmcid">PMC10623239</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Trinkley</surname>
              <given-names>KE</given-names>
            </name>
            <name name-style="western">
              <surname>Kroehl</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Kahn</surname>
              <given-names>MG</given-names>
            </name>
            <name name-style="western">
              <surname>Allen</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Bennett</surname>
              <given-names>TD</given-names>
            </name>
            <name name-style="western">
              <surname>Hale</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Haugen</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Heckman</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kao</surname>
              <given-names>DP</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Matlock</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Malone</surname>
              <given-names>DC</given-names>
            </name>
            <name name-style="western">
              <surname>Page Nd</surname>
              <given-names>RL</given-names>
            </name>
            <name name-style="western">
              <surname>Stine</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Suresh</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Wells</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Applying clinical decision support design best practices with the practical robust implementation and sustainability model versus reliance on commercially available clinical decision support tools: randomized controlled trial</article-title>
          <source>JMIR Med Inform</source>
          <year>2021</year>
          <month>03</month>
          <day>22</day>
          <volume>9</volume>
          <issue>3</issue>
          <fpage>e24359</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2021/3/e24359/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/24359</pub-id>
          <pub-id pub-id-type="medline">33749610</pub-id>
          <pub-id pub-id-type="pii">v9i3e24359</pub-id>
          <pub-id pub-id-type="pmcid">PMC8077777</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yoo</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Rhee</surname>
              <given-names>PL</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>DK</given-names>
            </name>
            <name name-style="western">
              <surname>Kang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Choi</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Bates</surname>
              <given-names>DW</given-names>
            </name>
            <name name-style="western">
              <surname>Cha</surname>
              <given-names>WC</given-names>
            </name>
          </person-group>
          <article-title>Alert override patterns with a medication clinical decision support system in an academic emergency department: retrospective descriptive study</article-title>
          <source>JMIR Med Inform</source>
          <year>2020</year>
          <month>11</month>
          <day>04</day>
          <volume>8</volume>
          <issue>11</issue>
          <fpage>e23351</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2020/11/e23351/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/23351</pub-id>
          <pub-id pub-id-type="medline">33146626</pub-id>
          <pub-id pub-id-type="pii">v8i11e23351</pub-id>
          <pub-id pub-id-type="pmcid">PMC7673981</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jing</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Min</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Gong</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Biondich</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Robinson</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Law</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Nohr</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Faxvaag</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Rennert</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Hubig</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Gimbel</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Ontologies applied in clinical decision support system rules: systematic review</article-title>
          <source>JMIR Med Inform</source>
          <year>2023</year>
          <month>01</month>
          <day>19</day>
          <volume>11</volume>
          <fpage>e43053</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2023//e43053/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/43053</pub-id>
          <pub-id pub-id-type="medline">36534739</pub-id>
          <pub-id pub-id-type="pii">v11i1e43053</pub-id>
          <pub-id pub-id-type="pmcid">PMC9896360</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sommers</surname>
              <given-names>SW</given-names>
            </name>
            <name name-style="western">
              <surname>Tolle</surname>
              <given-names>HJ</given-names>
            </name>
            <name name-style="western">
              <surname>Trinkley</surname>
              <given-names>KE</given-names>
            </name>
            <name name-style="western">
              <surname>Johnston</surname>
              <given-names>CG</given-names>
            </name>
            <name name-style="western">
              <surname>Dietsche</surname>
              <given-names>CL</given-names>
            </name>
            <name name-style="western">
              <surname>Eldred</surname>
              <given-names>SV</given-names>
            </name>
            <name name-style="western">
              <surname>Wick</surname>
              <given-names>AT</given-names>
            </name>
            <name name-style="western">
              <surname>Hoppe</surname>
              <given-names>JA</given-names>
            </name>
          </person-group>
          <article-title>Clinical decision support to increase emergency department Naloxone Coprescribing: implementation report</article-title>
          <source>JMIR Med Inform</source>
          <year>2024</year>
          <month>11</month>
          <day>06</day>
          <volume>12</volume>
          <fpage>e58276</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2024//e58276/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/58276</pub-id>
          <pub-id pub-id-type="medline">39504560</pub-id>
          <pub-id pub-id-type="pii">v12i1e58276</pub-id>
          <pub-id pub-id-type="pmcid">PMC11560079</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Barton</surname>
              <given-names>HJ</given-names>
            </name>
            <name name-style="western">
              <surname>Maru</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Leaf</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Hekman</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Wiegmann</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>MN</given-names>
            </name>
            <name name-style="western">
              <surname>Patterson</surname>
              <given-names>BW</given-names>
            </name>
          </person-group>
          <article-title>Academic detailing as a health information technology implementation method: supporting the design and implementation of an emergency department-based clinical decision support tool to prevent future falls</article-title>
          <source>JMIR Hum Factors</source>
          <year>2024</year>
          <month>04</month>
          <day>18</day>
          <volume>11</volume>
          <fpage>e52592</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://humanfactors.jmir.org/2024//e52592/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/52592</pub-id>
          <pub-id pub-id-type="medline">38635318</pub-id>
          <pub-id pub-id-type="pii">v11i1e52592</pub-id>
          <pub-id pub-id-type="pmcid">PMC11066751</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dong</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Jin</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Ye</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Ji</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Machine learning models with prognostic implications for predicting gastrointestinal bleeding after coronary artery bypass grafting and guiding personalized medicine: multicenter cohort study</article-title>
          <source>J Med Internet Res</source>
          <year>2025</year>
          <month>03</month>
          <day>06</day>
          <volume>27</volume>
          <fpage>e68509</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2025//e68509/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/68509</pub-id>
          <pub-id pub-id-type="medline">40053791</pub-id>
          <pub-id pub-id-type="pii">v27i1e68509</pub-id>
          <pub-id pub-id-type="pmcid">PMC11926454</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jung</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Mamandipoor</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Fjølner</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bruno</surname>
              <given-names>RR</given-names>
            </name>
            <name name-style="western">
              <surname>Wernly</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Artigas</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bollen Pinto</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Schefold</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Wolff</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Kelm</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Beil</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Sviri</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>van Heerden</surname>
              <given-names>PV</given-names>
            </name>
            <name name-style="western">
              <surname>Szczeklik</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Czuczwar</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Elhadi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Joannidis</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Oeyen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zafeiridis</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Marsh</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Andersen</surname>
              <given-names>FH</given-names>
            </name>
            <name name-style="western">
              <surname>Moreno</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Cecconi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Leaver</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>De Lange</surname>
              <given-names>DW</given-names>
            </name>
            <name name-style="western">
              <surname>Guidet</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Flaatten</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Osmani</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Disease-course adapting machine learning prognostication models in elderly patients critically ill with COVID-19: multicenter cohort study with external validation</article-title>
          <source>JMIR Med Inform</source>
          <year>2022</year>
          <month>03</month>
          <day>31</day>
          <volume>10</volume>
          <issue>3</issue>
          <fpage>e32949</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2022/3/e32949/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/32949</pub-id>
          <pub-id pub-id-type="medline">35099394</pub-id>
          <pub-id pub-id-type="pii">v10i3e32949</pub-id>
          <pub-id pub-id-type="pmcid">PMC9015783</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Alvarez-Romero</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Martinez-Garcia</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ternero Vega</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Díaz-Jimènez</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Jimènez-Juan</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Nieto-Martín</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Román Villarán</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Kovacevic</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Bokan</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Hromis</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Djekic Malbasa</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Beslać</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zaric</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Gencturk</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Sinaci</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Ollero Baturone</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Parra Calderón</surname>
              <given-names>CL</given-names>
            </name>
          </person-group>
          <article-title>Predicting 30-day readmission risk for patients with chronic obstructive pulmonary disease through a federated machine learning architecture on Findable, Accessible, Interoperable, and Reusable (FAIR) data: development and validation study</article-title>
          <source>JMIR Med Inform</source>
          <year>2022</year>
          <month>06</month>
          <day>02</day>
          <volume>10</volume>
          <issue>6</issue>
          <fpage>e35307</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2022/6/e35307/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/35307</pub-id>
          <pub-id pub-id-type="medline">35653170</pub-id>
          <pub-id pub-id-type="pii">v10i6e35307</pub-id>
          <pub-id pub-id-type="pmcid">PMC9204581</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Blasi</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Bordonaro</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Serretta</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Piazza</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Firenze</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gebbia</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Virtual clinical and precision medicine tumor boards-cloud-based platform-mediated implementation of multidisciplinary reviews among oncology centers in the COVID-19 era: protocol for an observational study</article-title>
          <source>JMIR Res Protoc</source>
          <year>2021</year>
          <month>09</month>
          <day>10</day>
          <volume>10</volume>
          <issue>9</issue>
          <fpage>e26220</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.researchprotocols.org/2021/9/e26220/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/26220</pub-id>
          <pub-id pub-id-type="medline">34387553</pub-id>
          <pub-id pub-id-type="pii">v10i9e26220</pub-id>
          <pub-id pub-id-type="pmcid">PMC8437400</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ahmed</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Shahzad</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Naseem</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ali</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ahmad</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Evaluating the effectiveness of data governance frameworks in ensuring security and privacy of healthcare data: a quantitative analysis of ISO standards, GDPR, and HIPAA in blockchain technology</article-title>
          <source>PLoS One</source>
          <year>2025</year>
          <month>5</month>
          <day>23</day>
          <volume>20</volume>
          <issue>5</issue>
          <fpage>e0324285</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0324285"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0324285</pub-id>
          <pub-id pub-id-type="medline">40408373</pub-id>
          <pub-id pub-id-type="pii">PONE-D-24-54554</pub-id>
          <pub-id pub-id-type="pmcid">PMC12101661</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bradford</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Aboy</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Liddell</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>International transfers of health data between the EU and USA: a sector-specific approach for the USA to ensure an 'adequate' level of protection</article-title>
          <source>J Law Biosci</source>
          <year>2020</year>
          <volume>7</volume>
          <issue>1</issue>
          <fpage>lsaa055</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34221424"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jlb/lsaa055</pub-id>
          <pub-id pub-id-type="medline">34221424</pub-id>
          <pub-id pub-id-type="pii">lsaa055</pub-id>
          <pub-id pub-id-type="pmcid">PMC8249089</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gomase</surname>
              <given-names>VS</given-names>
            </name>
            <name name-style="western">
              <surname>Ghatule</surname>
              <given-names>AP</given-names>
            </name>
            <name name-style="western">
              <surname>Sharma</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Sardana</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Cybersecurity and compliance in clinical trials: the role of artificial intelligence in secure healthcare management</article-title>
          <source>Rev Recent Clin Trials</source>
          <year>2025</year>
          <month>04</month>
          <day>25</day>
          <volume>20</volume>
          <issue>4</issue>
          <fpage>332</fpage>
          <lpage>51</lpage>
          <pub-id pub-id-type="doi">10.2174/0115748871366467250413070850</pub-id>
          <pub-id pub-id-type="medline">40277117</pub-id>
          <pub-id pub-id-type="pii">RRCT-EPUB-147950</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Scheibner</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Raisaro</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Troncoso-Pastoriza</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Ienca</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Fellay</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Vayena</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Hubaux</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Revolutionizing medical data sharing using advanced privacy-enhancing technologies: technical, legal, and ethical synthesis</article-title>
          <source>J Med Internet Res</source>
          <year>2021</year>
          <month>02</month>
          <day>25</day>
          <volume>23</volume>
          <issue>2</issue>
          <fpage>e25120</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2021/2/e25120/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/25120</pub-id>
          <pub-id pub-id-type="medline">33629963</pub-id>
          <pub-id pub-id-type="pii">v23i2e25120</pub-id>
          <pub-id pub-id-type="pmcid">PMC7952236</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Broen</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Trangucci</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Zelner</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Measuring the impact of spatial perturbations on the relationship between data privacy and validity of descriptive statistics</article-title>
          <source>Int J Health Geogr</source>
          <year>2021</year>
          <month>01</month>
          <day>07</day>
          <volume>20</volume>
          <issue>1</issue>
          <fpage>3</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ij-healthgeographics.biomedcentral.com/articles/10.1186/s12942-020-00256-8"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12942-020-00256-8</pub-id>
          <pub-id pub-id-type="medline">33413390</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12942-020-00256-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC7788553</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>PF</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Liao</surname>
              <given-names>WC</given-names>
            </name>
            <name name-style="western">
              <surname>Kuo</surname>
              <given-names>LC</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>KC</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>YC</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Chiu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>SS</given-names>
            </name>
            <name name-style="western">
              <surname>Lai</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Automatic ICD-10 coding and training system: deep neural network based on supervised learning</article-title>
          <source>JMIR Med Inform</source>
          <year>2021</year>
          <month>08</month>
          <day>31</day>
          <volume>9</volume>
          <issue>8</issue>
          <fpage>e23230</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2021/8/e23230/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/23230</pub-id>
          <pub-id pub-id-type="medline">34463639</pub-id>
          <pub-id pub-id-type="pii">v9i8e23230</pub-id>
          <pub-id pub-id-type="pmcid">PMC8441604</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>PF</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>KC</given-names>
            </name>
            <name name-style="western">
              <surname>Liao</surname>
              <given-names>WC</given-names>
            </name>
            <name name-style="western">
              <surname>Lai</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>TL</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>SC</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Tsai</surname>
              <given-names>IA</given-names>
            </name>
            <name name-style="western">
              <surname>Chiu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hung</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Automatic international classification of diseases coding system: deep contextualized language model with rule-based approaches</article-title>
          <source>JMIR Med Inform</source>
          <year>2022</year>
          <month>06</month>
          <day>29</day>
          <volume>10</volume>
          <issue>6</issue>
          <fpage>e37557</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2022/6/e37557/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/37557</pub-id>
          <pub-id pub-id-type="medline">35767353</pub-id>
          <pub-id pub-id-type="pii">v10i6e37557</pub-id>
          <pub-id pub-id-type="pmcid">PMC9282222</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>PF</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>TL</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>SC</given-names>
            </name>
            <name name-style="western">
              <surname>Chu</surname>
              <given-names>YC</given-names>
            </name>
            <name name-style="western">
              <surname>Kuo</surname>
              <given-names>CT</given-names>
            </name>
            <name name-style="western">
              <surname>Lai</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>WA</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kuo</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Hung</surname>
              <given-names>FX</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Tsai</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Chiu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Training a deep contextualized language model for international classification of diseases, 10th revision classification via federated learning: model development and validation study</article-title>
          <source>JMIR Med Inform</source>
          <year>2022</year>
          <month>11</month>
          <day>10</day>
          <volume>10</volume>
          <issue>11</issue>
          <fpage>e41342</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2022/11/e41342/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/41342</pub-id>
          <pub-id pub-id-type="medline">36355417</pub-id>
          <pub-id pub-id-type="pii">v10i11e41342</pub-id>
          <pub-id pub-id-type="pmcid">PMC9693720</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Gifford</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Meng</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Campbell</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Varley</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Carroll</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Bastarache</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Denny</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Theodoratou</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Mapping ICD-10 and ICD-10-CM codes to phecodes: workflow development and initial evaluation</article-title>
          <source>JMIR Med Inform</source>
          <year>2019</year>
          <month>11</month>
          <day>29</day>
          <volume>7</volume>
          <issue>4</issue>
          <fpage>e14325</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2019/4/e14325/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/14325</pub-id>
          <pub-id pub-id-type="medline">31553307</pub-id>
          <pub-id pub-id-type="pii">v7i4e14325</pub-id>
          <pub-id pub-id-type="pmcid">PMC6911227</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Falissard</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Morgand</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Ghosn</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Imbaud</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Bounebache</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Rey</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Neural translation and automated recognition of ICD-10 medical entities from natural language: model development and performance assessment</article-title>
          <source>JMIR Med Inform</source>
          <year>2022</year>
          <month>04</month>
          <day>11</day>
          <volume>10</volume>
          <issue>4</issue>
          <fpage>e26353</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2022/4/e26353/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/26353</pub-id>
          <pub-id pub-id-type="medline">35404262</pub-id>
          <pub-id pub-id-type="pii">v10i4e26353</pub-id>
          <pub-id pub-id-type="pmcid">PMC9039820</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ghasemi</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Unsupervised feature selection to identify important ICD-10 and ATC codes for machine learning on a cohort of patients with coronary heart disease: retrospective study</article-title>
          <source>JMIR Med Inform</source>
          <year>2024</year>
          <month>07</month>
          <day>26</day>
          <volume>12</volume>
          <fpage>e52896</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2024//e52896/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/52896</pub-id>
          <pub-id pub-id-type="medline">39087585</pub-id>
          <pub-id pub-id-type="pii">v12i1e52896</pub-id>
          <pub-id pub-id-type="pmcid">PMC11295113</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dai</surname>
              <given-names>HJ</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>CK</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>CC</given-names>
            </name>
            <name name-style="western">
              <surname>Liou</surname>
              <given-names>CS</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>AT</given-names>
            </name>
            <name name-style="western">
              <surname>Lai</surname>
              <given-names>CH</given-names>
            </name>
            <name name-style="western">
              <surname>Shain</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Ke</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>WY</given-names>
            </name>
            <name name-style="western">
              <surname>Mir</surname>
              <given-names>TH</given-names>
            </name>
            <name name-style="western">
              <surname>Simanjuntak</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kao</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Tsai</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Tseng</surname>
              <given-names>VS</given-names>
            </name>
          </person-group>
          <article-title>Evaluating a natural language processing-driven, AI-assisted international classification of diseases, 10th revision, clinical modification, coding system for diagnosis related groups in a real hospital environment: algorithm development and validation study</article-title>
          <source>J Med Internet Res</source>
          <year>2024</year>
          <month>09</month>
          <day>20</day>
          <volume>26</volume>
          <fpage>e58278</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2024//e58278/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/58278</pub-id>
          <pub-id pub-id-type="medline">39302714</pub-id>
          <pub-id pub-id-type="pii">v26i1e58278</pub-id>
          <pub-id pub-id-type="pmcid">PMC11452756</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="web">
          <article-title>DuckDB documentation</article-title>
          <source>DuckDB Foundation</source>
          <access-date>2025-05-25</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://duckdb.org/">https://duckdb.org/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="web">
          <article-title>PostgreSQL documentation</article-title>
          <source>PostgreSQL Global Development Group</source>
          <access-date>2025-06-10</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.postgresql.org/docs/">https://www.postgresql.org/docs/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tardío</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Maté</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Trujillo</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Beyond TPC-DS, a benchmark for Big Data OLAP systems (BDOLAP-Bench)</article-title>
          <source>Futur Gener Comp Syst</source>
          <year>2022</year>
          <month>07</month>
          <volume>132</volume>
          <fpage>136</fpage>
          <lpage>51</lpage>
          <pub-id pub-id-type="doi">10.1016/j.future.2022.02.015</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ding</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Chaudhuri</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Gehrke</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Narasayya</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>DSB: a decision support benchmark for workload-driven and traditional database systems</article-title>
          <source>Proc VLDB Endow</source>
          <year>2021</year>
          <month>10</month>
          <day>28</day>
          <volume>14</volume>
          <issue>13</issue>
          <fpage>3376</fpage>
          <lpage>88</lpage>
          <pub-id pub-id-type="doi">10.14778/3484224.3484234</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pedragosa</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Riera</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Casella</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Esteve-Codina</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Steuerman</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Seth</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Bocharov</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Heath</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Gat-Viks</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Argilaguet</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Meyerhans</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Linking cell dynamics with gene coexpression networks to characterize key events in chronic virus infections</article-title>
          <source>Front Immunol</source>
          <year>2019</year>
          <month>5</month>
          <day>3</day>
          <volume>10</volume>
          <fpage>1002</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/31130969"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fimmu.2019.01002</pub-id>
          <pub-id pub-id-type="medline">31130969</pub-id>
          <pub-id pub-id-type="pmcid">PMC6509617</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Shi</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Efficacy of web-based self-management interventions for depressive symptoms: a meta-analysis of randomized controlled trials</article-title>
          <source>BMC Psychiatry</source>
          <year>2021</year>
          <month>08</month>
          <day>11</day>
          <volume>21</volume>
          <issue>1</issue>
          <fpage>398</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcpsychiatry.biomedcentral.com/articles/10.1186/s12888-021-03396-8"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12888-021-03396-8</pub-id>
          <pub-id pub-id-type="medline">34380440</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12888-021-03396-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC8359554</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bugiardini</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Cenko</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Sex differences in myocardial infarction deaths</article-title>
          <source>Lancet</source>
          <year>2020</year>
          <month>07</month>
          <day>11</day>
          <volume>396</volume>
          <issue>10244</issue>
          <fpage>72</fpage>
          <lpage>3</lpage>
          <pub-id pub-id-type="doi">10.1016/S0140-6736(20)31049-7</pub-id>
          <pub-id pub-id-type="medline">32445694</pub-id>
          <pub-id pub-id-type="pii">S0140-6736(20)31049-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kaul</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Gross</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Corbett</surname>
              <given-names>FS</given-names>
            </name>
            <name name-style="western">
              <surname>Malik</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Tofani</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Infantolino</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Clinical utility of wide-area transepithelial sampling with three-dimensional computer-assisted analysis (WATS3D) in identifying Barrett's esophagus and associated neoplasia</article-title>
          <source>Dis Esophagus</source>
          <year>2020</year>
          <month>12</month>
          <day>07</day>
          <volume>33</volume>
          <issue>12</issue>
          <fpage>32607543</fpage>
          <pub-id pub-id-type="doi">10.1093/dote/doaa069</pub-id>
          <pub-id pub-id-type="medline">32607543</pub-id>
          <pub-id pub-id-type="pii">5865411</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rajkomar</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Oren</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Dai</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Hajaj</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Hardt</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Marcus</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Sundberg</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Yee</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Flores</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Duggan</surname>
              <given-names>GE</given-names>
            </name>
            <name name-style="western">
              <surname>Irvine</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Le</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Litsch</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Mossin</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Tansuwan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Wexler</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wilson</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ludwig</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Volchenboum</surname>
              <given-names>SL</given-names>
            </name>
            <name name-style="western">
              <surname>Chou</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Pearson</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Madabushi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>NH</given-names>
            </name>
            <name name-style="western">
              <surname>Butte</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Howell</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Cui</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Corrado</surname>
              <given-names>GS</given-names>
            </name>
            <name name-style="western">
              <surname>Dean</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Scalable and accurate deep learning with electronic health records</article-title>
          <source>NPJ Digit Med</source>
          <year>2018</year>
          <month>5</month>
          <day>8</day>
          <volume>1</volume>
          <issue>1</issue>
          <fpage>18</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41746-018-0029-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41746-018-0029-1</pub-id>
          <pub-id pub-id-type="medline">31304302</pub-id>
          <pub-id pub-id-type="pii">29</pub-id>
          <pub-id pub-id-type="pmcid">PMC6550175</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Roy</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Stewart</surname>
              <given-names>WF</given-names>
            </name>
          </person-group>
          <article-title>Prediction modeling using EHR data: challenges, strategies, and a comparison of machine learning approaches</article-title>
          <source>Med Care</source>
          <year>2010</year>
          <month>06</month>
          <volume>48</volume>
          <issue>6 Suppl</issue>
          <fpage>S106</fpage>
          <lpage>13</lpage>
          <pub-id pub-id-type="doi">10.1097/MLR.0b013e3181de9e17</pub-id>
          <pub-id pub-id-type="medline">20473190</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rifkin</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Klautau</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>In defense of one-vs-all classification</article-title>
          <source>J Mach Learn Res</source>
          <year>2004</year>
          <volume>5</volume>
          <fpage>41</fpage>
          <pub-id pub-id-type="doi">10.5555/1005332.1005336</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Read</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Pfahringer</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Holmes</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Frank</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Classifier chains for multi-label classification</article-title>
          <source>Mach Learn</source>
          <year>2011</year>
          <month>6</month>
          <day>30</day>
          <volume>85</volume>
          <issue>3</issue>
          <fpage>333</fpage>
          <lpage>59</lpage>
          <pub-id pub-id-type="doi">10.1007/S10994-011-5256-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dunn</surname>
              <given-names>OJ</given-names>
            </name>
          </person-group>
          <article-title>Multiple comparisons among Means</article-title>
          <source>J Am Stat Assoc</source>
          <year>1961</year>
          <month>03</month>
          <volume>56</volume>
          <issue>293</issue>
          <fpage>52</fpage>
          <lpage>64</lpage>
          <pub-id pub-id-type="doi">10.1080/01621459.1961.10482090</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bland</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Altman</surname>
              <given-names>DG</given-names>
            </name>
          </person-group>
          <article-title>Multiple significance tests: the Bonferroni method</article-title>
          <source>BMJ</source>
          <year>1995</year>
          <month>01</month>
          <day>21</day>
          <volume>310</volume>
          <issue>6973</issue>
          <fpage>170</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/7833759"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmj.310.6973.170</pub-id>
          <pub-id pub-id-type="medline">7833759</pub-id>
          <pub-id pub-id-type="pmcid">PMC2548561</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Choi</surname>
              <given-names>JE</given-names>
            </name>
            <name name-style="western">
              <surname>Kang</surname>
              <given-names>HW</given-names>
            </name>
            <name name-style="western">
              <surname>Hong</surname>
              <given-names>YM</given-names>
            </name>
            <name name-style="western">
              <surname>Sohn</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>C-reactive protein and N-terminal pro-brain natriuretic peptide discrepancy: a differentiation of adenoviral pharyngoconjunctival fever from Kawasaki disease</article-title>
          <source>Korean J Pediatr</source>
          <year>2018</year>
          <month>01</month>
          <volume>61</volume>
          <issue>1</issue>
          <fpage>12</fpage>
          <lpage>6</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/29441107"/>
          </comment>
          <pub-id pub-id-type="doi">10.3345/kjp.2018.61.1.12</pub-id>
          <pub-id pub-id-type="medline">29441107</pub-id>
          <pub-id pub-id-type="pmcid">PMC5807985</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schuirmann</surname>
              <given-names>DJ</given-names>
            </name>
          </person-group>
          <article-title>A comparison of the two one-sided tests procedure and the power approach for assessing the equivalence of average bioavailability</article-title>
          <source>J Pharmacokinet Biopharm</source>
          <year>1987</year>
          <month>12</month>
          <day>1</day>
          <volume>15</volume>
          <issue>6</issue>
          <fpage>657</fpage>
          <lpage>80</lpage>
          <pub-id pub-id-type="doi">10.1007/BF01068419</pub-id>
          <pub-id pub-id-type="medline">3450848</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Walker</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Nowacki</surname>
              <given-names>AS</given-names>
            </name>
          </person-group>
          <article-title>Understanding equivalence and noninferiority testing</article-title>
          <source>J Gen Intern Med</source>
          <year>2011</year>
          <month>02</month>
          <day>21</day>
          <volume>26</volume>
          <issue>2</issue>
          <fpage>192</fpage>
          <lpage>6</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/20857339"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s11606-010-1513-8</pub-id>
          <pub-id pub-id-type="medline">20857339</pub-id>
          <pub-id pub-id-type="pmcid">PMC3019319</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rockenschaub</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Akay</surname>
              <given-names>EM</given-names>
            </name>
            <name name-style="western">
              <surname>Carlisle</surname>
              <given-names>BG</given-names>
            </name>
            <name name-style="western">
              <surname>Hilbert</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Wendland</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Meyer-Eschenbach</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Näher</surname>
              <given-names>AF</given-names>
            </name>
            <name name-style="western">
              <surname>Frey</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Madai</surname>
              <given-names>VI</given-names>
            </name>
          </person-group>
          <article-title>External validation of AI-based scoring systems in the ICU: a systematic review and meta-analysis</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2025</year>
          <month>01</month>
          <day>06</day>
          <volume>25</volume>
          <issue>1</issue>
          <fpage>5</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/s12911-024-02830-7"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12911-024-02830-7</pub-id>
          <pub-id pub-id-type="medline">39762808</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12911-024-02830-7</pub-id>
          <pub-id pub-id-type="pmcid">PMC11702098</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Glenn</surname>
              <given-names>WB</given-names>
            </name>
          </person-group>
          <article-title>Verification of forecasts expressed in terms of probability</article-title>
          <source>Mon Weather Rev</source>
          <year>1950</year>
          <month>01</month>
          <volume>78</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>3</lpage>
          <pub-id pub-id-type="doi">10.1175/1520-0493(1950)078&#60;0001:vofeit&#62;2.0.co;2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dawood</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Sidhu</surname>
              <given-names>BS</given-names>
            </name>
            <name name-style="western">
              <surname>Ruijsink</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Gould</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Porter</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Elliott</surname>
              <given-names>MK</given-names>
            </name>
            <name name-style="western">
              <surname>Mehta</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Rinaldi</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Puyol-Antón</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Razavi</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>King</surname>
              <given-names>AP</given-names>
            </name>
          </person-group>
          <article-title>Uncertainty aware training to improve deep learning model calibration for classification of cardiac MR images</article-title>
          <source>Med Image Anal</source>
          <year>2023</year>
          <month>08</month>
          <volume>88</volume>
          <fpage>102861</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1361-8415(23)00121-4"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.media.2023.102861</pub-id>
          <pub-id pub-id-type="medline">37327613</pub-id>
          <pub-id pub-id-type="pii">S1361-8415(23)00121-4</pub-id>
          <pub-id pub-id-type="pmcid">PMC10788705</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Eelbode</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Bertels</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Berman</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Vandermeulen</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Maes</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Bisschops</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Blaschko</surname>
              <given-names>MB</given-names>
            </name>
          </person-group>
          <article-title>Optimization for medical image segmentation: theory and practice when evaluating with dice score or Jaccard index</article-title>
          <source>IEEE Trans Med Imaging</source>
          <year>2020</year>
          <month>11</month>
          <volume>39</volume>
          <issue>11</issue>
          <fpage>3679</fpage>
          <lpage>90</lpage>
          <pub-id pub-id-type="doi">10.1109/tmi.2020.3002417</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Yan</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Malin</surname>
              <given-names>BA</given-names>
            </name>
          </person-group>
          <article-title>Membership inference attacks against synthetic health data</article-title>
          <source>J Biomed Inform</source>
          <year>2022</year>
          <month>01</month>
          <volume>125</volume>
          <fpage>103977</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(21)00306-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2021.103977</pub-id>
          <pub-id pub-id-type="medline">34920126</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(21)00306-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC8766950</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cobilean</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Mavikumbure</surname>
              <given-names>HS</given-names>
            </name>
            <name name-style="western">
              <surname>Drake</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Stuart</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Manic</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Investigating membership inference attacks against CNN models for BCI systems</article-title>
          <source>IEEE J Biomed Health Inform</source>
          <year>2025</year>
          <month>11</month>
          <volume>29</volume>
          <issue>11</issue>
          <fpage>8164</fpage>
          <lpage>74</lpage>
          <pub-id pub-id-type="doi">10.1109/jbhi.2025.3593443</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref59">
        <label>59</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>WH</given-names>
            </name>
            <name name-style="western">
              <surname>Shi</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>Differential privacy protection against membership inference attack on machine learning for genomic data</article-title>
          <source>Pac Symp Biocomput</source>
          <year>2021</year>
          <volume>26</volume>
          <fpage>26</fpage>
          <lpage>37</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://psb.stanford.edu/psb-online/proceedings/psb21/abstracts/2021_p26.html"/>
          </comment>
          <pub-id pub-id-type="medline">33691001</pub-id>
          <pub-id pub-id-type="pii">9789811232701_0003</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref60">
        <label>60</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bohrson</surname>
              <given-names>CL</given-names>
            </name>
            <name name-style="western">
              <surname>Barton</surname>
              <given-names>AR</given-names>
            </name>
            <name name-style="western">
              <surname>Lodato</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Rodin</surname>
              <given-names>RE</given-names>
            </name>
            <name name-style="western">
              <surname>Luquette</surname>
              <given-names>LJ</given-names>
            </name>
            <name name-style="western">
              <surname>Viswanadham</surname>
              <given-names>VV</given-names>
            </name>
            <name name-style="western">
              <surname>Gulhan</surname>
              <given-names>DC</given-names>
            </name>
            <name name-style="western">
              <surname>Cortés-Ciriano</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Sherman</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Kwon</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Coulter</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Galor</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Walsh</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>PJ</given-names>
            </name>
          </person-group>
          <article-title>Linked-read analysis identifies mutations in single-cell DNA-sequencing data</article-title>
          <source>Nat Genet</source>
          <year>2019</year>
          <month>04</month>
          <day>18</day>
          <volume>51</volume>
          <issue>4</issue>
          <fpage>749</fpage>
          <lpage>54</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/30886424"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41588-019-0366-2</pub-id>
          <pub-id pub-id-type="medline">30886424</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41588-019-0366-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC6900933</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref61">
        <label>61</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Luquette</surname>
              <given-names>LJ</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>MB</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Bohrson</surname>
              <given-names>CL</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Jin</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Gulhan</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Ganz</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bizzotto</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kirkham</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hochepied</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Libert</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Galor</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lodato</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Garaycoechea</surname>
              <given-names>JI</given-names>
            </name>
            <name name-style="western">
              <surname>Gawad</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>West</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Walsh</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>PJ</given-names>
            </name>
          </person-group>
          <article-title>Single-cell genome sequencing of human neurons identifies somatic point mutation and indel enrichment in regulatory elements</article-title>
          <source>Nat Genet</source>
          <year>2022</year>
          <month>10</month>
          <day>26</day>
          <volume>54</volume>
          <issue>10</issue>
          <fpage>1564</fpage>
          <lpage>71</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/36163278"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41588-022-01180-2</pub-id>
          <pub-id pub-id-type="medline">36163278</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41588-022-01180-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC9833626</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
