<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id><journal-id journal-id-type="publisher-id">medinform</journal-id><journal-id journal-id-type="index">7</journal-id><journal-title>JMIR Medical Informatics</journal-title><abbrev-journal-title>JMIR Med Inform</abbrev-journal-title><issn pub-type="epub">2291-9694</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v13i1e59685</article-id><article-id pub-id-type="doi">10.2196/59685</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Federated Analysis With Differential Privacy in Oncology Research: Longitudinal Observational Study Across Hospital Data Warehouses</article-title></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Ryffel</surname><given-names>Th&#x00E9;o</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Cr&#x00E9;quit</surname><given-names>Perrine</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Baillet</surname><given-names>Ma&#x00EB;lle</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Paumier</surname><given-names>Jason</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Marfoq</surname><given-names>Yasmine</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Girardot</surname><given-names>Olivier</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Chanet</surname><given-names>Thierry</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Sy</surname><given-names>Ronan</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Bayssat</surname><given-names>Louise</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Mazi&#x00E8;res</surname><given-names>Julien</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff3">3</xref><xref ref-type="aff" rid="aff4">4</xref><xref ref-type="aff" rid="aff5">5</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Vuiblet</surname><given-names>Vincent</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff6">6</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Ancel</surname><given-names>Julien</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff4">4</xref><xref ref-type="aff" rid="aff6">6</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Dewolf</surname><given-names>Maxime</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff6">6</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Margraff</surname><given-names>Fran&#x00E7;ois</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff7">7</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Bachot</surname><given-names>Camille</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff7">7</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Chmiel</surname><given-names>Jacek</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff7">7</xref></contrib></contrib-group><aff id="aff1"><institution>Arkhn</institution><addr-line>9, rue d'Alexandrie</addr-line><addr-line>Paris</addr-line><country>France</country></aff><aff id="aff2"><institution>H&#x00F4;pital Foch</institution><addr-line>Suresnes</addr-line><country>France</country></aff><aff id="aff3"><institution>Centre Hospitalier Universitaire de Toulouse, Service de Pneumologie</institution><addr-line>Toulouse</addr-line><country>France</country></aff><aff id="aff4"><institution>INSERM</institution><addr-line>Paris</addr-line><country>France</country></aff><aff id="aff5"><institution>Centre de Recherches en Canc&#x00E9;rologie Oncopole</institution><addr-line>Toulouse</addr-line><country>France</country></aff><aff id="aff6"><institution>Centre Hospitalier Universitaire de Reims, Service de Pneumologie</institution><addr-line>Reims</addr-line><country>France</country></aff><aff id="aff7"><institution>Roche SAS</institution><addr-line>Boulogne</addr-line><country>France</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Lovis</surname><given-names>Christian</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Imine</surname><given-names>Abdessamad</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Passerat-Palmbach</surname><given-names>Jonathan</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to  Th&#x00E9;o Ryffel, PhD, Arkhn, 9, rue d'Alexandrie, Paris, 75002, France; <email>theo.ryffel@arkhn.com</email></corresp></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>31</day><month>7</month><year>2025</year></pub-date><volume>13</volume><elocation-id>e59685</elocation-id><history><date date-type="received"><day>19</day><month>04</month><year>2024</year></date><date date-type="rev-recd"><day>09</day><month>12</month><year>2024</year></date><date date-type="accepted"><day>30</day><month>01</month><year>2025</year></date></history><copyright-statement>&#x00A9; Th&#x00E9;o Ryffel, Perrine Cr&#x00E9;quit, Ma&#x00EB;lle Baillet, Jason Paumier, Yasmine Marfoq, Olivier Girardot, Thierry Chanet, Ronan Sy, Louise Bayssat, Julien Mazi&#x00E8;res, Vincent Vuiblet, Julien Ancel, Maxime Dewolf, Fran&#x00E7;ois Margraff, Camille Bachot, Jacek Chmiel. Originally published in JMIR Medical Informatics (<ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org">https://medinform.jmir.org</ext-link>), 31.7.2025. </copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org/">https://medinform.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://medinform.jmir.org/2025/1/e59685"/><abstract><sec><title>Background</title><p>Federated analytics in health care allows researchers to perform statistical queries on remote datasets without access to the raw data. This method arose from the need to perform statistical analysis on larger datasets collected at multiple health care centers while avoiding regulatory, governance, and privacy issues that might arise if raw data were collected at a central location outside the health care centers. Despite some pioneering work, federated analytics is still not widely used on real-world data, and to our knowledge, no real-world study has yet combined it with other privacy-enhancing techniques such as differential privacy (DP).</p></sec><sec><title>Objective</title><p>The first objective of this study was to deploy a federated architecture in a real-world setting. The oncology study used for this deployment compared the medical health care management of patients with metastatic non&#x2013;small cell lung cancer before and after the first wave of COVID-19 pandemic. The second goal was to test DP in this real-world scenario to assess its practicality and use as a privacy-enhancing technology.</p></sec><sec sec-type="methods"><title>Methods</title><p>A federated architecture platform was set up in the Toulouse, Reims, and Foch centers. After harmonization of the data in each center, statistical analyses were performed using DataSHIELD (Data aggregation through anonymous summary-statistics from harmonized individual-level databases), a federated analysis R library, and a new open-source DP DataSHIELD package was implemented (dsPrivacy).</p></sec><sec sec-type="results"><title>Results</title><p>A total of 50 patients were enrolled in the Toulouse and Reims centers and 49 in the Foch center. We have shown that DataSHIELD is a practical tool to efficiently conduct our study across all 3 centers without exposing data on a central node, once a sufficient setup has been established to configure a secure network between hospitals. All planned aggregated results were successfully generated. We also observed that DP can be implemented in practice with promising trade-offs between privacy and accuracy, and we built a library that will prove useful for future work.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>The federated architecture platform made it possible to run a multicenter study on real-world oncology data while ensuring strong privacy guarantees using differential privacy.</p></sec></abstract><kwd-group><kwd>federated analysis</kwd><kwd>differential privacy</kwd><kwd>real-world oncology study</kwd><kwd>non-small cell lung cancer</kwd><kwd>COVID-19</kwd><kwd>lung cancer</kwd><kwd>cancer</kwd><kwd>privacy</kwd><kwd>oncology</kwd><kwd>oncology study</kwd><kwd>cell lung cancer</kwd><kwd>oncology data</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Federated analytics (FA) [<xref ref-type="bibr" rid="ref1">1</xref>] allow researchers to perform statistical queries on remote datasets without accessing raw data. This method has emerged from the need of conducting statistical analyses on larger datasets originating from multiple health care centers, while avoiding regulation, governance, and privacy related issues that could occur if the raw data were gathered in a central location external to the health care centers.</p><p>DataSHIELD (Data aggregation through anonymous summary-statistics from harmonized individual-level databases) [<xref ref-type="bibr" rid="ref2">2</xref>] is one of the pioneering open-source software solutions for bioscience collaboration using federated analysis. It has been used in several projects including the EU Child Cohort Network [<xref ref-type="bibr" rid="ref3">3</xref>] and German MIRACUM consortium [<xref ref-type="bibr" rid="ref4">4</xref>]. However, even if it has been identified as a next step in some oncology studies [<xref ref-type="bibr" rid="ref5">5</xref>], to the best of our knowledge it has not been used on real-world oncology data. One possible reason for this can be that data harmonization is actually the sticking point, since it proves to be challenging on real-world data when not already done ahead of time.</p><p>While FA ensures that sensitive data are never directly exposed, results from statistical queries can still leak some information from individuals. Indeed, several privacy attacks [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref7">7</xref>] have been proposed to exploit common statistical analysis results and disclose private information. To mitigate these attacks, differential privacy (DP) can be used in combination with FA to provide stronger privacy guarantees. DP [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref9">9</xref>] is a method for computing statistical analyses on a sensitive dataset in such a way that the results do not compromise the privacy of the initial raw data. It proves particularly appropriate for studies on patient health data which are highly sensitive, but as far as we know, no real-world data study have already combined FA and privacy-enhancing techniques such as DP. Our study focuses on a scenario with 3 hospital nodes, consistent with typical real-world deployments in health care, where the number of participating centers is usually small (on the order of a few nodes). Scalability and performance metrics (eg, query response times and network latency) were therefore not the primary focus of this pilot.</p><p>The goal of this study, called Distributed Analytics for Research in Hospitals (DARAH), is to evaluate the operational deployment of a federated architecture in the context of a real-world oncology study. Another objective is to analyze the impact of DP in a federated analysis on the meaningfulness of the study results.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Use of DataSHIELD</title><p>At the time of starting the project, we evaluated multiple FA frameworks and chose DataSHIELD due to its comprehensive privacy controls, stable community support, and mature set of statistical functions. DataSHIELD&#x2019;s unique strength lies in its local, decentralized authorization mechanism and built-in privacy disclosure checks, which prevent analysts from executing arbitrary code on remote servers. The &#x201C;default privacy disclosure mode&#x201D; enforces a baseline set of privacy checks (eg, thresholds on minimum cell counts) that align with real-world clinical data governance needs. While other tools like NVidia FLARE or custom Python/R frameworks exist, they often lack these out-of-the-box privacy safeguards, making DataSHIELD a practical choice for our use case. We maintained the default privacy settings throughout the study to ensure a fair demonstration of DataSHIELD&#x2019;s capabilities without additional configuration.</p></sec><sec id="s2-2"><title>Use of Differential Privacy</title><p>DP provides a measurement of the privacy risk associated with publishing each particular result on a sensitive dataset, by measuring the maximum leakage that each result can cause about the individuals&#x2019; data. In practice, it often works through the addition of a controlled amount of statistical noise to obscure the contributions to the result from each individual in the dataset.</p><p>Several open-source libraries exist that implement DP, most of which are written in Python or expose a Python interface. Popular ones include Google&#x2019;s DP library [<xref ref-type="bibr" rid="ref10">10</xref>], PyDP [<xref ref-type="bibr" rid="ref11">11</xref>] from the OpenMined community and OpenDP [<xref ref-type="bibr" rid="ref12">12</xref>]. In R, the main open-source library is the diffpriv library [<xref ref-type="bibr" rid="ref13">13</xref>] that implements some DP mechanisms but not a real suite of functions ready to use, and which is not actively supported with last contributions going back to 2017. Furthermore, none of these tools were directly compatible with the DataSHIELD framework, which requires a specific interface in R. As a result, a new open-source a DP R package (R Core Team) for DataSHIELD has been implemented: dsPrivacy. It is available in the Arkhn GitHub repository<ext-link ext-link-type="uri" xlink:href="https://github.com/arkhn/dsPrivacy">.</ext-link></p><p>dsPrivacy implements common statistical operations such as mean (SD) with DP and can be directly integrated into DataSHIELD. More specifically, pure DP has been implemented, which means that the statistical noise added to the result is drawn from a Laplacian distribution. Privacy is therefore defined with a single parameter &#x201C;&#x03B5;&#x201D; (which corresponds to the inverse of the noise variance) and it is called the privacy budget. The privacy budget &#x03B5; controls the amount of noise injected in the computation and hence the privacy of the analysis, smaller the privacy budget &#x03B5;, higher the noise, which means better privacy guarantees since the private information is better covered by the noise.</p><p>DP induces a trade-off between privacy and accuracy of the analysis [<xref ref-type="bibr" rid="ref14">14</xref>] as privacy is ensured with noise, better privacy means a lower signal-to-noise ratio and less meaningful results. Conversely, when &#x03B5; is high, the noise is reduced and privacy degrades. Choosing the right value for &#x03B5; from a privacy standpoint is quite controversial [<xref ref-type="bibr" rid="ref15">15</xref>] and is highly dependent on the context and the study considered.</p><p>dsPrivacy in the context of FA works by adding Laplacian noise locally at each center on the results computed on the local datasets before results are aggregated on a central node. This is referred to as local DP, as opposed to central DP, where the noise is added after the aggregation part on the central node. This paradigm is detailed in the Discussion section.</p></sec><sec id="s2-3"><title>Use Case: Differences in the Patient Drug Exposure of Patients With Non&#x2013;Small Cell Lung Cancer Before and After the First Wave of the COVID-19 Pandemic</title><sec id="s2-3-1"><title>Context</title><p>In order to test the implementation of a federated platform with DP, a study was conducted using real-world oncology data, with the aim of analyzing the differences in the patient drug exposure of patients with non&#x2013;small cell lung cancer before and after the first wave of the COVID-19 pandemic. Specifically, the analyses were based on the first line of treatment, including its duration and disease progression at 24 months. The study was carried out in 3 hospitals: Foch Hospital, Toulouse University Hospital Center, and Reims University Hospital Center.</p></sec><sec id="s2-3-2"><title>Patient Selection</title><p>The inclusion criteria were adult patients with metastatic non&#x2013;small cell lung cancer treated with chemotherapy, immunotherapy, antiangiogenic therapy, or any combination of these treatments at Foch, Toulouse, and Reims centers between March 2019 and March 2021. The list of considered treatments is available in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p><p>The exclusion criteria included patients objecting to the reuse of their data, protected adult patients (patients under curatorship, tutorship, or advisership), patients undergoing a clinical trial, patients whose follow-up did not start in one of these centers, patients who are not immediately metastatic, and patients with an epidermal growth factor receptor mutation, anaplastic lymphoma kinase translocation, or ROS proto-oncogene 1 mutation.</p><p>For this study, the objective was to have 25 patients per period and per site (ie, 50 patients per center). Initially, patients were preselected using the inclusion criteria present in the chemotherapy prescription software CHIMIO, namely the date and type of treatment. Since the other criteria for inclusion and exclusion were not available in CHIMIO, physicians in each center manually assessed whether the patients could be included in the study.</p></sec><sec id="s2-3-3"><title>Variables</title><p>In this study, the variables of interest were the duration of the first line of treatment and the disease progression at 24 months following or during the first line of treatment. The start of a second line of treatment or death following (before the start of a second line) or during the first line of treatment were the proxies used for disease progression at 24 months. These events had to have occurred during the observation period, which was 2 years after the patient&#x2019;s inclusion in the study. The explanatory variable was the patient&#x2019;s inclusion period, before the first wave of COVID-19 (March 1, 2019, to March 1, 2020) or after the first wave of COVID-19 (March 2, 2020, to March 31, 2021). Some potential confounders were also studied, such as age, gender, BMI, blood creatinine level, and type of treatment. All these variables were extracted from the CHIMIO software and are listed in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>.</p></sec><sec id="s2-3-4"><title>Data Harmonization</title><p>In this study, a physician visited each participating site to ensure consistent variable definitions, coding standards, and data formats. We chose Fast Healthcare Interoperability Resources (FHIR) as the initial data standard [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref17">17</xref>], due to its maturity and support in oncology, and the data model is available in <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>. Harmonization involved reviewing data dictionaries at each hospital, resolving semantic ambiguities (eg, different coding for treatments), and ensuring uniform data types and units. This manual process, though time-consuming, proved crucial for producing a common dataset compatible with federated queries. In future implementations, automated or semiautomated harmonization workflows, potentially protected by DP to further safeguard patient privacy during preprocessing, could streamline this step. To facilitate the analyses, a tabularized version of the FHIR standard has been produced and the correspondence between the variables of interest used in the datasets and the FHIR attributes are presented in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>.</p></sec><sec id="s2-3-5"><title>Statistical Definition Without Differential Privacy</title><p>First, univariate and bivariate descriptive statistics were performed for the variables of interest, the explanatory variables and the confounding factors. For the qualitative variables, percentages per category were calculated. For the quantitative variables, the mean but also the 5th, 25th, 50th, 75th, and 95th percentiles were computed. The minimums and maximums were not computed because these values are considered disclosive (eg, the presence of an outlier) in DataSHIELD standard configuration.</p><p>Then, to ensure the absence of confounding factors, covariates for which there was a difference between the 2 groups (before and after the first COVID-19 wave) in bivariate analysis with a <italic>P</italic> value of &#x003C;.20 were included in the multivariate models. A Student <italic>t</italic> test was used for quantitative variables. A chi-square test was used for qualitative variables with at least 5 elements in each class. Otherwise, a Fisher test was used.</p><p>Finally, to investigate a difference in management between patients in the first and second waves, a linear regression was performed. The variable of interest was the duration of first-line treatment at the metastatic stage and the explanatory variable was the period (before or after the first wave). The duration of treatment was defined as the period from day 1 to the last day of the first line. A multivariate survival analysis (Cox model) was also performed in which the event of interest was the disease progression at 24 months. The explanatory variable was also the period (before or after the first wave). Potential confounders identified in the previous step were included in both multivariate analyses. A difference was considered significant if the CI did not contain 1 for linear regression and survival analysis.</p></sec><sec id="s2-3-6"><title>Statistical Definition With Differential Privacy</title><p>The univariate and bivariate statistical analyses presented in above were also performed with DP. The global strategy used to implement DP has been discussed in &#x201C;Use of Differential Privacy&#x201D; section and some details for each part of the study are detailed here.</p><p>All the univariate analyses run code from PyDP [<xref ref-type="bibr" rid="ref11">11</xref>] that we wrapped in dsPrivacy. As adding DP preserves privacy, the minimum and maximum values could be computed instead of 5th and 95th percentiles. Then bivariate analyses were carried out. For quantitative variables, an implementation of the Student <italic>t</italic> test is used and from the result of this test, a <italic>P</italic> value is inferred. For qualitative variables, occurrence tables are computed (under the hood, the function tableDP from DPPack [<xref ref-type="bibr" rid="ref18">18</xref>] is used in each center and all the tables are summed) and then a chi-square or Fisher test is performed with the R functions &#x201C;chisq.test&#x201D; and &#x201C;fisher.test.&#x201D; Linear regression and Cox models were not implemented with DP.</p><p>Determining appropriate &#x03B5; values is challenging and context-dependent. In this study, our priority was to maintain analytical use. After testing lower &#x03B5; values (closer to 1) that yielded excessive noise and unusable results, we selected <italic>&#x03B5;</italic>=5.0 for univariate analyses and <italic>&#x03B5;</italic>=60.0 for complex operations like the Student <italic>t</italic> tests. While <italic>&#x03B5;</italic>=60.0 is higher than common DP standards in theoretical literature, this choice reflects our small sample size (~50 patients/center) and the need to ensure meaningful statistical inference. In scenarios with more patients or improved aggregation techniques (eg, secure aggregation enabling central DP), lower &#x03B5; values could be achieved. As this was a feasibility study, we highlight that future work should explore more advanced DP mechanisms, larger sample sizes, and improved cryptographic methods to reduce the required privacy budget.</p></sec></sec><sec id="s2-4"><title>Ethical Considerations</title><p>From an ethical and regulatory standpoint, this study complied with the MR-004 reference methodology and adhered to GDPR requirements since DP alone does not classify data as anonymized under current regulatory frameworks. However, the use of DP strengthens data protection, and aligns with emerging privacy regulations by minimizing data exposure risks. These regulatory environments emphasize data sovereignty, patient consent, and robust security, all of which are supported by our federated, privacy-enhancing architecture. All patients enrolled in this study were informed individually, and those who exercised their right to opt out were removed from the study. This is an observational study and the research ethics committees of all three centers in Toulouse, Reims, and Foch have confirmed that no ethical approval is required and have authorized this project on their patient data.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Deployment of Federated Architecture in the Three Centers</title><p>The schema of our federated architecture is given in <xref ref-type="fig" rid="figure1">Figure 1</xref>. Researchers connect through a VPN to a central node hosted on a cloud provider&#x2013;certified ISO (International Organization for Standardization) 27001 standard. This central node coordinates the execution of the queries on the remote data assets hosted in the different hospitals and aggregate all the responses received. Each hospital exposes through the private network pseudonymized datasets, which originate from their local harmonized data architecture, but which are completely isolated on a dedicated infrastructure for security purposes. Each hospital receives and executes remote requests from the central node that match local permissions set in DataSHIELD regarding data assets, authorized functions, and legitimate users. This ensures that hospitals keep full sovereignty on how their data are exploited.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Federated architecture diagram.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e59685_fig01.png"/></fig><p>One key element is deploying a secure private network between all stakeholders, ensuring that each hospital only exposes pseudonymized data within a controlled environment. Although these pseudonymized datasets were not themselves protected by DP before analysis (since DP is applied at query-time), the secure network, encryption (TLS), and isolation measures minimize risks. We did not use &#x201C;Let&#x2019;s Encrypt&#x201D; for certificates due to internal security policies favoring certificates from recognized authorities and the controlled VPN environment lacking public domain validation. Instead, a custom approach using a trusted certificate authority provided both strong authentication and encryption tailored to our network configuration.</p></sec><sec id="s3-2"><title>Flowchart</title><p>The flowchart is presented in <xref ref-type="fig" rid="figure2">Figure 2</xref>. In total, 75 and 74 patients from respectively before and after the first wave were included in the analysis comparing disease progression. Of the patients in the period before, 63 had progressed, 9 were progression-free, and 3 had changed groups during the observation period and were therefore censored at the time of transfer. Of the patients in the period after, 55 had progressed, 17 were progression-free and 2 had changed groups during the observation period and were therefore censored at the time of transfer. Thus, after exclusion of patients who changed centers, 72 patients from each period were included in the analysis of the duration of the first line of treatment.</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Patient selection and exclusion process between two periods: before and after the first wave (BW and AW).</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e59685_fig02.png"/></fig></sec><sec id="s3-3"><title>Bivariate Analysis and Selection of Potential Confounders</title><p>Combined univariate analyses without and those with DP are presented in <xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>. Combined bivariate analyses without and with DP are presented in <xref ref-type="table" rid="table1">Tables 1</xref> and <xref ref-type="table" rid="table2">2</xref>, respectively. Direct comparison between DP and no-DP analyses across all periods is available in <xref ref-type="table" rid="table3">Table 3</xref>. In analysis without and with DP, the covariates selected for multivariate analyses were the treatment type (&#x003C;.001) only.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Bivariate analyses without differential privacy.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Variables</td><td align="left" valign="bottom">Patients (period before; n=75)</td><td align="left" valign="bottom">Patients (period after; n=74)</td><td align="left" valign="bottom"><italic>P</italic> value</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="3">Variables of interest</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Disease progression, n (%)</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">.21</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>No</td><td align="left" valign="top">12 (16)</td><td align="left" valign="top">19 (25.7)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Yes</td><td align="left" valign="top">63 (84)</td><td align="left" valign="top">55 (74.3)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Missing</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>First line duration (days)</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">.09</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Mean (SD)</td><td align="left" valign="top">179.7 (267.1)</td><td align="left" valign="top">255.2 (274.6)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Median (IQR)</td><td align="left" valign="top">75.7 (14.7&#x2010;190)</td><td align="left" valign="top">141.8 (45.1&#x2010;420.8)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>5th and 95th percentiles</td><td align="left" valign="top">0&#x2010;592.4</td><td align="left" valign="top">15&#x2010;792.8</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Missing, n (%)</td><td align="left" valign="top">(0)</td><td align="left" valign="top">(0)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="3">Covariables</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Organization, n (%)</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">.99</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Toulouse University Hospital</td><td align="left" valign="top">25 (33.3)</td><td align="left" valign="top">25 (33.8)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Reims University Hospital</td><td align="left" valign="top">25 (33.3)</td><td align="left" valign="top">25 (33.8)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Foch Hospital</td><td align="left" valign="top">25 (33.3)</td><td align="left" valign="top">24 (32.4)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Missing</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Gender, n (%)</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">.79</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Female</td><td align="left" valign="top">33 (44)</td><td align="left" valign="top">30 (40.5)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Male</td><td align="left" valign="top">42 (56)</td><td align="left" valign="top">44 (59.5)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Missing</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Age (years), n (%)</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">.38</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x003C;55</td><td align="left" valign="top">12 (16)</td><td align="left" valign="top">10 (13.5)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>55&#x2010;65</td><td align="left" valign="top">30 (40)</td><td align="left" valign="top">23 (31.1)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x003E;65</td><td align="left" valign="top">33 (44)</td><td align="left" valign="top">41 (55.4)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Missing</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>BMI (kg/m&#x00B2;), n (%)</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">.39</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x003C;18.5</td><td align="left" valign="top">13 (17.3)</td><td align="left" valign="top">19 (25.7)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>18.5&#x2010;25</td><td align="left" valign="top">34 (45.3)</td><td align="left" valign="top">27 (36.5)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x003E;25</td><td align="left" valign="top">28 (37.3)</td><td align="left" valign="top">28 (37.8)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Missing</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Treatment category, n (%)</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Chemotherapy</td><td align="left" valign="top">46 (61.3)</td><td align="left" valign="top">30 (40.5)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Chemotherapy+angiogenesis inhibitor</td><td align="left" valign="top">6 (8)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Chemotherapy+immunotherapy</td><td align="left" valign="top">7 (9.3)</td><td align="left" valign="top">33 (44.6)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Immunotherapy</td><td align="left" valign="top">16 (21.3)</td><td align="left" valign="top">11 (14.9)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Missing</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Creatinemia (&#x00B5;mol/l)</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">.47</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Mean (SD)</td><td align="left" valign="top">66.7 (20.3)</td><td align="left" valign="top">64.3 (18.9)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Median (IQR)</td><td align="left" valign="top">60.0 (54.7&#x2010;73.3)</td><td align="left" valign="top">63.7 (55.1&#x2010;73.1)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>5th and 95th percentiles</td><td align="left" valign="top">46.7&#x2010;98.8</td><td align="left" valign="top">41.1&#x2010;82.8</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Missing, n (%)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">1 (1.4)</td><td align="left" valign="top"/></tr></tbody></table></table-wrap><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Bivariate analyses with differential privacy.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Variables</td><td align="left" valign="bottom">Patients (period before)</td><td align="left" valign="bottom">Patients (period after)</td><td align="left" valign="bottom"><italic>P</italic> value</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="3">Variables of interest</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Disease progression (<italic>&#x03B5;<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup></italic>=5.0), n (%)</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">.27</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>No</td><td align="left" valign="top">12 (16)</td><td align="left" valign="top">18 (24.7)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Yes</td><td align="left" valign="top">63 (84)</td><td align="left" valign="top">55 (75.3)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Firstline duration (days<break/>; <italic>&#x03B5;</italic>=5.0, except <italic>P</italic> value: <italic>&#x03B5;</italic>=60.0)</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">.051</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Mean (SD)</td><td align="left" valign="top">189.5 (231.1)</td><td align="left" valign="top">287.4 (286.3)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Median</td><td align="left" valign="top">81.8</td><td align="left" valign="top">132.6</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Range</td><td align="left" valign="top">0.3&#x2010;1359.5</td><td align="left" valign="top">8.5&#x2010;827.1</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="3">Covariables</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Gender (<italic>&#x03B5;</italic>=5.0), n (%)</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">.92</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Female</td><td align="left" valign="top">32 (43.2)</td><td align="left" valign="top">30 (41.1)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Male</td><td align="left" valign="top">42 (56.6)</td><td align="left" valign="top">43 (58.9)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Age (years; <italic>&#x03B5;</italic>=5.0), n (%)</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">.37</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x003C;55</td><td align="left" valign="top">12 (16.2)</td><td align="left" valign="top">10 (13.7)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>55&#x2010;65</td><td align="left" valign="top">29 (39.2)</td><td align="left" valign="top">22 (30.1)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x003E;65</td><td align="left" valign="top">33 (44.6)</td><td align="left" valign="top">41 (56.2)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>BMI (kg/m&#x00B2;; <italic>&#x03B5;</italic>=5.0), n (%)</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">.38</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x003C;18.5</td><td align="left" valign="top">13 (17.1)</td><td align="left" valign="top">19 (25.7)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>18.5&#x2010;25</td><td align="left" valign="top">34 (44.7)</td><td align="left" valign="top">27 (36.5)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x003E;25</td><td align="left" valign="top">29 (38.2)</td><td align="left" valign="top">28 (37.8)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Treatment category (<italic>&#x03B5;</italic>=5.0), n (%)</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">.001</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Chemotherapy</td><td align="left" valign="top">46 (61.3)</td><td align="left" valign="top">31 (39.7)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Chemotherapy+angiogenesis inhibitor</td><td align="left" valign="top">6 (8)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Chemotherapy+immunotherapy</td><td align="left" valign="top">7 (9.3)</td><td align="left" valign="top">35 (44.9)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Immunotherapy</td><td align="left" valign="top">16 (21.3)</td><td align="left" valign="top">12 (15.4)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Creatinemia (&#x00B5;mol/L)<break/>(<italic>&#x03B5;</italic>=5.0 except for <italic>P</italic> value: <italic>&#x03B5;</italic>=60.0)</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">.53</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Mean (SD)</td><td align="left" valign="top">65.4 (18.9)</td><td align="left" valign="top">61.9 (17.1)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Median</td><td align="left" valign="top">64.4</td><td align="left" valign="top">65.4</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Range</td><td align="left" valign="top">48.8&#x2010;88.9</td><td align="left" valign="top">37.4&#x2010;86.1</td><td align="left" valign="top"/></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup> <italic>&#x03B5;</italic>: privacy budget.</p></fn></table-wrap-foot></table-wrap><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Comparison of bivariate analyses across all periods (<named-content content-type="#e51c23"/>before and after), with and without differential privacy.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Variables</td><td align="left" valign="bottom">Global results (before and after combined) without DP<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup></td><td align="left" valign="bottom">Global results (before and after combined) with DP (<italic>&#x03B5;<sup><xref ref-type="table-fn" rid="table3fn2">b</xref></sup></italic>=5.0)</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="3">Variables of interest</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Disease progression, n</td><td align="left" valign="top" colspan="2"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>No</td><td align="left" valign="top">31</td><td align="left" valign="top">31</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Yes</td><td align="left" valign="top">118</td><td align="left" valign="top">118</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>First-line duration (days)</td><td align="left" valign="top" colspan="2"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Mean (SD)</td><td align="left" valign="top">217.2 (269.4)</td><td align="left" valign="top">198.9 (286)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Median</td><td align="left" valign="top">113.5</td><td align="left" valign="top">126.4</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Range</td><td align="left" valign="top">0.5&#x2010;785.6</td><td align="left" valign="top">0.1&#x2010;524.8</td></tr><tr><td align="left" valign="top" colspan="3">Covariables</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Gender, n (%)</td><td align="left" valign="top" colspan="2"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Female</td><td align="left" valign="top">63</td><td align="left" valign="top">63</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Male</td><td align="left" valign="top">86</td><td align="left" valign="top">87</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Age (years), n</td><td align="left" valign="top" colspan="2"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x003C;55</td><td align="left" valign="top">22</td><td align="left" valign="top">21</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>55&#x2010;65</td><td align="left" valign="top">53</td><td align="left" valign="top">52</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x003E;65</td><td align="left" valign="top">74</td><td align="left" valign="top">75</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>BMI (kg/m&#x00B2;), n</td><td align="left" valign="top" colspan="2"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x003C;18.5</td><td align="left" valign="top">32</td><td align="left" valign="top">32</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>18.5&#x2010;25</td><td align="left" valign="top">61</td><td align="left" valign="top">61</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x003E;25</td><td align="left" valign="top">56</td><td align="left" valign="top">56</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Treatment category, n</td><td align="left" valign="top" colspan="2"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Chemotherapy</td><td align="left" valign="top">76</td><td align="left" valign="top">76</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Chemotherapy+ angiogenesis inhibitor</td><td align="left" valign="top">6</td><td align="left" valign="top">6</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Chemotherapy+ immunotherapy</td><td align="left" valign="top">40</td><td align="left" valign="top">41</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Immunotherapy</td><td align="left" valign="top">27</td><td align="left" valign="top">27</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Creatinemia (&#x00B5;mol/L)</td><td align="left" valign="top" colspan="2"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Mean (SD)</td><td align="left" valign="top">65.5 (19.6)</td><td align="left" valign="top">64.6 (15.15)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Median</td><td align="left" valign="top">62.3</td><td align="left" valign="top">64.3</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Range</td><td align="left" valign="top">43.9&#x2010;92.8</td><td align="left" valign="top">45.6&#x2010;83.7</td></tr></tbody></table><table-wrap-foot><fn id="table3fn1"><p><sup>a</sup> DP: differential privacy.</p></fn><fn id="table3fn2"><p><sup>b</sup> <italic>&#x03B5;</italic>: privacy budget.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-4"><title>Comparison of the Progression Between Two Periods (Cox Model)</title><p>In the analysis without DP, the hazard ratio of the cox model for the period before compared with the period after the first wave was 0.98 (95% CI 0.65-1.46). As the 95% CI includes 1, the two periods were not considered significantly different in terms of disease progression at 24 months after adjustment for a significant covariate (treatment type).</p></sec><sec id="s3-5"><title>Comparison of the Duration of the First Line of Treatment Between the Two Periods (Linear Regression)</title><p>In the analysis without DP, the coefficient of linear regression for the first period compared with the second one was &#x2013;13.84 (95% CI &#x2013;103.82 to 76.14). As the CI includes 1, the two periods were not considered significantly different in terms of first line duration after adjustment for significant covariate (treatment type).</p></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>In this study, a federated analysis with and without DP was performed on a real-world study in oncology. The real-world study showed consistent results in both settings. In particular, identical conclusions were drawn regarding the lack of difference in first-line treatment duration and disease progression at 24 months in non&#x2013;small cell lung cancer patients treated before or after the first wave of COVID-19 pandemic.</p><p>Real-world deployment in 3 centers has shed light on some key aspects in terms of security. Regarding tools, DataSHIELD offers a lot of flexibility as it allows the use of custom libraries such as dsPrivacy implemented as part of this study. The downside is that community libraries are not always well maintained and bugs can be encountered (eg, dsStats had to be fixed manually). DataSHIELD builds upon Opal [<xref ref-type="bibr" rid="ref19">19</xref>], a convenient data management application which comes with straightforward but very satisfactory user management and makes it easy to configure access to specific data to specific users. Opal is also secured by design and enforces many good security practices like CSRF (Cross-Site Request Forgery) and HTTPS usage. However, available docker images to deploy it have several major known security vulnerabilities and do not seem regularly updated. Regarding network configuration, setting up strong security standards across all sites has proved challenging. An IpSec bridge was set up to enable secure communication between the central node and the hospitals. Communication among all stakeholders was a key factor for this step and formal processes (network schema, requirements formalization, debugging methods, and so on) proved decisive in order to facilitate discussions. Regarding certificates to secure communications inside the private network, the primary intention was to use certificates signed by hospitals internal certificate authority because it would not match our security requirements so certificates signed by public certificate authority have been claimed. Some hospitals provided a Sertigo certificate but it was not natively recognized by the central node server. Another hospital used instead a public certificate generated by the central node manager (Arkhn). This last solution has proven to be the best solution in terms of efficiency and security, even if the domain names covered by these certificates are not representing the actual ownership of hosts.</p><p>Regarding data standards, we chose FHIR, since it appeared to be the most mature health standard in oncology at the beginning of this project [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref17">17</xref>]. However, Observational Medical Outcomes Partnership (OMOP) is developing extensions for oncology and is rapidly closing the gap [<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref21">21</xref>]. As the FHIR standard corresponds to json files that are not very suitable for analytical purposes, we anticipate that moving to OMOP will be more convenient for future analyses.</p><p>Overall, our experience suggests that the most time and work intensive parts are building harmonized data models locally and setting up the network infrastructure. As both these steps are agnostic of the study considered, we anticipate that they can be easily leveraged to scale the number of studies carried out on this infrastructure.</p><p>On the DP side, it has been decided not to perform linear regression and Cox models with DP because implementing it with a moderate privacy budget was deemed too complex. Privacy budgets used in this study (especially for computing the <italic>P</italic> values) are quite high compared with the literature [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref22">22</xref>], in order to achieve reasonable accuracy on differentially private results but we have shown that we are able to derive similar results compared with plain FA. As underlined above, the appropriate level of privacy is highly dependent on the context considered. Here, given that this study was already compliant to the French MR-004 methodology without DP, DP was used by prioritizing usefulness over privacy. In other contexts, especially if DP becomes recognized as a legitimate and safe technology to process personal data, and hence benefits from a dedicated regulatory status, lower privacy budgets will probably be required (alongside privacy-focused pen tests). We have identified 3 directions to achieve this. The first direction is to increase the number of patients per center. This is the most straightforward option to improve the privacy vs accuracy trade-off, since the amount of noise to add to reach a certain privacy budget &#x03B5; directly depends on the number of individuals. We have included close to 50 patients per center, which is quite low especially for some budget intensive operations for which we estimate that a thousand patients would be adapted. Second, by using central DP. If the noise is added on the central node, it is computed considering the sum of the patients across all the centers and enables lower noise for the same privacy budget. This is especially powerful if many centers are participating in the federated analysis. However, this means that by default the central node can see the contribution of each center without any noise which is a privacy breach if it cannot be trusted. A common solution is to implement secure aggregation [<xref ref-type="bibr" rid="ref23">23</xref>], meaning that all contributions are hidden and are only disclosed after the aggregation operation, using cryptographic mechanisms such as secure multiparty computation [<xref ref-type="bibr" rid="ref24">24</xref>], homomorphic encryption [<xref ref-type="bibr" rid="ref25">25</xref>], or functional encryption [<xref ref-type="bibr" rid="ref26">26</xref>]. Secure aggregation is not yet implemented in dsPrivacy and is left as future work. Finally, it can be achieved by improving the DP mechanism. We have used pure or &#x03B5;-DP, which is a simple mechanism and which makes composition very simple, since the privacy budget of a sequence of operations is the sum of the budget of each operation. More complex mechanisms such as (&#x03B5;, &#x03B4;)-DP [<xref ref-type="bibr" rid="ref6">6</xref>] or R&#x00E9;nyi DP [<xref ref-type="bibr" rid="ref27">27</xref>] provide more optimized composition properties [<xref ref-type="bibr" rid="ref28">28</xref>] that allow for a tighter privacy budget management.</p></sec><sec id="s4-2"><title>Conclusions</title><p>The DARAH project illustrates FA are a practical method to conduct scientific projects while improving data privacy, by keeping patient data stored in the hospitals and leveraging their already existing data architecture. It highlights some key challenges to be anticipated and possible answers to ensure the success of this type of projects. It also shows that DP can be used in addition to FA to improve privacy guarantees, but more experimentation is needed to develop guidelines and best practices, especially around the trade-off between accuracy and privacy. Finally, in an emerging ecosystem where tools for FA and DP are not yet well integrated, the dsPrivacy library will prove useful for researchers who want to explore privacy-friendly analysis methods.</p></sec></sec></body><back><ack><p>This work was supported by private funding from Roche. Apart from this, the authors declare that no funds, grants, or other support were received during the preparation of this manuscript.</p></ack><notes><sec><title>Data Availability</title><p>All generic source code has been made available as open source in the dsPrivacy and is available on Arkhn GitHub organization. Specific code to reproduce the study will be made available upon reasonable request to the corresponding author. The data underlying this article cannot be made publicly available due to the privacy of the patients involved in this study.</p></sec></notes><fn-group><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">CSRF</term><def><p>Cross-Site Request Forgery</p></def></def-item><def-item><term id="abb2">DARAH</term><def><p> Distributed Analytics for Research in Hospitals</p></def></def-item><def-item><term id="abb3">DataSHIELD</term><def><p>Data aggregation through anonymous summary-statistics from harmonized individual-level databases</p></def></def-item><def-item><term id="abb4">DP</term><def><p> differential privacy</p></def></def-item><def-item><term id="abb5">FA</term><def><p> federated analytics</p></def></def-item><def-item><term id="abb6">FHIR</term><def><p>Fast Healthcare Interoperability Resources</p></def></def-item><def-item><term id="abb7">ISO</term><def><p>International Organization for Standardization</p></def></def-item><def-item><term id="abb8">OMOP</term><def><p>Observational Medical Outcomes Partnership</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rieke</surname><given-names>N</given-names> </name><name name-style="western"><surname>Hancox</surname><given-names>J</given-names> </name><name name-style="western"><surname>Li</surname><given-names>W</given-names> </name><etal/></person-group><article-title>The future of digital health with federated learning</article-title><source>NPJ Digit Med</source><year>2020</year><volume>3</volume><fpage>119</fpage><pub-id pub-id-type="doi">10.1038/s41746-020-00323-1</pub-id><pub-id pub-id-type="medline">33015372</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gaye</surname><given-names>A</given-names> </name><name name-style="western"><surname>Marcon</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Isaeva</surname><given-names>J</given-names> </name><etal/></person-group><article-title>DataSHIELD: taking the analysis to the data, not the data to the analysis</article-title><source>Int J Epidemiol</source><year>2014</year><month>12</month><volume>43</volume><issue>6</issue><fpage>1929</fpage><lpage>1944</lpage><pub-id pub-id-type="doi">10.1093/ije/dyu188</pub-id><pub-id pub-id-type="medline">25261970</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jaddoe</surname><given-names>VWV</given-names> </name><name name-style="western"><surname>Felix</surname><given-names>JF</given-names> </name><name name-style="western"><surname>Andersen</surname><given-names>AMN</given-names> </name><etal/></person-group><article-title>The LifeCycle Project-EU Child Cohort Network: a federated analysis infrastructure and harmonized data of more than 250,000 children and parents</article-title><source>Eur J Epidemiol</source><year>2020</year><month>07</month><volume>35</volume><issue>7</issue><fpage>709</fpage><lpage>724</lpage><pub-id pub-id-type="doi">10.1007/s10654-020-00662-z</pub-id><pub-id pub-id-type="medline">32705500</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Prokosch</surname><given-names>HU</given-names> </name><name name-style="western"><surname>Acker</surname><given-names>T</given-names> </name><name name-style="western"><surname>Bernarding</surname><given-names>J</given-names> </name><etal/></person-group><article-title>MIRACUM: Medical Informatics in Research and Care in University Medicine</article-title><source>Methods Inf Med</source><year>2018</year><month>07</month><volume>57</volume><issue>S 01</issue><fpage>e82</fpage><lpage>e91</lpage><pub-id pub-id-type="doi">10.3414/ME17-02-0025</pub-id><pub-id pub-id-type="medline">30016814</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gruendner</surname><given-names>J</given-names> </name><name name-style="western"><surname>Wolf</surname><given-names>N</given-names> </name><name name-style="western"><surname>T&#x00F6;gel</surname><given-names>L</given-names> </name><name name-style="western"><surname>Haller</surname><given-names>F</given-names> </name><name name-style="western"><surname>Prokosch</surname><given-names>HU</given-names> </name><name name-style="western"><surname>Christoph</surname><given-names>J</given-names> </name></person-group><article-title>Integrating Genomics and Clinical Data for Statistical Analysis by Using GEnome MINIng (GEMINI) and Fast Healthcare Interoperability Resources (FHIR): system design and implementation</article-title><source>J Med Internet Res</source><year>2020</year><month>10</month><day>7</day><volume>22</volume><issue>10</issue><fpage>e19879</fpage><pub-id pub-id-type="doi">10.2196/19879</pub-id><pub-id pub-id-type="medline">33026356</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Shokri</surname><given-names>R</given-names> </name><name name-style="western"><surname>Stronati</surname><given-names>M</given-names> </name><name name-style="western"><surname>Song</surname><given-names>C</given-names> </name><name name-style="western"><surname>Shmatikov</surname><given-names>V</given-names> </name></person-group><article-title>Membership inference attacks against machine learning models</article-title><conf-name>2017 IEEE Symposium on Security and Privacy (SP)</conf-name><conf-date>May 22-24, 2017</conf-date><conf-loc>San Jose, CA, USA</conf-loc><fpage>3</fpage><lpage>18</lpage><pub-id pub-id-type="doi">10.1109/SP.2017.41</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Melis</surname><given-names>L</given-names> </name><name name-style="western"><surname>Song</surname><given-names>C</given-names> </name><name name-style="western"><surname>De Cristofaro</surname><given-names>E</given-names> </name><name name-style="western"><surname>Shmatikov</surname><given-names>V</given-names> </name></person-group><article-title>Exploiting unintended feature leakage in collaborative learning</article-title><conf-name>2019 IEEE Symposium on Security and Privacy (SP)</conf-name><conf-date>May 19-23, 2019</conf-date><conf-loc>San Francisco, CA, USA</conf-loc><publisher-name>IEEE</publisher-name><fpage>691</fpage><lpage>706</lpage><pub-id pub-id-type="doi">10.1109/SP.2019.00029</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Dwork</surname><given-names>C</given-names> </name><etal/></person-group><article-title>Our data, ourselves: privacy via distributed noise generation</article-title><conf-name>Advances in Cryptology-EUROCRYPT 2006: 24th Annual International Conference on the Theory and Applications of Cryptographic Techniques 2006</conf-name><conf-date>May 28, 2006</conf-date><pub-id pub-id-type="doi">10.1007/11761679_29</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Dwork</surname><given-names>C</given-names> </name><name name-style="western"><surname>Roth</surname><given-names>A</given-names> </name></person-group><article-title>The algorithmic foundations of differential privacy</article-title><source>FNT in Theoretical Computer Science</source><year>2014</year><volume>9</volume><issue>3-4</issue><fpage>211</fpage><lpage>407</lpage><pub-id pub-id-type="doi">10.1561/0400000042</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="web"><article-title>Google/differential-privacy</article-title><source>GitHub</source><access-date>2023-11-29</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://github.com/google/differential-privacy">https://github.com/google/differential-privacy</ext-link></comment></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="web"><article-title>OpenMined/pydp</article-title><source>GitHub</source><access-date>2023-11-29</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://github.com/OpenMined/PyDP">https://github.com/OpenMined/PyDP</ext-link></comment></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="web"><article-title>Opendp/opendp</article-title><source>GitHub</source><access-date>2023-11-29</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://github.com/opendp/opendp">https://github.com/opendp/opendp</ext-link></comment></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="web"><article-title>Brubinstein/diffpriv</article-title><source>GitHub</source><access-date>2023-11-29</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://github.com/brubinstein/diffpriv">https://github.com/brubinstein/diffpriv</ext-link></comment></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Alvim</surname><given-names>MS</given-names> </name><name name-style="western"><surname>Andr&#x00E9;s</surname><given-names>ME</given-names> </name><name name-style="western"><surname>Chatzikokolakis</surname><given-names>K</given-names> </name><etal/></person-group><article-title>Differential privacy: on the trade-off between utility and information leakage</article-title><conf-name>Formal Aspects of Security and Trust</conf-name><conf-date>Aug 25, 2011</conf-date><fpage>39</fpage><lpage>54</lpage><pub-id pub-id-type="doi">10.1007/978-3-642-29420-4_3</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Hsu</surname><given-names>J</given-names> </name><name name-style="western"><surname>Gaboardi</surname><given-names>M</given-names> </name><name name-style="western"><surname>Haeberlen</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Differential privacy: an economic method for choosing epsilon</article-title><conf-name>2014 IEEE 27th Computer Security Foundations Symposium (CSF)</conf-name><conf-date>Jul 19-22, 2014</conf-date><conf-loc>Vienna</conf-loc><pub-id pub-id-type="doi">10.1109/CSF.2014.35</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="web"><article-title>Welcome to FHIR</article-title><source>HL7 FHIR</source><access-date>2023-11-29</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://build.fhir.org/ig/InstitutNationalduCancer/ImplementationGuide_OsirisFHIR/branches/">https://build.fhir.org/ig/InstitutNationalduCancer/ImplementationGuide_OsirisFHIR/branches/</ext-link></comment></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="web"><article-title>Minimal common oncology data elements (mcode) implementation guide</article-title><source>HL7 FHIR</source><access-date>2023-11-29</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://build.fhir.org/ig/HL7/fhir-mCODE-ig/">https://build.fhir.org/ig/HL7/fhir-mCODE-ig/</ext-link></comment></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="web"><article-title>Differentially private contingency table</article-title><source>R Documentation</source><access-date>2023-11-29</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://search.r-project.org/CRAN/refmans/DPpack/html/tableDP.html">https://search.r-project.org/CRAN/refmans/DPpack/html/tableDP.html</ext-link></comment></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="web"><article-title>Opalr: &#x201C;Opal&#x201D; data repository client and &#x201C;datashield&#x201D; utils</article-title><source>CRAN: Package opalr</source><year>2024</year><access-date>2025-06-09</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://cran.r-project.org/web/packages/opalr/index.html">https://cran.r-project.org/web/packages/opalr/index.html</ext-link></comment></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Belenkaya</surname><given-names>R</given-names> </name><name name-style="western"><surname>Gurley</surname><given-names>MJ</given-names> </name><name name-style="western"><surname>Golozar</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Extending the OMOP common data model and standardized vocabularies to support observational cancer research</article-title><source>JCO Clin Cancer Inform</source><year>2021</year><month>01</month><volume>5</volume><fpage>12</fpage><lpage>20</lpage><pub-id pub-id-type="doi">10.1200/CCI.20.00079</pub-id><pub-id pub-id-type="medline">33411620</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="web"><article-title>OHDSI/oncologywg</article-title><source>GitHub</source><access-date>2023-11-29</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://github.com/OHDSI/OncologyWG/wiki">https://github.com/OHDSI/OncologyWG/wiki</ext-link></comment></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Lee</surname><given-names>J</given-names> </name><name name-style="western"><surname>Clifton</surname><given-names>C</given-names> </name></person-group><article-title>How much is enough? choosing &#x03B5; for differential privacy</article-title><conf-name>Information Security: 14th International Conference, ISC 2011:325&#x2013;40</conf-name><conf-date>Oct 26-29, 2011</conf-date><pub-id pub-id-type="doi">10.1007/978-3-642-24861-0_22</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Bonawitz</surname><given-names>K</given-names> </name><name name-style="western"><surname>Ivanov</surname><given-names>V</given-names> </name><name name-style="western"><surname>Kreuter</surname><given-names>B</given-names> </name><etal/></person-group><article-title>Practical secure aggregation for federated learning on user-held data</article-title><source>arXiv</source><access-date>2023-11-29</access-date><comment>Preprint posted online on 2016</comment></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Beaver</surname><given-names>D</given-names> </name></person-group><article-title>Efficient multiparty protocols using circuit randomization</article-title><conf-name>Advances in Cryptology &#x2014; CRYPTO &#x2019;91</conf-name><conf-date>Aug 11-15, 1991</conf-date><fpage>420</fpage><lpage>432</lpage><pub-id pub-id-type="doi">10.1007/3-540-46766-1_34</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Paillier</surname><given-names>P</given-names> </name></person-group><article-title>Public-key cryptosystems based on composite degree residuosity classes</article-title><conf-name>Advances in Cryptology &#x2014; EUROCRYPT &#x2019;99</conf-name><conf-date>May 2-6, 1999</conf-date><fpage>223</fpage><lpage>238</lpage><pub-id pub-id-type="doi">10.1007/3-540-48910-X_16</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Boneh</surname><given-names>D</given-names> </name><name name-style="western"><surname>Sahai</surname><given-names>A</given-names> </name><name name-style="western"><surname>Waters</surname><given-names>B</given-names> </name></person-group><article-title>Functional encryption: definitions and challenges</article-title><conf-name>Theory of Cryptography</conf-name><conf-date>Mar 28-30, 2011</conf-date><fpage>253</fpage><lpage>273</lpage><pub-id pub-id-type="doi">10.1007/978-3-642-19571-6_16</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Mironov</surname><given-names>I</given-names> </name></person-group><article-title>R&#x00E9;nyi differential privacy</article-title><conf-name>2017 IEEE 30th Computer Security Foundations Symposium (CSF)</conf-name><conf-date>Aug 21-25, 2017</conf-date><conf-loc>Santa Barbara, CA</conf-loc><pub-id pub-id-type="doi">10.1109/CSF.2017.11</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Kairouz</surname><given-names>P</given-names> </name><name name-style="western"><surname>Oh</surname><given-names>S</given-names> </name><name name-style="western"><surname>Viswanath</surname><given-names>P</given-names> </name></person-group><year>2015</year><conf-name>International conference on machine learning</conf-name><conf-date>Jul 13-19, 2015</conf-date><pub-id pub-id-type="doi">10.1109/TIT.2017.2685505</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>List of treatments of interest and their category.</p><media xlink:href="medinform_v13i1e59685_app1.docx" xlink:title="DOCX File, 15 KB"/></supplementary-material><supplementary-material id="app2"><label>Multimedia Appendix 2</label><p>Correspondence between the variables of interest used in the dataset and the FHIR (Fast Healthcare Interoperability Resources) attributes.</p><media xlink:href="medinform_v13i1e59685_app2.docx" xlink:title="DOCX File, 16 KB"/></supplementary-material><supplementary-material id="app3"><label>Multimedia Appendix 3</label><p>Data model to standardize data from centers in tabularized FHIR (Fast Healthcare Interoperability Resources) standard.</p><media xlink:href="medinform_v13i1e59685_app3.docx" xlink:title="DOCX File, 85 KB"/></supplementary-material><supplementary-material id="app4"><label>Multimedia Appendix 4</label><p>Combined univariate analyses across all centers without and with differential privacy.</p><media xlink:href="medinform_v13i1e59685_app4.docx" xlink:title="DOCX File, 20 KB"/></supplementary-material></app-group></back></article>