<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id><journal-id journal-id-type="publisher-id">medinform</journal-id><journal-id journal-id-type="index">7</journal-id><journal-title>JMIR Medical Informatics</journal-title><abbrev-journal-title>JMIR Med Inform</abbrev-journal-title><issn pub-type="epub">2291-9694</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v13i1e64114</article-id><article-id pub-id-type="doi">10.2196/64114</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Real-Time, Risk-Based Clinical Trial Quality Management in China: Development of a Digital Monitoring Platform</article-title></title-group><contrib-group><contrib contrib-type="author" corresp="yes" equal-contrib="yes"><name name-style="western"><surname>Jiang</surname><given-names>Min</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Zhao</surname><given-names>Shuhua</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Mei</surname><given-names>Yun</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Fu</surname><given-names>Zhiying</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Yuan</surname><given-names>Yannan</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Ai</surname><given-names>Jie</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Sheng</surname><given-names>Yuan</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff4">4</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Gong</surname><given-names>Ying</given-names></name><degrees>BSc</degrees><xref ref-type="aff" rid="aff4">4</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Chen</surname><given-names>Jingjing</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff4">4</xref></contrib></contrib-group><aff id="aff1"><institution>State Key Laboratory of Holistic Integrative Management of Gastrointestinal Cancers, Beijing Key Laboratory of Carcinogenesis and Translational Research, National Drug Clinical Trial Center, Peking University Cancer Hospital &#x0026; Institute</institution><addr-line>52 Fucheng Rd, Haidian District</addr-line><addr-line>Beijing</addr-line><country>China</country></aff><aff id="aff2"><institution>Key Laboratory of Carcinogenesis and Translational Research (Ministry of Education/Beijing), National Drug Clinical Trial Center, Peking University Cancer Hospital &#x0026; Institute</institution><addr-line>Beijing</addr-line><country>China</country></aff><aff id="aff3"><institution>Yidu Cloud (Beijing) Technology Co, Ltd</institution><addr-line>Beijing</addr-line><country>China</country></aff><aff id="aff4"><institution>Pfizer (China) Research and Development Co, Ltd</institution><addr-line>Shanghai</addr-line><country>China</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Lovis</surname><given-names>Christian</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Yao</surname><given-names>Chen</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Mainprize</surname><given-names>James G</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Min Jiang, MSc, State Key Laboratory of Holistic Integrative Management of Gastrointestinal Cancers, Beijing Key Laboratory of Carcinogenesis and Translational Research, National Drug Clinical Trial Center, Peking University Cancer Hospital &#x0026; Institute, 52 Fucheng Rd, Haidian District, Beijing, China, 86 01088196664; <email>gcp_jiangm@bjcancer.org.cn</email></corresp><fn fn-type="equal" id="equal-contrib1"><label>*</label><p>these authors contributed equally</p></fn></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>25</day><month>4</month><year>2025</year></pub-date><volume>13</volume><elocation-id>e64114</elocation-id><history><date date-type="received"><day>12</day><month>07</month><year>2024</year></date><date date-type="rev-recd"><day>06</day><month>02</month><year>2025</year></date><date date-type="accepted"><day>08</day><month>02</month><year>2025</year></date></history><copyright-statement>&#x00A9; Min Jiang, Shuhua Zhao, Yun Mei, Zhiying Fu, Yannan Yuan, Jie Ai, Yuan Sheng, Ying Gong, Jingjing Chen. Originally published in JMIR Medical Informatics (<ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org">https://medinform.jmir.org</ext-link>), 25.4.2025. </copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org/">https://medinform.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://medinform.jmir.org/2025/1/e64114"/><abstract><sec><title>Background</title><p>With the improvement of the drug evaluation system in China, an increasing number of clinical trials have been launched in Chinese hospitals. However, traditional clinical trial quality management models largely rely on human monitoring and counting, which can be time-consuming and are likely to generate errors and biases. There is an urgent need to upgrade and improve the efficiency and accuracy of clinical trial quality monitoring systems in hospital-based research institutions within China.</p></sec><sec><title>Objective</title><p>The objective of this study was to develop a digital monitoring platform that allows for the real-time monitoring and detection of risk points and provides warnings about risk points throughout the entire life cycle of clinical trials, on the basis of historical clinical trial quality control (QC) findings.</p></sec><sec sec-type="methods"><title>Methods</title><p>Leveraging the risk-based quality management mindset, we built a digital dynamic monitoring platform by using big data analysis and automatic quantitative technology. Data from clinical trial QC reports generated during 2019 to 2023 in Beijing University Cancer Hospital, China, were used to train the automated classification tool, establish warning thresholds, and validate threshold values. Quality findings from the early-stage, interim-stage, and conclusion-stage QC rounds of clinical trials were rated by using 3 severity grades (minor, major, or critical) and classified into 5 categories (with 4 taxonomy levels under each category). QC report text was processed by using an automated natural language processing tool. All QC reports were grouped into 2 clusters via hierarchical clustering analysis. QC findings from the relatively high-risk cluster (reports that were more likely to have major and critical findings, as determined by experienced QC analysts) were used to determine warning threshold values for the monitoring platform (ie, the lowest number of findings was set as the threshold value for each specific study stage, Level-3 taxonomy, and severity grade combination).</p></sec><sec sec-type="results"><title>Results</title><p>The most frequently reported Level-3 taxonomies in QC reports from 2019 to 2022 were &#x201C;Standard Procedure and Process,&#x201D; &#x201C;Safety Reporting,&#x201D; and &#x201C;Source Data Collection and/or Recording.&#x201D; In total, 189 warning threshold values were established based on data from 1380 QC reports generated during 2019 to 2022, covering 3 severity grades, 21 Level-3 taxonomies, and 3 QC rounds. The warning thresholds were applied to 211 QC reports generated in 2023, of which 19.9% (n=42) triggered warnings. Similar patterns of QC findings, including the most frequently noted Level-3 QC findings, were observed between reports generated in 2023 and those from 2019 to 2022.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>In clinical practice, our tool would enable the automated monitoring and detection of risk points throughout all clinical trial stages; accurately identify the most relevant trial procedure and function line; and notify quality management personnel, in real time, to take prompt actions and dynamically prevent the recurrence of quality issues.</p></sec></abstract><kwd-group><kwd>clinical trial</kwd><kwd>quality control</kwd><kwd>risk-based quality management</kwd><kwd>digital</kwd><kwd>natural language processing</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Over the past 20 years, with the improvement of the drug evaluation system and standards in China, an increasing number of domestic and cross-national multicenter clinical trials have been launched in Chinese hospitals. However, in many hospital-based clinical trial institutions, traditional quality management models largely rely on human monitoring and counting, which not only require a lot of time and resources but also likely result in errors and biases. Therefore, such models may not be able to identify risk points and trends in a timely manner or prevent the recurrence of quality issues. In the face of the increasing number and complexity of clinical trials, the optimization of quality management models has become an urgent need for clinical trial institutions in Chinese hospitals.</p><p>Risk-based quality management (RBQM)&#x2014;recommended in guidelines issued by the US Food and Drug Administration [<xref ref-type="bibr" rid="ref1">1</xref>] and European Medicines Agency [<xref ref-type="bibr" rid="ref2">2</xref>] in 2013, as well as in the International Council for Harmonisation of Technical Requirements for Pharmaceuticals for Human Use (ICH) guidelines for good clinical practice in 2016 [<xref ref-type="bibr" rid="ref3">3</xref>]&#x2014;is a powerful approach that has been explored and applied in a growing number of trials and institutions [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref5">5</xref>]. In 2020, the China National Medical Products Administration introduced the concept of RBQM into Chinese trial quality management systems [<xref ref-type="bibr" rid="ref6">6</xref>]. In 2022, the China Center for Drug Evaluation released Statistical Principles for Centralized Monitoring of Drug Clinical Trials, which was considered a milestone in China&#x2019;s clinical trial revolution and a guideline for the improvement and implementation of RBQM in China&#x2019;s clinical practice [<xref ref-type="bibr" rid="ref7">7</xref>].</p><p>To meet the urgent need for upgrading quality management models and achieving better efficiency, accuracy, and timeliness, we leveraged the RBQM mindset and used a long-term collection of quality management data from clinical trial programs in Beijing University Cancer Hospital, China, to build a digital dynamic monitoring platform via big data analysis and automatic quantitative technology. Through this platform, we aim to dynamically and prospectively monitor the entire life cycle of clinical trials and efficiently identify, intervene with, and systematically prevent quality risks that might compromise critical trial processes, patient safety, or data integrity.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Ethical Considerations</title><p>This study was based on the processing and analysis of quality control (QC) documents from a large number of clinical trials, which underwent their own ethics reviews. Further, the text of the QC findings did not contain personal information of trial participants. As such, this study did not require ethics board review.</p></sec><sec id="s2-2"><title>Materials</title><p>A total of 1591 QC reports were generated in our institution from January 2019 to September 2023, involving 993 clinical trials. In accordance with relevant quality management standard operating procedures, a specific QC group was responsible for conducting at least 3 rounds of routine QC for each trial, including but not limited to (1) an early-stage QC round at the time point of achieving 5 enrollments or at 3 months after trial initiation, (2) an interim-stage QC round once every 6 months or when the trial achieved 20 enrollments, and (3) a conclusion-stage QC round at the time of site closeout. A detailed QC report was generated for each QC round, recording all quality issues. To build a digital monitoring platform, 1380 reports, which were generated during 2019 to 2022, served as the foundation for automated quantitative processing and the identification of warning thresholds, while the remaining 211 reports, which were generated in the year 2023, were used for testing the effectiveness of those thresholds in identifying high-risk trials.</p></sec><sec id="s2-3"><title>Classification of QC Findings</title><p>Findings from the routine QC reports were rated by using 3 severity grades (minor, major, or critical) and classified into 5 categories (&#x201C;Data,&#x201D; &#x201C;Quality,&#x201D; &#x201C;Safety and Ethics,&#x201D; &#x201C;Equipment and Facility,&#x201D; or &#x201C;Finance&#x201D;), with 4 taxonomy levels under each category. The severity ratings and Level-1 to Level-3 taxonomies would allow for an overall review and trend analysis, while the Level-4 taxonomies were designed to trace back precisely to the corresponding clinical trial procedure and personnel.</p></sec><sec id="s2-4"><title>Novel Automated Classification Tool</title><p>To enable the automated classification of QC findings, we developed a natural language processing (NLP) algorithm based on the Local Interpretable Model-Agnostic Explanations framework, which was implemented in Python. This algorithm was designed to perform multidimensional classifications of events in QC report texts (<xref ref-type="fig" rid="figure1">Figure 1</xref>).</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Algorithm classification tool flowchart. QC: quality control.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e64114_fig01.png"/></fig><p>The dataset used to develop the NLP algorithm comprised 1380 QC reports that were generated during 2019 to 2022; an average of 345 reports were generated per year. Among QC findings from these reports, 55.48% were categorized as minor findings, 42.23% were categorized as major findings, and 2.29% were categorized as critical findings. The word count of the reports ranged from 1619 to 17,367 words, with a median word count of 5938 (IQR 4453-7422) words per report. Data were stratified and split into training, validation, and testing sets (70%, 15%, and 15%, respectively) to ensure balanced class representation. Annotation rules covered 4 entity dimensions and 54 issue categories, which were derived from industry standards and refined through discussions with an internal expert team.</p><p>In the first phase, the dataset was annotated by using multidimensional information labeling rules, generating high-quality training data. In the second phase, natural text from QC reports was subjected to preliminary automated classification via a Bayesian network, which determined the Level-1 to Level-3 classifications for each text segment based on joint probability. Additionally, semantic role labeling&#x2014;a critical step in the classification NLP tool&#x2014;was used to identify the predicate-argument structure of each sentence [<xref ref-type="bibr" rid="ref8">8</xref>]. After training with the dataset, an explainable directed acyclic graph was constructed [<xref ref-type="bibr" rid="ref9">9</xref>]. In the directed acyclic graph, graph neural networks were used to propagate information across the graph, forming an algorithmic model capable of capturing events. The model achieved precision (P) and recall (R) scores &#x003E;0.95. In the third phase, by using the trained model, events were extracted from the QC report text and subjected to Bayesian inference. If an inference could be drawn from the graph, automatic classification was completed; if no inference could be made, a new branch was created, and the entire graph model was updated and iterated. The final Level-4 classification results were represented as the terminal leaf nodes in the graph.</p></sec><sec id="s2-5"><title>Clustering</title><p>After all findings from QC reports were classified by using our automated classification tool, a dataset was created based on the incidence rates of different categories of QC findings from each QC report. Using SPSS for Windows 20.0 (IBM Corp), hierarchical clustering analysis was applied to this dataset to ensure that reports with similar patterns of QC findings were grouped into the same cluster: each report was initially treated as a separate cluster; then, the algorithm identified 2 clusters that were closest to each other (ie, clusters with maximum similarity) and merged these 2 clusters into 1 new cluster. These steps were repeated until all QC reports were grouped into 2 clusters (Cluster I and Cluster II). A dendrogram was generated, showing the levels of similarity and dissimilarity between QC reports. Per manual interpretation by a group of experienced QC analysts, Cluster II was identified as high risk (ie, reports with more findings or a higher proportion of major and critical findings), and Cluster I was considered relatively &#x201C;normal&#x201D; (reports with less findings or a higher proportion of minor findings).</p></sec><sec id="s2-6"><title>Establishment of Warning Thresholds and Detection of Risk Points</title><p>Warning thresholds were established based on the high-risk (Cluster II) QC reports from 2019 to 2022; the lowest number of findings was set as the threshold value for a specific study stage, Level-3 taxonomy, and severity grade combination. For example, a threshold value of X was set for the following combination: early-stage QC round, Level-3 taxonomy &#x201C;Biological Sample Management,&#x201D; and major findings; this made sure that all high-risk QC reports from early-stage QC rounds had at least X major findings under the Level-3 taxonomy &#x201C;Biological Sample Management.&#x201D; The warning thresholds were then applied to QC reports from 2023; these warning thresholds would help with determining the risk points (ie, the most commonly reported findings) and investigating the root causes of findings.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Summary of 2019 to 2022 QC Findings</title><p>From 2019 to 2022, the proportion of major or critical findings generally decreased each year (major findings showed a 1.27-fold decrease, and critical findings showed a 3-fold decrease), even during the COVID-19 pandemic, while the proportion of minor findings showed an approximately 1.24-fold increase over the 4 years (<xref ref-type="fig" rid="figure2">Figure 2</xref>).</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Proportion of quality control findings under 3 categories of clinical significance and severity.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e64114_fig02.png"/></fig><p>It was consistently observed during each year that the most commonly reported Level-3 taxonomies (the proportions of findings for these taxonomies were &#x003E;5%), in decreasing order of frequency, were (1) &#x201C;Standard Procedure and Process,&#x201D; (2) &#x201C;Safety Reporting,&#x201D; (3) &#x201C;Source Data Collection and/or Recording,&#x201D; (4) &#x201C;Investigational Product,&#x201D; (5) &#x201C;Personnel Qualification and Training,&#x201D; and (6) &#x201C;Biological Sample Management&#x201D; (<xref ref-type="table" rid="table1">Table 1</xref>). In 2020, under the influence of the COVID-19 pandemic, increases were observed in the average numbers of findings per report that fell under these Level-3 taxonomies, but 2 years later, the average numbers of these findings dropped back to their 2019 levels (<xref ref-type="fig" rid="figure3">Figure 3</xref>).</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Proportion of quality control (QC) findings under each Level-3 taxonomy from 2019 to 2023.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Level-3 classification</td><td align="left" valign="bottom">2019 (% of QC findings)</td><td align="left" valign="bottom">2020 (% of QC findings)</td><td align="left" valign="bottom">2021 (% of QC findings)</td><td align="left" valign="bottom">2022 (% of QC findings)</td><td align="left" valign="bottom">2023 (% of QC findings)</td></tr></thead><tbody><tr><td align="left" valign="top">Source Data Collection and/or Recording</td><td align="left" valign="top">13.62</td><td align="left" valign="top">13.65</td><td align="left" valign="top">13.75</td><td align="left" valign="top">13.53</td><td align="left" valign="top">13.61</td></tr><tr><td align="left" valign="top">Source Data Modification/Correction</td><td align="left" valign="top">0.62</td><td align="left" valign="top">0.41</td><td align="left" valign="top">0.23</td><td align="left" valign="top">0.31</td><td align="left" valign="top">0.44</td></tr><tr><td align="left" valign="top">Source Data Transcription</td><td align="left" valign="top">0.74</td><td align="left" valign="top">0.72</td><td align="left" valign="top">0.56</td><td align="left" valign="top">0.70</td><td align="left" valign="top">0.73</td></tr><tr><td align="left" valign="top">Process Documentation Management</td><td align="left" valign="top">0.08</td><td align="left" valign="top">0.07</td><td align="left" valign="top">0.08</td><td align="left" valign="top">0.09</td><td align="left" valign="top">0.08</td></tr><tr><td align="left" valign="top">Standard Procedure and Process</td><td align="left" valign="top">26.47</td><td align="left" valign="top">27.14</td><td align="left" valign="top">27.95</td><td align="left" valign="top">26.91</td><td align="left" valign="top">26.97</td></tr><tr><td align="left" valign="top">Personnel Qualification and Training</td><td align="left" valign="top">9.21</td><td align="left" valign="top">8.02</td><td align="left" valign="top">7.81</td><td align="left" valign="top">9.02</td><td align="left" valign="top">9.09</td></tr><tr><td align="left" valign="top">Query Identification</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td></tr><tr><td align="left" valign="top">Query Recording and Reporting</td><td align="left" valign="top">0.51</td><td align="left" valign="top">0.27</td><td align="left" valign="top">0.36</td><td align="left" valign="top">0.27</td><td align="left" valign="top">0.58</td></tr><tr><td align="left" valign="top">Query Prevention</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td></tr><tr><td align="left" valign="top">Laboratory, Equipment, Facility, and Supply Management</td><td align="left" valign="top">1.20</td><td align="left" valign="top">1.29</td><td align="left" valign="top">1.55</td><td align="left" valign="top">1.28</td><td align="left" valign="top">1.23</td></tr><tr><td align="left" valign="top">Biological Sample Management</td><td align="left" valign="top">5.58</td><td align="left" valign="top">5.72</td><td align="left" valign="top">6.35</td><td align="left" valign="top">5.88</td><td align="left" valign="top">5.59</td></tr><tr><td align="left" valign="top">Clinical Trial Document Management</td><td align="left" valign="top">3.98</td><td align="left" valign="top">4.21</td><td align="left" valign="top">4.35</td><td align="left" valign="top">4.07</td><td align="left" valign="top">4.09</td></tr><tr><td align="left" valign="top">Human Genetic Resource Management</td><td align="left" valign="top">0.23</td><td align="left" valign="top">0.19</td><td align="left" valign="top">0.17</td><td align="left" valign="top">0.24</td><td align="left" valign="top">0.24</td></tr><tr><td align="left" valign="top">Informed Consent Personnel Qualifications</td><td align="left" valign="top">1.40</td><td align="left" valign="top">1.22</td><td align="left" valign="top">1.59</td><td align="left" valign="top">1.50</td><td align="left" valign="top">1.48</td></tr><tr><td align="left" valign="top">Informed Consent Process</td><td align="left" valign="top">2.29</td><td align="left" valign="top">2.23</td><td align="left" valign="top">2.37</td><td align="left" valign="top">2.47</td><td align="left" valign="top">2.39</td></tr><tr><td align="left" valign="top">Ethics Committee Composition and Operation</td><td align="left" valign="top">1.17</td><td align="left" valign="top">1.70</td><td align="left" valign="top">1.34</td><td align="left" valign="top">1.53</td><td align="left" valign="top">1.23</td></tr><tr><td align="left" valign="top">Safety Reporting</td><td align="left" valign="top">16.50</td><td align="left" valign="top">16.97</td><td align="left" valign="top">15.79</td><td align="left" valign="top">15.94</td><td align="left" valign="top">15.98</td></tr><tr><td align="left" valign="top">Concomitant Medications</td><td align="left" valign="top">3.34</td><td align="left" valign="top">3.18</td><td align="left" valign="top">2.91</td><td align="left" valign="top">2.98</td><td align="left" valign="top">3.19</td></tr><tr><td align="left" valign="top">Investigational Product</td><td align="left" valign="top">11.52</td><td align="left" valign="top">11.43</td><td align="left" valign="top">11.50</td><td align="left" valign="top">11.76</td><td align="left" valign="top">11.57</td></tr><tr><td align="left" valign="top">Inclusion and Exclusion Criteria</td><td align="left" valign="top">1.53</td><td align="left" valign="top">1.58</td><td align="left" valign="top">1.34</td><td align="left" valign="top">1.52</td><td align="left" valign="top">1.51</td></tr><tr><td align="left" valign="top">Clinical Trial Finance Process</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td></tr></tbody></table></table-wrap><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Average number of findings per quality control report under the most frequently reported Level-3 taxonomies (proportions of findings for these taxonomies: &#x003E;5%).</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e64114_fig03.png"/></fig><p>Similar trends were also observed when QC findings were summarized under Level-4 taxonomies. A 1.41-fold increase in the average number of findings under the Level-4 taxonomy &#x201C;Adverse Event Assessment and Documentation&#x201D; was observed in 2020 when compared to 2019. Further, while the average number of findings under the Level-4 taxonomy &#x201C;Biological Sample Shipment and Recording&#x201D; was &#x2264;0.2 per report across each year, a 1.43-fold increase was also noted in 2020 when compared to the previous year. These trends were likely attributable to the outbreak of the COVID-19 pandemic. With the adaptive actions taken in response to COVID-19 (eg, implementation of digital monitoring), the numbers of QC findings under these two Level-4 taxonomies eventually dropped back to their 2019 levels (<xref ref-type="fig" rid="figure4">Figure 4</xref>).</p><fig position="float" id="figure4"><label>Figure 4.</label><caption><p>Trends of change in average number of findings per quality control report under two Level-4 taxonomies from 2019 to 2022.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e64114_fig04.png"/></fig></sec><sec id="s3-2"><title>Warning Thresholds and Warning-Triggering Risks in the Year 2023</title><p>A total of 189 warning threshold values were established to cover all 3 severity grades, 21 Level-3 taxonomies, and 3 rounds of QC (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). These thresholds were applied to a total of 211 QC reports generated in 2023. Among those reports, 42 triggered warnings, resulting in a trigger rate of 19.9%. Approximately half (n=23, 55%) of the 42 warning-triggering, high-risk reports were from interim-stage QC rounds, while 8 and 11 were from early-stage and conclusion-stage QC rounds, respectively.</p><p><xref ref-type="fig" rid="figure5">Figure 5</xref> presents data from 3 randomly selected reports from early-stage QC rounds as examples to show the number of major QC findings that exceeded or did not exceed the corresponding threshold value for each of the 21 Level-3 taxonomies.</p><fig position="float" id="figure5"><label>Figure 5.</label><caption><p>Number of major QC findings under each Level-3 taxonomy from 3 early-stage QC reports, in comparison with corresponding threshold values. QC: quality control.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e64114_fig05.png"/></fig><p>Among the 42 high-risk reports in 2023, after the application of warning threshold values, the most frequently noted Level-3 taxonomies with alarm-triggering QC findings were generally consistent with those observed in QC reports from 2019 to 2022 (<xref ref-type="table" rid="table1">Tables 1</xref> and <xref ref-type="table" rid="table2">2</xref>, <xref ref-type="fig" rid="figure3">Figure 3</xref>). The most common alarm-triggering Level-3 taxonomy was &#x201C;Standard Procedure and Process,&#x201D; which was reported in 36% (15/42) of high-risk reports, and its most relevant process (ie, &#x201C;risk point,&#x201D; as defined by Level-4 taxonomies) was &#x201C;Protocol Deviation &#x2013; Deviation from Study Design,&#x201D; which was reported in 33% (5/15) of the reports that triggered an alarm for QC findings that fell under the Level-3 &#x201C;Standard Procedure and Process&#x201D; taxonomy. In response to Level-4 taxonomies that were more likely to cause alarm-triggering QC issues (<xref ref-type="table" rid="table2">Table 2</xref>), intervention strategies to be incorporated into routine clinical practice were proposed.</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Most frequently reported Level-3 taxonomies in alarm-triggering quality control reports from 2023 (n=42) and their corresponding most relevant Level-4 taxonomies.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Level-3 taxonomy</td><td align="left" valign="bottom">Level-3 taxonomy incidence, number of reports (%)</td><td align="left" valign="bottom">Most relevant Level-4 taxonomy</td></tr></thead><tbody><tr><td align="left" valign="top">Standard Procedure and Process</td><td align="left" valign="top">15 (36)</td><td align="left" valign="top">Protocol Deviation &#x2013; Deviation From Study Design</td></tr><tr><td align="left" valign="top">Safety Reporting</td><td align="left" valign="top">8 (19)</td><td align="left" valign="top">Adverse Event Assessment and Documentation</td></tr><tr><td align="left" valign="top">Source Data Collection and/or Recording</td><td align="left" valign="top">8 (19)</td><td align="left" valign="top">Paper Source Data Files</td></tr><tr><td align="left" valign="top">Biological Sample Management</td><td align="left" valign="top">6 (14)</td><td align="left" valign="top">Biosample Transportation and Documentation</td></tr><tr><td align="left" valign="top">Personnel Qualification and Training</td><td align="left" valign="top">6 (14)</td><td align="left" valign="top">Personnel Authorization and Documentation</td></tr><tr><td align="left" valign="top">Investigational Product</td><td align="left" valign="top">6 (14)</td><td align="left" valign="top">Administration of Investigational Products and Associated Documentation Issues</td></tr><tr><td align="left" valign="top">Laboratory, Equipment, Facility, and Supply Management</td><td align="left" valign="top">4 (10)</td><td align="left" valign="top">Equipment Maintenance Issues</td></tr><tr><td align="left" valign="top">Clinical Trial Document Management</td><td align="left" valign="top">4 (10)</td><td align="left" valign="top">Clinical Trial Document Maintenance</td></tr><tr><td align="left" valign="top">Concomitant Medications</td><td align="left" valign="top">4 (10)</td><td align="left" valign="top">Concomitant Medications Record and Documentation</td></tr><tr><td align="left" valign="top">Informed Consent Process</td><td align="left" valign="top">3 (7)</td><td align="left" valign="top">Informed Consent Signing Issues</td></tr><tr><td align="left" valign="top">Process Documentation Management</td><td align="left" valign="top">3 (7)</td><td align="left" valign="top">Quality Control Documentation</td></tr><tr><td align="left" valign="top">Inclusion and Exclusion Criteria</td><td align="left" valign="top">2 (5)</td><td align="left" valign="top">Inclusion and Exclusion Criteria Documentation</td></tr><tr><td align="left" valign="top">Query Recording and Reporting</td><td align="left" valign="top">1 (2)</td><td align="left" valign="top">Incomplete Monitoring Records</td></tr></tbody></table></table-wrap></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><p>As stated in the ICH E6(R3) guideline published in January 2025, clinical trial institutions and sponsors are encouraged to use innovative digital technologies to improve clinical trial quality, taking into consideration the risk factors that could potentially impact participant safety, data quality, and other key elements in clinical trial procedures [<xref ref-type="bibr" rid="ref3">3</xref>]. In this study, data from historical clinical trial QC reports generated in our hospital were standardized and classified for further risk-based qualitative analyses, and the minimum number of QC findings was determined as the threshold value for each QC stage, severity level, and Level-3 taxonomy combination. These QC warning thresholds were embedded into our digital dynamic monitoring platform to allow for the dynamic and proactive identification of high-risk QC reports and to notify quality management personnel, in a real-time manner, about which reports had a number of QC findings (ie, in a specific stage, severity level, and Level-3 taxonomy) that was larger than the corresponding threshold value. For example, a QC warning will be triggered for an early-stage QC report if it reports more than 13 minor findings, more than 3 major findings, or more than 2 critical findings under the Level-3 taxonomy &#x201C;Source Data Collection and/or Recording,&#x201D; requesting the quality management group to follow up and take actions.</p><p>With the help of the digital platform, the quality management team can quickly and accurately identify the relevant clinical trial procedure and function line for the reported quality issues and adopt mitigation strategies. For example, in QC reports from 2019 to 2022, &#x201C;Standard Procedure and Process&#x201D; was the most frequently reported Level-3 taxonomy for QC reports generated during the conclusion stage (ie, around the time of site closeout), and one-third (38/114, 33.3%) of the quality issues were attributed to participants&#x2019; poor compliance with safety visits after they left the trial site. Driven by this observation, we learned from participants that many of them lived far away from our trial site in Beijing, and after leaving the trial site, it was difficult for them to travel a long distance back to the trial site for additional safety follow-ups. Our proposed action is to allow participants who are discharged from the trial site to complete their follow-up visits in a local clinical trial center (ie, at or near their hometown) equipped with a remote visit system, as an approach to improving their compliance with the safety monitoring procedures. Another example is the quality alarm associated with the Level-4 taxonomy &#x201C;Administration of Investigational Products and Associated Documentation Issues.&#x201D; In a trial with QC findings that fell under this taxonomy, the study drug was to be orally self-administered at home, and a large proportion of participants missed multiple oral doses. In response to this finding, our proposed action is to send drug administration reminders via participants&#x2019; social networking platforms and the hospital&#x2019;s mobile app. The digital platform also enables the study team to conduct targeted source data verifications and reviews; the study team can also exempt a trial from complete source data verifications and reviews if it did not trigger any warnings.</p><p>The digital platform remains to be optimized for future clinical practice; the input of more QC data and an upgraded automated calculation tool are needed to enhance its accuracy and applicability. However, the concurrent use of other digital tools may further enhance the efficiency of quality management systems. For high-risk trials that have already triggered an alarm in the early- or interim-stage QC round, a remote monitoring system may help to reduce quality issues due to trial procedure noncompliance.</p></sec></body><back><ack><p>This study was supported by Beijing Natural Science Foundation (L232032) and Beijing Municipal Science &#x0026; Technology Commission No. Z231100004623006.</p></ack><fn-group><fn fn-type="con"><p>All of the listed authors reviewed, commented on, and approved the final draft of the manuscript. MJ and SZ designed and directed the project and made substantial contributions to data collection and interpretation; thus, they are listed as co&#x2013;first authors. YM designed the automated classification tool and conducted all data analyses, including but not limited to natural language processing and quality control report clustering. YG and JC coordinated and monitored the manuscript drafting process and contributed to the <italic>Introduction</italic> and <italic>Methods</italic> sections. YS provided manuscript writing support.</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">ICH</term><def><p>International Council for Harmonisation of Technical Requirements for Pharmaceuticals for Human Use</p></def></def-item><def-item><term id="abb2">NLP</term><def><p>natural language processing</p></def></def-item><def-item><term id="abb3">QC</term><def><p>quality control</p></def></def-item><def-item><term id="abb4">RBQM</term><def><p>risk-based quality management</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="web"><article-title>Oversight of clinical investigations &#x2014; a risk-based approach to monitoring</article-title><source>U.S. Food and Drug Administration</source><year>2013</year><month>08</month><access-date>2024-07-08</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.fda.gov/regulatory-information/search-fda-guidance-documents/oversight-clinical-investigations-risk-based-approach-monitoring">https://www.fda.gov/regulatory-information/search-fda-guidance-documents/oversight-clinical-investigations-risk-based-approach-monitoring</ext-link></comment></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="web"><article-title>Reflection paper on risk based quality management in clinical trials</article-title><source>European Medicines Agency</source><year>2013</year><month>11</month><day>18</day><access-date>2024-07-08</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.ema.europa.eu/en/documents/scientific-guideline/reflection-paper-risk-based-quality-management-clinical-trials_en.pdf">https://www.ema.europa.eu/en/documents/scientific-guideline/reflection-paper-risk-based-quality-management-clinical-trials_en.pdf</ext-link></comment></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="web"><article-title>ICH harmonised guideline: guideline for good clinical practice E6(R3)</article-title><source>International Council for Harmonisation of Technical Requirements for Pharmaceuticals for Human Use</source><access-date>2025-04-15</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://database.ich.org/sites/default/files/ICH_E6%28R3%29_Step4_FinalGuideline_2025_0106.pdf">https://database.ich.org/sites/default/files/ICH_E6%28R3%29_Step4_FinalGuideline_2025_0106.pdf</ext-link></comment></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Stansbury</surname><given-names>N</given-names> </name><name name-style="western"><surname>Barnes</surname><given-names>B</given-names> </name><name name-style="western"><surname>Adams</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Risk-based monitoring in clinical trials: increased adoption throughout 2020</article-title><source>Ther Innov Regul Sci</source><year>2022</year><month>05</month><volume>56</volume><issue>3</issue><fpage>415</fpage><lpage>422</lpage><pub-id pub-id-type="doi">10.1007/s43441-022-00387-z</pub-id><pub-id pub-id-type="medline">35235192</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Barnes</surname><given-names>B</given-names> </name><name name-style="western"><surname>Stansbury</surname><given-names>N</given-names> </name><name name-style="western"><surname>Brown</surname><given-names>D</given-names> </name><etal/></person-group><article-title>Risk-based monitoring in clinical trials: past, present, and future</article-title><source>Ther Innov Regul Sci</source><year>2021</year><month>07</month><volume>55</volume><issue>4</issue><fpage>899</fpage><lpage>906</lpage><pub-id pub-id-type="doi">10.1007/s43441-021-00295-8</pub-id><pub-id pub-id-type="medline">33914298</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="web"><article-title>&#x56FD;&#x5BB6;&#x836F;&#x76D1;&#x5C40; &#x56FD;&#x5BB6;&#x536B;&#x751F;&#x5065;&#x5EB7;&#x59D4; &#x5173;&#x4E8E;&#x53D1;&#x5E03;&#x836F;&#x7269;&#x4E34;&#x5E8A;&#x8BD5;&#x9A8C;&#x8D28;&#x91CF;&#x7BA1;&#x7406;&#x89C4;&#x8303;&#x7684;&#x516C;&#x544A; [Article in Chinese]</article-title><source>The State Council of the People&#x2019;s Republic of China</source><access-date>2025-04-15</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.gov.cn/gongbao/content/2020/content_5525106.htm">https://www.gov.cn/gongbao/content/2020/content_5525106.htm</ext-link></comment></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="web"><article-title>&#x56FD;&#x5BB6;&#x836F;&#x76D1;&#x5C40;&#x836F;&#x5BA1;&#x4E2D;&#x5FC3;&#x5173;&#x4E8E;&#x53D1;&#x5E03;&#x300A;&#x836F;&#x7269;&#x4E34;&#x5E8A;&#x8BD5;&#x9A8C;&#x4E2D;&#x5FC3;&#x5316;&#x76D1;&#x67E5;&#x7EDF;&#x8BA1;&#x6307;&#x5BFC;&#x539F;&#x5219; (&#x8BD5;&#x884C;)&#x300B;&#x7684;&#x901A;&#x544A; (2022&#x5E74;&#x7B2C;11&#x53F7;) [Article in Chinese]</article-title><source>Center for Drug Evaluation, NMPA</source><access-date>2025-04-15</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.cde.org.cn/main/news/viewInfoCommon/0a0ebbd5d09ec9fe6fcdc6e76d526314">https://www.cde.org.cn/main/news/viewInfoCommon/0a0ebbd5d09ec9fe6fcdc6e76d526314</ext-link></comment></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Marcheggiani</surname><given-names>D</given-names> </name><name name-style="western"><surname>Titov</surname><given-names>I</given-names> </name></person-group><article-title>Encoding sentences with graph convolutional networks for semantic role labeling</article-title><access-date>2025-03-31</access-date><conf-name>2017 Conference on Empirical Methods in Natural Language Processing</conf-name><conf-date>Sep 7-11, 2017</conf-date><conf-loc>Copenhagen, Denmark</conf-loc><comment><ext-link ext-link-type="uri" xlink:href="https://aclanthology.org/D17-1159">https://aclanthology.org/D17-1159</ext-link></comment><pub-id pub-id-type="doi">10.18653/v1/D17-1159</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Shen</surname><given-names>W</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>S</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Quan</surname><given-names>X</given-names> </name></person-group><article-title>Directed acyclic graph network for conversational emotion recognition</article-title><access-date>2025-03-31</access-date><conf-name>59th Annual Meeting of the Association for Computational Linguistics and the 11th International Joint Conference on Natural Language Processing</conf-name><conf-date>Aug 1-6, 2021</conf-date><comment><ext-link ext-link-type="uri" xlink:href="https://aclanthology.org/2021.acl-long.123">https://aclanthology.org/2021.acl-long.123</ext-link></comment><pub-id pub-id-type="doi">10.18653/v1/2021.acl-long.123</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Threshold values for Level-3 taxonomies in quality control (QC) across 3 study stages and 3 severity grades.</p><media xlink:href="medinform_v13i1e64114_app1.docx" xlink:title="DOCX File, 19 KB"/></supplementary-material></app-group></back></article>